teradataml 17.20.0.7__py3-none-any.whl → 20.0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of teradataml has been flagged as potentially problematic.
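Because this diff spans a major-version jump (17.20.x to 20.0.x), it is worth confirming which build is actually installed before comparing behavior. A minimal sketch, assuming the conventional __version__ attribute that teradataml exposes via teradataml/_version.py (entry 5 in the listing below):

    # Minimal sketch: check the installed teradataml build before reading this diff.
    # Assumes the standard __version__ attribute defined in teradataml/_version.py
    # and re-exported from the package root.
    import teradataml

    print(teradataml.__version__)  # e.g. a 20.0.x string after upgrading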

Files changed (1303)
  1. teradataml/LICENSE-3RD-PARTY.pdf +0 -0
  2. teradataml/LICENSE.pdf +0 -0
  3. teradataml/README.md +1935 -1640
  4. teradataml/__init__.py +70 -60
  5. teradataml/_version.py +11 -11
  6. teradataml/analytics/Transformations.py +2995 -2995
  7. teradataml/analytics/__init__.py +81 -83
  8. teradataml/analytics/analytic_function_executor.py +2040 -2010
  9. teradataml/analytics/analytic_query_generator.py +958 -958
  10. teradataml/analytics/byom/H2OPredict.py +514 -514
  11. teradataml/analytics/byom/PMMLPredict.py +437 -437
  12. teradataml/analytics/byom/__init__.py +14 -14
  13. teradataml/analytics/json_parser/__init__.py +130 -130
  14. teradataml/analytics/json_parser/analytic_functions_argument.py +1707 -1707
  15. teradataml/analytics/json_parser/json_store.py +191 -191
  16. teradataml/analytics/json_parser/metadata.py +1637 -1637
  17. teradataml/analytics/json_parser/utils.py +798 -803
  18. teradataml/analytics/meta_class.py +196 -196
  19. teradataml/analytics/sqle/DecisionTreePredict.py +455 -470
  20. teradataml/analytics/sqle/NaiveBayesPredict.py +419 -428
  21. teradataml/analytics/sqle/__init__.py +97 -110
  22. teradataml/analytics/sqle/json/decisiontreepredict_sqle.json +78 -78
  23. teradataml/analytics/sqle/json/naivebayespredict_sqle.json +62 -62
  24. teradataml/analytics/table_operator/__init__.py +10 -10
  25. teradataml/analytics/uaf/__init__.py +63 -63
  26. teradataml/analytics/utils.py +693 -692
  27. teradataml/analytics/valib.py +1603 -1600
  28. teradataml/automl/__init__.py +1683 -0
  29. teradataml/automl/custom_json_utils.py +1270 -0
  30. teradataml/automl/data_preparation.py +1011 -0
  31. teradataml/automl/data_transformation.py +789 -0
  32. teradataml/automl/feature_engineering.py +1580 -0
  33. teradataml/automl/feature_exploration.py +554 -0
  34. teradataml/automl/model_evaluation.py +151 -0
  35. teradataml/automl/model_training.py +1026 -0
  36. teradataml/catalog/__init__.py +1 -3
  37. teradataml/catalog/byom.py +1759 -1716
  38. teradataml/catalog/function_argument_mapper.py +859 -861
  39. teradataml/catalog/model_cataloging_utils.py +491 -1510
  40. teradataml/clients/auth_client.py +133 -0
  41. teradataml/clients/pkce_client.py +481 -481
  42. teradataml/common/aed_utils.py +7 -2
  43. teradataml/common/bulk_exposed_utils.py +111 -111
  44. teradataml/common/constants.py +1438 -1441
  45. teradataml/common/deprecations.py +160 -0
  46. teradataml/common/exceptions.py +73 -73
  47. teradataml/common/formula.py +742 -742
  48. teradataml/common/garbagecollector.py +597 -635
  49. teradataml/common/messagecodes.py +424 -431
  50. teradataml/common/messages.py +228 -231
  51. teradataml/common/sqlbundle.py +693 -693
  52. teradataml/common/td_coltype_code_to_tdtype.py +48 -48
  53. teradataml/common/utils.py +2424 -2500
  54. teradataml/common/warnings.py +25 -25
  55. teradataml/common/wrapper_utils.py +1 -110
  56. teradataml/config/dummy_file1.cfg +4 -4
  57. teradataml/config/dummy_file2.cfg +2 -2
  58. teradataml/config/sqlengine_alias_definitions_v1.0 +13 -13
  59. teradataml/config/sqlengine_alias_definitions_v1.1 +19 -19
  60. teradataml/config/sqlengine_alias_definitions_v1.3 +18 -18
  61. teradataml/context/aed_context.py +217 -217
  62. teradataml/context/context.py +1091 -999
  63. teradataml/data/A_loan.csv +19 -19
  64. teradataml/data/BINARY_REALS_LEFT.csv +11 -11
  65. teradataml/data/BINARY_REALS_RIGHT.csv +11 -11
  66. teradataml/data/B_loan.csv +49 -49
  67. teradataml/data/BuoyData2.csv +17 -17
  68. teradataml/data/CONVOLVE2_COMPLEX_LEFT.csv +5 -5
  69. teradataml/data/CONVOLVE2_COMPLEX_RIGHT.csv +5 -5
  70. teradataml/data/Convolve2RealsLeft.csv +5 -5
  71. teradataml/data/Convolve2RealsRight.csv +5 -5
  72. teradataml/data/Convolve2ValidLeft.csv +11 -11
  73. teradataml/data/Convolve2ValidRight.csv +11 -11
  74. teradataml/data/DFFTConv_Real_8_8.csv +65 -65
  75. teradataml/data/Orders1_12mf.csv +24 -24
  76. teradataml/data/Pi_loan.csv +7 -7
  77. teradataml/data/SMOOTHED_DATA.csv +7 -7
  78. teradataml/data/TestDFFT8.csv +9 -9
  79. teradataml/data/TestRiver.csv +109 -109
  80. teradataml/data/Traindata.csv +28 -28
  81. teradataml/data/acf.csv +17 -17
  82. teradataml/data/adaboost_example.json +34 -34
  83. teradataml/data/adaboostpredict_example.json +24 -24
  84. teradataml/data/additional_table.csv +10 -10
  85. teradataml/data/admissions_test.csv +21 -21
  86. teradataml/data/admissions_train.csv +41 -41
  87. teradataml/data/admissions_train_nulls.csv +41 -41
  88. teradataml/data/advertising.csv +201 -0
  89. teradataml/data/ageandheight.csv +13 -13
  90. teradataml/data/ageandpressure.csv +31 -31
  91. teradataml/data/antiselect_example.json +36 -36
  92. teradataml/data/antiselect_input.csv +8 -8
  93. teradataml/data/antiselect_input_mixed_case.csv +8 -8
  94. teradataml/data/applicant_external.csv +6 -6
  95. teradataml/data/applicant_reference.csv +6 -6
  96. teradataml/data/arima_example.json +9 -9
  97. teradataml/data/assortedtext_input.csv +8 -8
  98. teradataml/data/attribution_example.json +33 -33
  99. teradataml/data/attribution_sample_table.csv +27 -27
  100. teradataml/data/attribution_sample_table1.csv +6 -6
  101. teradataml/data/attribution_sample_table2.csv +11 -11
  102. teradataml/data/bank_churn.csv +10001 -0
  103. teradataml/data/bank_marketing.csv +11163 -0
  104. teradataml/data/bank_web_clicks1.csv +42 -42
  105. teradataml/data/bank_web_clicks2.csv +91 -91
  106. teradataml/data/bank_web_url.csv +85 -85
  107. teradataml/data/barrier.csv +2 -2
  108. teradataml/data/barrier_new.csv +3 -3
  109. teradataml/data/betweenness_example.json +13 -13
  110. teradataml/data/bike_sharing.csv +732 -0
  111. teradataml/data/bin_breaks.csv +8 -8
  112. teradataml/data/bin_fit_ip.csv +3 -3
  113. teradataml/data/binary_complex_left.csv +11 -11
  114. teradataml/data/binary_complex_right.csv +11 -11
  115. teradataml/data/binary_matrix_complex_left.csv +21 -21
  116. teradataml/data/binary_matrix_complex_right.csv +21 -21
  117. teradataml/data/binary_matrix_real_left.csv +21 -21
  118. teradataml/data/binary_matrix_real_right.csv +21 -21
  119. teradataml/data/blood2ageandweight.csv +26 -26
  120. teradataml/data/bmi.csv +501 -0
  121. teradataml/data/boston.csv +507 -507
  122. teradataml/data/boston2cols.csv +721 -0
  123. teradataml/data/breast_cancer.csv +570 -0
  124. teradataml/data/buoydata_mix.csv +11 -11
  125. teradataml/data/burst_data.csv +5 -5
  126. teradataml/data/burst_example.json +20 -20
  127. teradataml/data/byom_example.json +17 -17
  128. teradataml/data/bytes_table.csv +3 -3
  129. teradataml/data/cal_housing_ex_raw.csv +70 -70
  130. teradataml/data/callers.csv +7 -7
  131. teradataml/data/calls.csv +10 -10
  132. teradataml/data/cars_hist.csv +33 -33
  133. teradataml/data/cat_table.csv +24 -24
  134. teradataml/data/ccm_example.json +31 -31
  135. teradataml/data/ccm_input.csv +91 -91
  136. teradataml/data/ccm_input2.csv +13 -13
  137. teradataml/data/ccmexample.csv +101 -101
  138. teradataml/data/ccmprepare_example.json +8 -8
  139. teradataml/data/ccmprepare_input.csv +91 -91
  140. teradataml/data/cfilter_example.json +12 -12
  141. teradataml/data/changepointdetection_example.json +18 -18
  142. teradataml/data/changepointdetectionrt_example.json +8 -8
  143. teradataml/data/chi_sq.csv +2 -2
  144. teradataml/data/churn_data.csv +14 -14
  145. teradataml/data/churn_emission.csv +35 -35
  146. teradataml/data/churn_initial.csv +3 -3
  147. teradataml/data/churn_state_transition.csv +5 -5
  148. teradataml/data/citedges_2.csv +745 -745
  149. teradataml/data/citvertices_2.csv +1210 -1210
  150. teradataml/data/clicks2.csv +16 -16
  151. teradataml/data/clickstream.csv +12 -12
  152. teradataml/data/clickstream1.csv +11 -11
  153. teradataml/data/closeness_example.json +15 -15
  154. teradataml/data/complaints.csv +21 -21
  155. teradataml/data/complaints_mini.csv +3 -3
  156. teradataml/data/complaints_testtoken.csv +224 -224
  157. teradataml/data/complaints_tokens_test.csv +353 -353
  158. teradataml/data/complaints_traintoken.csv +472 -472
  159. teradataml/data/computers_category.csv +1001 -1001
  160. teradataml/data/computers_test1.csv +1252 -1252
  161. teradataml/data/computers_train1.csv +5009 -5009
  162. teradataml/data/computers_train1_clustered.csv +5009 -5009
  163. teradataml/data/confusionmatrix_example.json +9 -9
  164. teradataml/data/conversion_event_table.csv +3 -3
  165. teradataml/data/corr_input.csv +17 -17
  166. teradataml/data/correlation_example.json +11 -11
  167. teradataml/data/coxhazardratio_example.json +39 -39
  168. teradataml/data/coxph_example.json +15 -15
  169. teradataml/data/coxsurvival_example.json +28 -28
  170. teradataml/data/cpt.csv +41 -41
  171. teradataml/data/credit_ex_merged.csv +45 -45
  172. teradataml/data/customer_loyalty.csv +301 -301
  173. teradataml/data/customer_loyalty_newseq.csv +31 -31
  174. teradataml/data/customer_segmentation_test.csv +2628 -0
  175. teradataml/data/customer_segmentation_train.csv +8069 -0
  176. teradataml/data/dataframe_example.json +146 -146
  177. teradataml/data/decisionforest_example.json +37 -37
  178. teradataml/data/decisionforestpredict_example.json +38 -38
  179. teradataml/data/decisiontree_example.json +21 -21
  180. teradataml/data/decisiontreepredict_example.json +45 -45
  181. teradataml/data/dfft2_size4_real.csv +17 -17
  182. teradataml/data/dfft2_test_matrix16.csv +17 -17
  183. teradataml/data/dfft2conv_real_4_4.csv +65 -65
  184. teradataml/data/diabetes.csv +443 -443
  185. teradataml/data/diabetes_test.csv +89 -89
  186. teradataml/data/dict_table.csv +5 -5
  187. teradataml/data/docperterm_table.csv +4 -4
  188. teradataml/data/docs/__init__.py +1 -1
  189. teradataml/data/docs/byom/docs/DataRobotPredict.py +180 -180
  190. teradataml/data/docs/byom/docs/DataikuPredict.py +177 -177
  191. teradataml/data/docs/byom/docs/H2OPredict.py +324 -324
  192. teradataml/data/docs/byom/docs/ONNXPredict.py +283 -283
  193. teradataml/data/docs/byom/docs/PMMLPredict.py +277 -277
  194. teradataml/data/docs/sqle/docs_17_10/Antiselect.py +82 -82
  195. teradataml/data/docs/sqle/docs_17_10/Attribution.py +199 -199
  196. teradataml/data/docs/sqle/docs_17_10/BincodeFit.py +171 -171
  197. teradataml/data/docs/sqle/docs_17_10/BincodeTransform.py +131 -130
  198. teradataml/data/docs/sqle/docs_17_10/CategoricalSummary.py +86 -86
  199. teradataml/data/docs/sqle/docs_17_10/ChiSq.py +90 -90
  200. teradataml/data/docs/sqle/docs_17_10/ColumnSummary.py +85 -85
  201. teradataml/data/docs/sqle/docs_17_10/ConvertTo.py +95 -95
  202. teradataml/data/docs/sqle/docs_17_10/DecisionForestPredict.py +139 -139
  203. teradataml/data/docs/sqle/docs_17_10/DecisionTreePredict.py +151 -151
  204. teradataml/data/docs/sqle/docs_17_10/FTest.py +160 -160
  205. teradataml/data/docs/sqle/docs_17_10/FillRowId.py +82 -82
  206. teradataml/data/docs/sqle/docs_17_10/Fit.py +87 -87
  207. teradataml/data/docs/sqle/docs_17_10/GLMPredict.py +144 -144
  208. teradataml/data/docs/sqle/docs_17_10/GetRowsWithMissingValues.py +84 -84
  209. teradataml/data/docs/sqle/docs_17_10/GetRowsWithoutMissingValues.py +81 -81
  210. teradataml/data/docs/sqle/docs_17_10/Histogram.py +164 -164
  211. teradataml/data/docs/sqle/docs_17_10/MovingAverage.py +134 -134
  212. teradataml/data/docs/sqle/docs_17_10/NGramSplitter.py +208 -208
  213. teradataml/data/docs/sqle/docs_17_10/NPath.py +265 -265
  214. teradataml/data/docs/sqle/docs_17_10/NaiveBayesPredict.py +116 -116
  215. teradataml/data/docs/sqle/docs_17_10/NaiveBayesTextClassifierPredict.py +176 -176
  216. teradataml/data/docs/sqle/docs_17_10/NumApply.py +147 -147
  217. teradataml/data/docs/sqle/docs_17_10/OneHotEncodingFit.py +134 -132
  218. teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +109 -103
  219. teradataml/data/docs/sqle/docs_17_10/OutlierFilterFit.py +165 -165
  220. teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +105 -101
  221. teradataml/data/docs/sqle/docs_17_10/Pack.py +128 -128
  222. teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesFit.py +111 -111
  223. teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesTransform.py +102 -102
  224. teradataml/data/docs/sqle/docs_17_10/QQNorm.py +104 -104
  225. teradataml/data/docs/sqle/docs_17_10/RoundColumns.py +109 -109
  226. teradataml/data/docs/sqle/docs_17_10/RowNormalizeFit.py +117 -117
  227. teradataml/data/docs/sqle/docs_17_10/RowNormalizeTransform.py +99 -98
  228. teradataml/data/docs/sqle/docs_17_10/SVMSparsePredict.py +152 -152
  229. teradataml/data/docs/sqle/docs_17_10/ScaleFit.py +197 -197
  230. teradataml/data/docs/sqle/docs_17_10/ScaleTransform.py +99 -98
  231. teradataml/data/docs/sqle/docs_17_10/Sessionize.py +113 -113
  232. teradataml/data/docs/sqle/docs_17_10/SimpleImputeFit.py +116 -116
  233. teradataml/data/docs/sqle/docs_17_10/SimpleImputeTransform.py +98 -98
  234. teradataml/data/docs/sqle/docs_17_10/StrApply.py +187 -187
  235. teradataml/data/docs/sqle/docs_17_10/StringSimilarity.py +145 -145
  236. teradataml/data/docs/sqle/docs_17_10/Transform.py +105 -104
  237. teradataml/data/docs/sqle/docs_17_10/UnivariateStatistics.py +141 -141
  238. teradataml/data/docs/sqle/docs_17_10/Unpack.py +214 -214
  239. teradataml/data/docs/sqle/docs_17_10/WhichMax.py +83 -83
  240. teradataml/data/docs/sqle/docs_17_10/WhichMin.py +83 -83
  241. teradataml/data/docs/sqle/docs_17_10/ZTest.py +155 -155
  242. teradataml/data/docs/sqle/docs_17_20/ANOVA.py +186 -126
  243. teradataml/data/docs/sqle/docs_17_20/Antiselect.py +82 -82
  244. teradataml/data/docs/sqle/docs_17_20/Attribution.py +200 -200
  245. teradataml/data/docs/sqle/docs_17_20/BincodeFit.py +171 -171
  246. teradataml/data/docs/sqle/docs_17_20/BincodeTransform.py +139 -138
  247. teradataml/data/docs/sqle/docs_17_20/CategoricalSummary.py +86 -86
  248. teradataml/data/docs/sqle/docs_17_20/ChiSq.py +90 -90
  249. teradataml/data/docs/sqle/docs_17_20/ClassificationEvaluator.py +166 -166
  250. teradataml/data/docs/sqle/docs_17_20/ColumnSummary.py +85 -85
  251. teradataml/data/docs/sqle/docs_17_20/ColumnTransformer.py +245 -243
  252. teradataml/data/docs/sqle/docs_17_20/ConvertTo.py +113 -113
  253. teradataml/data/docs/sqle/docs_17_20/DecisionForest.py +279 -279
  254. teradataml/data/docs/sqle/docs_17_20/DecisionForestPredict.py +144 -144
  255. teradataml/data/docs/sqle/docs_17_20/DecisionTreePredict.py +135 -135
  256. teradataml/data/docs/sqle/docs_17_20/FTest.py +239 -160
  257. teradataml/data/docs/sqle/docs_17_20/FillRowId.py +82 -82
  258. teradataml/data/docs/sqle/docs_17_20/Fit.py +87 -87
  259. teradataml/data/docs/sqle/docs_17_20/GLM.py +541 -380
  260. teradataml/data/docs/sqle/docs_17_20/GLMPerSegment.py +414 -414
  261. teradataml/data/docs/sqle/docs_17_20/GLMPredict.py +144 -144
  262. teradataml/data/docs/sqle/docs_17_20/GLMPredictPerSegment.py +233 -234
  263. teradataml/data/docs/sqle/docs_17_20/GetFutileColumns.py +125 -123
  264. teradataml/data/docs/sqle/docs_17_20/GetRowsWithMissingValues.py +108 -108
  265. teradataml/data/docs/sqle/docs_17_20/GetRowsWithoutMissingValues.py +105 -105
  266. teradataml/data/docs/sqle/docs_17_20/Histogram.py +223 -223
  267. teradataml/data/docs/sqle/docs_17_20/KMeans.py +251 -204
  268. teradataml/data/docs/sqle/docs_17_20/KMeansPredict.py +144 -143
  269. teradataml/data/docs/sqle/docs_17_20/KNN.py +214 -214
  270. teradataml/data/docs/sqle/docs_17_20/MovingAverage.py +134 -134
  271. teradataml/data/docs/sqle/docs_17_20/NGramSplitter.py +208 -208
  272. teradataml/data/docs/sqle/docs_17_20/NPath.py +265 -265
  273. teradataml/data/docs/sqle/docs_17_20/NaiveBayesPredict.py +116 -116
  274. teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierPredict.py +177 -176
  275. teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierTrainer.py +126 -126
  276. teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +118 -117
  277. teradataml/data/docs/sqle/docs_17_20/NonLinearCombineTransform.py +112 -112
  278. teradataml/data/docs/sqle/docs_17_20/NumApply.py +147 -147
  279. teradataml/data/docs/sqle/docs_17_20/OneClassSVM.py +307 -307
  280. teradataml/data/docs/sqle/docs_17_20/OneClassSVMPredict.py +185 -184
  281. teradataml/data/docs/sqle/docs_17_20/OneHotEncodingFit.py +230 -225
  282. teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +121 -115
  283. teradataml/data/docs/sqle/docs_17_20/OrdinalEncodingFit.py +219 -219
  284. teradataml/data/docs/sqle/docs_17_20/OrdinalEncodingTransform.py +127 -127
  285. teradataml/data/docs/sqle/docs_17_20/OutlierFilterFit.py +189 -189
  286. teradataml/data/docs/sqle/docs_17_20/OutlierFilterTransform.py +117 -112
  287. teradataml/data/docs/sqle/docs_17_20/Pack.py +128 -128
  288. teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesFit.py +111 -111
  289. teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesTransform.py +112 -111
  290. teradataml/data/docs/sqle/docs_17_20/QQNorm.py +104 -104
  291. teradataml/data/docs/sqle/docs_17_20/ROC.py +164 -163
  292. teradataml/data/docs/sqle/docs_17_20/RandomProjectionFit.py +154 -154
  293. teradataml/data/docs/sqle/docs_17_20/RandomProjectionMinComponents.py +106 -106
  294. teradataml/data/docs/sqle/docs_17_20/RandomProjectionTransform.py +120 -120
  295. teradataml/data/docs/sqle/docs_17_20/RegressionEvaluator.py +211 -211
  296. teradataml/data/docs/sqle/docs_17_20/RoundColumns.py +108 -108
  297. teradataml/data/docs/sqle/docs_17_20/RowNormalizeFit.py +117 -117
  298. teradataml/data/docs/sqle/docs_17_20/RowNormalizeTransform.py +111 -110
  299. teradataml/data/docs/sqle/docs_17_20/SVM.py +413 -413
  300. teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +213 -202
  301. teradataml/data/docs/sqle/docs_17_20/SVMSparsePredict.py +152 -152
  302. teradataml/data/docs/sqle/docs_17_20/ScaleFit.py +315 -197
  303. teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +202 -109
  304. teradataml/data/docs/sqle/docs_17_20/SentimentExtractor.py +206 -206
  305. teradataml/data/docs/sqle/docs_17_20/Sessionize.py +113 -113
  306. teradataml/data/docs/sqle/docs_17_20/Silhouette.py +152 -152
  307. teradataml/data/docs/sqle/docs_17_20/SimpleImputeFit.py +116 -116
  308. teradataml/data/docs/sqle/docs_17_20/SimpleImputeTransform.py +109 -108
  309. teradataml/data/docs/sqle/docs_17_20/StrApply.py +187 -187
  310. teradataml/data/docs/sqle/docs_17_20/StringSimilarity.py +145 -145
  311. teradataml/data/docs/sqle/docs_17_20/TDDecisionForestPredict.py +207 -207
  312. teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +333 -171
  313. teradataml/data/docs/sqle/docs_17_20/TargetEncodingFit.py +266 -266
  314. teradataml/data/docs/sqle/docs_17_20/TargetEncodingTransform.py +141 -140
  315. teradataml/data/docs/sqle/docs_17_20/TextParser.py +172 -172
  316. teradataml/data/docs/sqle/docs_17_20/TrainTestSplit.py +159 -159
  317. teradataml/data/docs/sqle/docs_17_20/Transform.py +123 -123
  318. teradataml/data/docs/sqle/docs_17_20/UnivariateStatistics.py +141 -141
  319. teradataml/data/docs/sqle/docs_17_20/Unpack.py +214 -214
  320. teradataml/data/docs/sqle/docs_17_20/VectorDistance.py +168 -168
  321. teradataml/data/docs/sqle/docs_17_20/WhichMax.py +83 -83
  322. teradataml/data/docs/sqle/docs_17_20/WhichMin.py +83 -83
  323. teradataml/data/docs/sqle/docs_17_20/WordEmbeddings.py +236 -236
  324. teradataml/data/docs/sqle/docs_17_20/XGBoost.py +361 -353
  325. teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +281 -275
  326. teradataml/data/docs/sqle/docs_17_20/ZTest.py +220 -155
  327. teradataml/data/docs/tableoperator/docs_17_00/ReadNOS.py +429 -429
  328. teradataml/data/docs/tableoperator/docs_17_05/ReadNOS.py +429 -429
  329. teradataml/data/docs/tableoperator/docs_17_05/WriteNOS.py +347 -347
  330. teradataml/data/docs/tableoperator/docs_17_10/ReadNOS.py +428 -428
  331. teradataml/data/docs/tableoperator/docs_17_10/WriteNOS.py +347 -347
  332. teradataml/data/docs/tableoperator/docs_17_20/ReadNOS.py +439 -439
  333. teradataml/data/docs/tableoperator/docs_17_20/WriteNOS.py +386 -386
  334. teradataml/data/docs/uaf/docs_17_20/ACF.py +195 -195
  335. teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +369 -369
  336. teradataml/data/docs/uaf/docs_17_20/ArimaForecast.py +142 -142
  337. teradataml/data/docs/uaf/docs_17_20/ArimaValidate.py +159 -159
  338. teradataml/data/docs/uaf/docs_17_20/BinaryMatrixOp.py +247 -247
  339. teradataml/data/docs/uaf/docs_17_20/BinarySeriesOp.py +252 -252
  340. teradataml/data/docs/uaf/docs_17_20/BreuschGodfrey.py +177 -177
  341. teradataml/data/docs/uaf/docs_17_20/BreuschPaganGodfrey.py +174 -174
  342. teradataml/data/docs/uaf/docs_17_20/Convolve.py +226 -226
  343. teradataml/data/docs/uaf/docs_17_20/Convolve2.py +214 -214
  344. teradataml/data/docs/uaf/docs_17_20/CumulPeriodogram.py +183 -183
  345. teradataml/data/docs/uaf/docs_17_20/DFFT.py +203 -203
  346. teradataml/data/docs/uaf/docs_17_20/DFFT2.py +216 -216
  347. teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +215 -215
  348. teradataml/data/docs/uaf/docs_17_20/DFFTConv.py +191 -191
  349. teradataml/data/docs/uaf/docs_17_20/DTW.py +179 -179
  350. teradataml/data/docs/uaf/docs_17_20/DickeyFuller.py +144 -144
  351. teradataml/data/docs/uaf/docs_17_20/DurbinWatson.py +183 -183
  352. teradataml/data/docs/uaf/docs_17_20/ExtractResults.py +184 -184
  353. teradataml/data/docs/uaf/docs_17_20/FitMetrics.py +172 -172
  354. teradataml/data/docs/uaf/docs_17_20/GenseriesFormula.py +205 -205
  355. teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +142 -142
  356. teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +258 -258
  357. teradataml/data/docs/uaf/docs_17_20/IDFFT.py +164 -164
  358. teradataml/data/docs/uaf/docs_17_20/IDFFT2.py +198 -198
  359. teradataml/data/docs/uaf/docs_17_20/InputValidator.py +120 -120
  360. teradataml/data/docs/uaf/docs_17_20/LineSpec.py +155 -155
  361. teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +214 -214
  362. teradataml/data/docs/uaf/docs_17_20/MAMean.py +173 -173
  363. teradataml/data/docs/uaf/docs_17_20/MInfo.py +133 -133
  364. teradataml/data/docs/uaf/docs_17_20/MatrixMultiply.py +135 -135
  365. teradataml/data/docs/uaf/docs_17_20/MultivarRegr.py +190 -190
  366. teradataml/data/docs/uaf/docs_17_20/PACF.py +158 -158
  367. teradataml/data/docs/uaf/docs_17_20/Portman.py +216 -216
  368. teradataml/data/docs/uaf/docs_17_20/PowerTransform.py +154 -154
  369. teradataml/data/docs/uaf/docs_17_20/Resample.py +228 -228
  370. teradataml/data/docs/uaf/docs_17_20/SInfo.py +122 -122
  371. teradataml/data/docs/uaf/docs_17_20/SeasonalNormalize.py +165 -165
  372. teradataml/data/docs/uaf/docs_17_20/SelectionCriteria.py +173 -173
  373. teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +170 -170
  374. teradataml/data/docs/uaf/docs_17_20/SignifResidmean.py +163 -163
  375. teradataml/data/docs/uaf/docs_17_20/SimpleExp.py +179 -179
  376. teradataml/data/docs/uaf/docs_17_20/Smoothma.py +207 -207
  377. teradataml/data/docs/uaf/docs_17_20/TrackingOp.py +150 -150
  378. teradataml/data/docs/uaf/docs_17_20/UNDIFF.py +171 -171
  379. teradataml/data/docs/uaf/docs_17_20/Unnormalize.py +201 -201
  380. teradataml/data/docs/uaf/docs_17_20/WhitesGeneral.py +169 -169
  381. teradataml/data/dtw_example.json +17 -17
  382. teradataml/data/dtw_t1.csv +11 -11
  383. teradataml/data/dtw_t2.csv +4 -4
  384. teradataml/data/dwt2d_example.json +15 -15
  385. teradataml/data/dwt_example.json +14 -14
  386. teradataml/data/dwt_filter_dim.csv +5 -5
  387. teradataml/data/emission.csv +9 -9
  388. teradataml/data/emp_table_by_dept.csv +19 -19
  389. teradataml/data/employee_info.csv +4 -4
  390. teradataml/data/employee_table.csv +6 -6
  391. teradataml/data/excluding_event_table.csv +2 -2
  392. teradataml/data/finance_data.csv +6 -6
  393. teradataml/data/finance_data2.csv +61 -61
  394. teradataml/data/finance_data3.csv +93 -93
  395. teradataml/data/fish.csv +160 -0
  396. teradataml/data/fm_blood2ageandweight.csv +26 -26
  397. teradataml/data/fmeasure_example.json +11 -11
  398. teradataml/data/followers_leaders.csv +10 -10
  399. teradataml/data/fpgrowth_example.json +12 -12
  400. teradataml/data/frequentpaths_example.json +29 -29
  401. teradataml/data/friends.csv +9 -9
  402. teradataml/data/fs_input.csv +33 -33
  403. teradataml/data/fs_input1.csv +33 -33
  404. teradataml/data/genData.csv +513 -513
  405. teradataml/data/geodataframe_example.json +39 -39
  406. teradataml/data/glass_types.csv +215 -0
  407. teradataml/data/glm_admissions_model.csv +12 -12
  408. teradataml/data/glm_example.json +56 -29
  409. teradataml/data/glml1l2_example.json +28 -28
  410. teradataml/data/glml1l2predict_example.json +54 -54
  411. teradataml/data/glmpredict_example.json +54 -54
  412. teradataml/data/gq_t1.csv +21 -21
  413. teradataml/data/hconvolve_complex_right.csv +5 -5
  414. teradataml/data/hconvolve_complex_rightmulti.csv +5 -5
  415. teradataml/data/histogram_example.json +11 -11
  416. teradataml/data/hmmdecoder_example.json +78 -78
  417. teradataml/data/hmmevaluator_example.json +24 -24
  418. teradataml/data/hmmsupervised_example.json +10 -10
  419. teradataml/data/hmmunsupervised_example.json +7 -7
  420. teradataml/data/house_values.csv +12 -12
  421. teradataml/data/house_values2.csv +13 -13
  422. teradataml/data/housing_cat.csv +7 -7
  423. teradataml/data/housing_data.csv +9 -9
  424. teradataml/data/housing_test.csv +47 -47
  425. teradataml/data/housing_test_binary.csv +47 -47
  426. teradataml/data/housing_train.csv +493 -493
  427. teradataml/data/housing_train_attribute.csv +4 -4
  428. teradataml/data/housing_train_binary.csv +437 -437
  429. teradataml/data/housing_train_parameter.csv +2 -2
  430. teradataml/data/housing_train_response.csv +493 -493
  431. teradataml/data/housing_train_segment.csv +201 -0
  432. teradataml/data/ibm_stock.csv +370 -370
  433. teradataml/data/ibm_stock1.csv +370 -370
  434. teradataml/data/identitymatch_example.json +21 -21
  435. teradataml/data/idf_table.csv +4 -4
  436. teradataml/data/impressions.csv +101 -101
  437. teradataml/data/inflation.csv +21 -21
  438. teradataml/data/initial.csv +3 -3
  439. teradataml/data/insect2Cols.csv +61 -0
  440. teradataml/data/insect_sprays.csv +12 -12
  441. teradataml/data/insurance.csv +1339 -1339
  442. teradataml/data/interpolator_example.json +12 -12
  443. teradataml/data/iris_altinput.csv +481 -481
  444. teradataml/data/iris_attribute_output.csv +8 -8
  445. teradataml/data/iris_attribute_test.csv +121 -121
  446. teradataml/data/iris_attribute_train.csv +481 -481
  447. teradataml/data/iris_category_expect_predict.csv +31 -31
  448. teradataml/data/iris_data.csv +151 -0
  449. teradataml/data/iris_input.csv +151 -151
  450. teradataml/data/iris_response_train.csv +121 -121
  451. teradataml/data/iris_test.csv +31 -31
  452. teradataml/data/iris_train.csv +121 -121
  453. teradataml/data/join_table1.csv +4 -4
  454. teradataml/data/join_table2.csv +4 -4
  455. teradataml/data/jsons/anly_function_name.json +6 -6
  456. teradataml/data/jsons/byom/dataikupredict.json +147 -147
  457. teradataml/data/jsons/byom/datarobotpredict.json +146 -146
  458. teradataml/data/jsons/byom/h2opredict.json +194 -194
  459. teradataml/data/jsons/byom/onnxpredict.json +186 -186
  460. teradataml/data/jsons/byom/pmmlpredict.json +146 -146
  461. teradataml/data/jsons/paired_functions.json +435 -435
  462. teradataml/data/jsons/sqle/16.20/Antiselect.json +56 -56
  463. teradataml/data/jsons/sqle/16.20/Attribution.json +249 -249
  464. teradataml/data/jsons/sqle/16.20/DecisionForestPredict.json +156 -156
  465. teradataml/data/jsons/sqle/16.20/DecisionTreePredict.json +170 -170
  466. teradataml/data/jsons/sqle/16.20/GLMPredict.json +122 -122
  467. teradataml/data/jsons/sqle/16.20/MovingAverage.json +367 -367
  468. teradataml/data/jsons/sqle/16.20/NGramSplitter.json +239 -239
  469. teradataml/data/jsons/sqle/16.20/NaiveBayesPredict.json +136 -136
  470. teradataml/data/jsons/sqle/16.20/NaiveBayesTextClassifierPredict.json +235 -235
  471. teradataml/data/jsons/sqle/16.20/Pack.json +98 -98
  472. teradataml/data/jsons/sqle/16.20/SVMSparsePredict.json +162 -162
  473. teradataml/data/jsons/sqle/16.20/Sessionize.json +105 -105
  474. teradataml/data/jsons/sqle/16.20/StringSimilarity.json +86 -86
  475. teradataml/data/jsons/sqle/16.20/Unpack.json +166 -166
  476. teradataml/data/jsons/sqle/16.20/nPath.json +269 -269
  477. teradataml/data/jsons/sqle/17.00/Antiselect.json +56 -56
  478. teradataml/data/jsons/sqle/17.00/Attribution.json +249 -249
  479. teradataml/data/jsons/sqle/17.00/DecisionForestPredict.json +156 -156
  480. teradataml/data/jsons/sqle/17.00/DecisionTreePredict.json +170 -170
  481. teradataml/data/jsons/sqle/17.00/GLMPredict.json +122 -122
  482. teradataml/data/jsons/sqle/17.00/MovingAverage.json +367 -367
  483. teradataml/data/jsons/sqle/17.00/NGramSplitter.json +239 -239
  484. teradataml/data/jsons/sqle/17.00/NaiveBayesPredict.json +136 -136
  485. teradataml/data/jsons/sqle/17.00/NaiveBayesTextClassifierPredict.json +235 -235
  486. teradataml/data/jsons/sqle/17.00/Pack.json +98 -98
  487. teradataml/data/jsons/sqle/17.00/SVMSparsePredict.json +162 -162
  488. teradataml/data/jsons/sqle/17.00/Sessionize.json +105 -105
  489. teradataml/data/jsons/sqle/17.00/StringSimilarity.json +86 -86
  490. teradataml/data/jsons/sqle/17.00/Unpack.json +166 -166
  491. teradataml/data/jsons/sqle/17.00/nPath.json +269 -269
  492. teradataml/data/jsons/sqle/17.05/Antiselect.json +56 -56
  493. teradataml/data/jsons/sqle/17.05/Attribution.json +249 -249
  494. teradataml/data/jsons/sqle/17.05/DecisionForestPredict.json +156 -156
  495. teradataml/data/jsons/sqle/17.05/DecisionTreePredict.json +170 -170
  496. teradataml/data/jsons/sqle/17.05/GLMPredict.json +122 -122
  497. teradataml/data/jsons/sqle/17.05/MovingAverage.json +367 -367
  498. teradataml/data/jsons/sqle/17.05/NGramSplitter.json +239 -239
  499. teradataml/data/jsons/sqle/17.05/NaiveBayesPredict.json +136 -136
  500. teradataml/data/jsons/sqle/17.05/NaiveBayesTextClassifierPredict.json +235 -235
  501. teradataml/data/jsons/sqle/17.05/Pack.json +98 -98
  502. teradataml/data/jsons/sqle/17.05/SVMSparsePredict.json +162 -162
  503. teradataml/data/jsons/sqle/17.05/Sessionize.json +105 -105
  504. teradataml/data/jsons/sqle/17.05/StringSimilarity.json +86 -86
  505. teradataml/data/jsons/sqle/17.05/Unpack.json +166 -166
  506. teradataml/data/jsons/sqle/17.05/nPath.json +269 -269
  507. teradataml/data/jsons/sqle/17.10/Antiselect.json +56 -56
  508. teradataml/data/jsons/sqle/17.10/Attribution.json +249 -249
  509. teradataml/data/jsons/sqle/17.10/DecisionForestPredict.json +185 -185
  510. teradataml/data/jsons/sqle/17.10/DecisionTreePredict.json +171 -171
  511. teradataml/data/jsons/sqle/17.10/GLMPredict.json +151 -151
  512. teradataml/data/jsons/sqle/17.10/MovingAverage.json +368 -368
  513. teradataml/data/jsons/sqle/17.10/NGramSplitter.json +239 -239
  514. teradataml/data/jsons/sqle/17.10/NaiveBayesPredict.json +149 -149
  515. teradataml/data/jsons/sqle/17.10/NaiveBayesTextClassifierPredict.json +288 -288
  516. teradataml/data/jsons/sqle/17.10/Pack.json +133 -133
  517. teradataml/data/jsons/sqle/17.10/SVMSparsePredict.json +193 -193
  518. teradataml/data/jsons/sqle/17.10/Sessionize.json +105 -105
  519. teradataml/data/jsons/sqle/17.10/StringSimilarity.json +86 -86
  520. teradataml/data/jsons/sqle/17.10/TD_BinCodeFit.json +239 -239
  521. teradataml/data/jsons/sqle/17.10/TD_BinCodeTransform.json +70 -70
  522. teradataml/data/jsons/sqle/17.10/TD_CategoricalSummary.json +53 -53
  523. teradataml/data/jsons/sqle/17.10/TD_Chisq.json +67 -67
  524. teradataml/data/jsons/sqle/17.10/TD_ColumnSummary.json +53 -53
  525. teradataml/data/jsons/sqle/17.10/TD_ConvertTo.json +68 -68
  526. teradataml/data/jsons/sqle/17.10/TD_FTest.json +187 -187
  527. teradataml/data/jsons/sqle/17.10/TD_FillRowID.json +51 -51
  528. teradataml/data/jsons/sqle/17.10/TD_FunctionFit.json +46 -46
  529. teradataml/data/jsons/sqle/17.10/TD_FunctionTransform.json +72 -71
  530. teradataml/data/jsons/sqle/17.10/TD_GetRowsWithMissingValues.json +52 -52
  531. teradataml/data/jsons/sqle/17.10/TD_GetRowsWithoutMissingValues.json +52 -52
  532. teradataml/data/jsons/sqle/17.10/TD_Histogram.json +132 -132
  533. teradataml/data/jsons/sqle/17.10/TD_NumApply.json +147 -147
  534. teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingFit.json +182 -182
  535. teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingTransform.json +65 -64
  536. teradataml/data/jsons/sqle/17.10/TD_OutlierFilterFit.json +196 -196
  537. teradataml/data/jsons/sqle/17.10/TD_OutlierFilterTransform.json +48 -47
  538. teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesFit.json +114 -114
  539. teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesTransform.json +72 -71
  540. teradataml/data/jsons/sqle/17.10/TD_QQNorm.json +111 -111
  541. teradataml/data/jsons/sqle/17.10/TD_RoundColumns.json +93 -93
  542. teradataml/data/jsons/sqle/17.10/TD_RowNormalizeFit.json +127 -127
  543. teradataml/data/jsons/sqle/17.10/TD_RowNormalizeTransform.json +70 -69
  544. teradataml/data/jsons/sqle/17.10/TD_ScaleFit.json +156 -156
  545. teradataml/data/jsons/sqle/17.10/TD_ScaleTransform.json +70 -69
  546. teradataml/data/jsons/sqle/17.10/TD_SimpleImputeFit.json +147 -147
  547. teradataml/data/jsons/sqle/17.10/TD_SimpleImputeTransform.json +48 -47
  548. teradataml/data/jsons/sqle/17.10/TD_StrApply.json +240 -240
  549. teradataml/data/jsons/sqle/17.10/TD_UnivariateStatistics.json +118 -118
  550. teradataml/data/jsons/sqle/17.10/TD_WhichMax.json +52 -52
  551. teradataml/data/jsons/sqle/17.10/TD_WhichMin.json +52 -52
  552. teradataml/data/jsons/sqle/17.10/TD_ZTest.json +171 -171
  553. teradataml/data/jsons/sqle/17.10/Unpack.json +188 -188
  554. teradataml/data/jsons/sqle/17.10/nPath.json +269 -269
  555. teradataml/data/jsons/sqle/17.20/Antiselect.json +56 -56
  556. teradataml/data/jsons/sqle/17.20/Attribution.json +249 -249
  557. teradataml/data/jsons/sqle/17.20/DecisionForestPredict.json +185 -185
  558. teradataml/data/jsons/sqle/17.20/DecisionTreePredict.json +172 -172
  559. teradataml/data/jsons/sqle/17.20/GLMPredict.json +151 -151
  560. teradataml/data/jsons/sqle/17.20/MovingAverage.json +367 -367
  561. teradataml/data/jsons/sqle/17.20/NGramSplitter.json +239 -239
  562. teradataml/data/jsons/sqle/17.20/NaiveBayesPredict.json +149 -149
  563. teradataml/data/jsons/sqle/17.20/NaiveBayesTextClassifierPredict.json +287 -287
  564. teradataml/data/jsons/sqle/17.20/Pack.json +133 -133
  565. teradataml/data/jsons/sqle/17.20/SVMSparsePredict.json +192 -192
  566. teradataml/data/jsons/sqle/17.20/Sessionize.json +105 -105
  567. teradataml/data/jsons/sqle/17.20/StringSimilarity.json +86 -86
  568. teradataml/data/jsons/sqle/17.20/TD_ANOVA.json +148 -76
  569. teradataml/data/jsons/sqle/17.20/TD_BinCodeFit.json +239 -239
  570. teradataml/data/jsons/sqle/17.20/TD_BinCodeTransform.json +71 -71
  571. teradataml/data/jsons/sqle/17.20/TD_CategoricalSummary.json +53 -53
  572. teradataml/data/jsons/sqle/17.20/TD_Chisq.json +67 -67
  573. teradataml/data/jsons/sqle/17.20/TD_ClassificationEvaluator.json +145 -145
  574. teradataml/data/jsons/sqle/17.20/TD_ColumnSummary.json +53 -53
  575. teradataml/data/jsons/sqle/17.20/TD_ColumnTransformer.json +218 -218
  576. teradataml/data/jsons/sqle/17.20/TD_ConvertTo.json +92 -92
  577. teradataml/data/jsons/sqle/17.20/TD_DecisionForest.json +259 -259
  578. teradataml/data/jsons/sqle/17.20/TD_DecisionForestPredict.json +139 -139
  579. teradataml/data/jsons/sqle/17.20/TD_FTest.json +269 -186
  580. teradataml/data/jsons/sqle/17.20/TD_FillRowID.json +52 -52
  581. teradataml/data/jsons/sqle/17.20/TD_FunctionFit.json +46 -46
  582. teradataml/data/jsons/sqle/17.20/TD_FunctionTransform.json +72 -72
  583. teradataml/data/jsons/sqle/17.20/TD_GLM.json +507 -431
  584. teradataml/data/jsons/sqle/17.20/TD_GLMPREDICT.json +168 -125
  585. teradataml/data/jsons/sqle/17.20/TD_GLMPerSegment.json +411 -411
  586. teradataml/data/jsons/sqle/17.20/TD_GLMPredictPerSegment.json +146 -146
  587. teradataml/data/jsons/sqle/17.20/TD_GetFutileColumns.json +93 -91
  588. teradataml/data/jsons/sqle/17.20/TD_GetRowsWithMissingValues.json +76 -76
  589. teradataml/data/jsons/sqle/17.20/TD_GetRowsWithoutMissingValues.json +76 -76
  590. teradataml/data/jsons/sqle/17.20/TD_Histogram.json +152 -152
  591. teradataml/data/jsons/sqle/17.20/TD_KMeans.json +231 -211
  592. teradataml/data/jsons/sqle/17.20/TD_KMeansPredict.json +86 -86
  593. teradataml/data/jsons/sqle/17.20/TD_KNN.json +262 -262
  594. teradataml/data/jsons/sqle/17.20/TD_NaiveBayesTextClassifierTrainer.json +137 -137
  595. teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineFit.json +102 -101
  596. teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineTransform.json +71 -71
  597. teradataml/data/jsons/sqle/17.20/TD_NumApply.json +147 -147
  598. teradataml/data/jsons/sqle/17.20/TD_OneClassSVM.json +315 -315
  599. teradataml/data/jsons/sqle/17.20/TD_OneClassSVMPredict.json +123 -123
  600. teradataml/data/jsons/sqle/17.20/TD_OneHotEncodingFit.json +271 -271
  601. teradataml/data/jsons/sqle/17.20/TD_OneHotEncodingTransform.json +65 -65
  602. teradataml/data/jsons/sqle/17.20/TD_OrdinalEncodingFit.json +229 -229
  603. teradataml/data/jsons/sqle/17.20/TD_OrdinalEncodingTransform.json +75 -75
  604. teradataml/data/jsons/sqle/17.20/TD_OutlierFilterFit.json +217 -217
  605. teradataml/data/jsons/sqle/17.20/TD_OutlierFilterTransform.json +48 -48
  606. teradataml/data/jsons/sqle/17.20/TD_PolynomialFeaturesFit.json +114 -114
  607. teradataml/data/jsons/sqle/17.20/TD_PolynomialFeaturesTransform.json +72 -72
  608. teradataml/data/jsons/sqle/17.20/TD_QQNorm.json +111 -111
  609. teradataml/data/jsons/sqle/17.20/TD_ROC.json +178 -177
  610. teradataml/data/jsons/sqle/17.20/TD_RandomProjectionFit.json +178 -178
  611. teradataml/data/jsons/sqle/17.20/TD_RandomProjectionMinComponents.json +73 -73
  612. teradataml/data/jsons/sqle/17.20/TD_RandomProjectionTransform.json +74 -74
  613. teradataml/data/jsons/sqle/17.20/TD_RegressionEvaluator.json +137 -137
  614. teradataml/data/jsons/sqle/17.20/TD_RoundColumns.json +93 -93
  615. teradataml/data/jsons/sqle/17.20/TD_RowNormalizeFit.json +127 -127
  616. teradataml/data/jsons/sqle/17.20/TD_RowNormalizeTransform.json +70 -70
  617. teradataml/data/jsons/sqle/17.20/TD_SVM.json +389 -389
  618. teradataml/data/jsons/sqle/17.20/TD_SVMPredict.json +142 -124
  619. teradataml/data/jsons/sqle/17.20/TD_ScaleFit.json +309 -156
  620. teradataml/data/jsons/sqle/17.20/TD_ScaleTransform.json +119 -70
  621. teradataml/data/jsons/sqle/17.20/TD_SentimentExtractor.json +193 -193
  622. teradataml/data/jsons/sqle/17.20/TD_Silhouette.json +142 -142
  623. teradataml/data/jsons/sqle/17.20/TD_SimpleImputeFit.json +147 -147
  624. teradataml/data/jsons/sqle/17.20/TD_SimpleImputeTransform.json +48 -48
  625. teradataml/data/jsons/sqle/17.20/TD_StrApply.json +240 -240
  626. teradataml/data/jsons/sqle/17.20/TD_TargetEncodingFit.json +248 -248
  627. teradataml/data/jsons/sqle/17.20/TD_TargetEncodingTransform.json +75 -75
  628. teradataml/data/jsons/sqle/17.20/TD_TextParser.json +192 -192
  629. teradataml/data/jsons/sqle/17.20/TD_TrainTestSplit.json +142 -142
  630. teradataml/data/jsons/sqle/17.20/TD_UnivariateStatistics.json +117 -117
  631. teradataml/data/jsons/sqle/17.20/TD_VectorDistance.json +182 -182
  632. teradataml/data/jsons/sqle/17.20/TD_WhichMax.json +52 -52
  633. teradataml/data/jsons/sqle/17.20/TD_WhichMin.json +52 -52
  634. teradataml/data/jsons/sqle/17.20/TD_WordEmbeddings.json +241 -241
  635. teradataml/data/jsons/sqle/17.20/TD_XGBoost.json +330 -312
  636. teradataml/data/jsons/sqle/17.20/TD_XGBoostPredict.json +195 -182
  637. teradataml/data/jsons/sqle/17.20/TD_ZTest.json +247 -170
  638. teradataml/data/jsons/sqle/17.20/Unpack.json +188 -188
  639. teradataml/data/jsons/sqle/17.20/nPath.json +269 -269
  640. teradataml/data/jsons/tableoperator/17.00/read_nos.json +197 -197
  641. teradataml/data/jsons/tableoperator/17.05/read_nos.json +197 -197
  642. teradataml/data/jsons/tableoperator/17.05/write_nos.json +194 -194
  643. teradataml/data/jsons/tableoperator/17.10/read_nos.json +183 -183
  644. teradataml/data/jsons/tableoperator/17.10/write_nos.json +194 -194
  645. teradataml/data/jsons/tableoperator/17.20/read_nos.json +182 -182
  646. teradataml/data/jsons/tableoperator/17.20/write_nos.json +223 -223
  647. teradataml/data/jsons/uaf/17.20/TD_ACF.json +149 -149
  648. teradataml/data/jsons/uaf/17.20/TD_ARIMAESTIMATE.json +409 -409
  649. teradataml/data/jsons/uaf/17.20/TD_ARIMAFORECAST.json +79 -79
  650. teradataml/data/jsons/uaf/17.20/TD_ARIMAVALIDATE.json +151 -151
  651. teradataml/data/jsons/uaf/17.20/TD_BINARYMATRIXOP.json +109 -109
  652. teradataml/data/jsons/uaf/17.20/TD_BINARYSERIESOP.json +107 -107
  653. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_GODFREY.json +87 -87
  654. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_PAGAN_GODFREY.json +106 -106
  655. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE.json +80 -80
  656. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE2.json +67 -67
  657. teradataml/data/jsons/uaf/17.20/TD_CUMUL_PERIODOGRAM.json +91 -91
  658. teradataml/data/jsons/uaf/17.20/TD_DFFT.json +136 -136
  659. teradataml/data/jsons/uaf/17.20/TD_DFFT2.json +148 -148
  660. teradataml/data/jsons/uaf/17.20/TD_DFFT2CONV.json +108 -108
  661. teradataml/data/jsons/uaf/17.20/TD_DFFTCONV.json +109 -109
  662. teradataml/data/jsons/uaf/17.20/TD_DICKEY_FULLER.json +86 -86
  663. teradataml/data/jsons/uaf/17.20/TD_DIFF.json +91 -91
  664. teradataml/data/jsons/uaf/17.20/TD_DTW.json +116 -116
  665. teradataml/data/jsons/uaf/17.20/TD_DURBIN_WATSON.json +100 -100
  666. teradataml/data/jsons/uaf/17.20/TD_EXTRACT_RESULTS.json +38 -38
  667. teradataml/data/jsons/uaf/17.20/TD_FITMETRICS.json +100 -100
  668. teradataml/data/jsons/uaf/17.20/TD_GENSERIES4FORMULA.json +84 -84
  669. teradataml/data/jsons/uaf/17.20/TD_GENSERIES4SINUSOIDS.json +70 -70
  670. teradataml/data/jsons/uaf/17.20/TD_GOLDFELD_QUANDT.json +152 -152
  671. teradataml/data/jsons/uaf/17.20/TD_HOLT_WINTERS_FORECAST.json +313 -313
  672. teradataml/data/jsons/uaf/17.20/TD_IDFFT.json +57 -57
  673. teradataml/data/jsons/uaf/17.20/TD_IDFFT2.json +94 -94
  674. teradataml/data/jsons/uaf/17.20/TD_INPUTVALIDATOR.json +63 -63
  675. teradataml/data/jsons/uaf/17.20/TD_LINEAR_REGR.json +181 -181
  676. teradataml/data/jsons/uaf/17.20/TD_LINESPEC.json +102 -102
  677. teradataml/data/jsons/uaf/17.20/TD_MAMEAN.json +182 -182
  678. teradataml/data/jsons/uaf/17.20/TD_MATRIXMULTIPLY.json +67 -67
  679. teradataml/data/jsons/uaf/17.20/TD_MINFO.json +66 -66
  680. teradataml/data/jsons/uaf/17.20/TD_MULTIVAR_REGR.json +178 -178
  681. teradataml/data/jsons/uaf/17.20/TD_PACF.json +114 -114
  682. teradataml/data/jsons/uaf/17.20/TD_PORTMAN.json +118 -118
  683. teradataml/data/jsons/uaf/17.20/TD_POWERSPEC.json +175 -175
  684. teradataml/data/jsons/uaf/17.20/TD_POWERTRANSFORM.json +97 -97
  685. teradataml/data/jsons/uaf/17.20/TD_RESAMPLE.json +173 -173
  686. teradataml/data/jsons/uaf/17.20/TD_SEASONALNORMALIZE.json +136 -136
  687. teradataml/data/jsons/uaf/17.20/TD_SELECTION_CRITERIA.json +89 -89
  688. teradataml/data/jsons/uaf/17.20/TD_SIGNIF_PERIODICITIES.json +79 -79
  689. teradataml/data/jsons/uaf/17.20/TD_SIGNIF_RESIDMEAN.json +67 -67
  690. teradataml/data/jsons/uaf/17.20/TD_SIMPLEEXP.json +184 -184
  691. teradataml/data/jsons/uaf/17.20/TD_SINFO.json +57 -57
  692. teradataml/data/jsons/uaf/17.20/TD_SMOOTHMA.json +162 -162
  693. teradataml/data/jsons/uaf/17.20/TD_TRACKINGOP.json +100 -100
  694. teradataml/data/jsons/uaf/17.20/TD_UNDIFF.json +111 -111
  695. teradataml/data/jsons/uaf/17.20/TD_UNNORMALIZE.json +95 -95
  696. teradataml/data/jsons/uaf/17.20/TD_WHITES_GENERAL.json +77 -77
  697. teradataml/data/kmeans_example.json +22 -17
  698. teradataml/data/kmeans_table.csv +10 -0
  699. teradataml/data/kmeans_us_arrests_data.csv +0 -0
  700. teradataml/data/knn_example.json +18 -18
  701. teradataml/data/knnrecommender_example.json +6 -6
  702. teradataml/data/knnrecommenderpredict_example.json +12 -12
  703. teradataml/data/lar_example.json +17 -17
  704. teradataml/data/larpredict_example.json +30 -30
  705. teradataml/data/lc_new_predictors.csv +5 -5
  706. teradataml/data/lc_new_reference.csv +9 -9
  707. teradataml/data/lda_example.json +8 -8
  708. teradataml/data/ldainference_example.json +14 -14
  709. teradataml/data/ldatopicsummary_example.json +8 -8
  710. teradataml/data/levendist_input.csv +13 -13
  711. teradataml/data/levenshteindistance_example.json +10 -10
  712. teradataml/data/linreg_example.json +9 -9
  713. teradataml/data/load_example_data.py +326 -323
  714. teradataml/data/loan_prediction.csv +295 -295
  715. teradataml/data/lungcancer.csv +138 -138
  716. teradataml/data/mappingdata.csv +12 -12
  717. teradataml/data/milk_timeseries.csv +157 -157
  718. teradataml/data/min_max_titanic.csv +4 -4
  719. teradataml/data/minhash_example.json +6 -6
  720. teradataml/data/ml_ratings.csv +7547 -7547
  721. teradataml/data/ml_ratings_10.csv +2445 -2445
  722. teradataml/data/model1_table.csv +5 -5
  723. teradataml/data/model2_table.csv +5 -5
  724. teradataml/data/models/iris_db_glm_model.pmml +56 -56
  725. teradataml/data/models/iris_db_xgb_model.pmml +4471 -4471
  726. teradataml/data/modularity_example.json +12 -12
  727. teradataml/data/movavg_example.json +7 -7
  728. teradataml/data/mtx1.csv +7 -7
  729. teradataml/data/mtx2.csv +13 -13
  730. teradataml/data/multi_model_classification.csv +401 -0
  731. teradataml/data/multi_model_regression.csv +401 -0
  732. teradataml/data/mvdfft8.csv +9 -9
  733. teradataml/data/naivebayes_example.json +9 -9
  734. teradataml/data/naivebayespredict_example.json +19 -19
  735. teradataml/data/naivebayestextclassifier2_example.json +6 -6
  736. teradataml/data/naivebayestextclassifier_example.json +8 -8
  737. teradataml/data/naivebayestextclassifierpredict_example.json +20 -20
  738. teradataml/data/name_Find_configure.csv +10 -10
  739. teradataml/data/namedentityfinder_example.json +14 -14
  740. teradataml/data/namedentityfinderevaluator_example.json +10 -10
  741. teradataml/data/namedentityfindertrainer_example.json +6 -6
  742. teradataml/data/nb_iris_input_test.csv +31 -31
  743. teradataml/data/nb_iris_input_train.csv +121 -121
  744. teradataml/data/nbp_iris_model.csv +13 -13
  745. teradataml/data/ner_extractor_text.csv +2 -2
  746. teradataml/data/ner_sports_test2.csv +29 -29
  747. teradataml/data/ner_sports_train.csv +501 -501
  748. teradataml/data/nerevaluator_example.json +5 -5
  749. teradataml/data/nerextractor_example.json +18 -18
  750. teradataml/data/nermem_sports_test.csv +17 -17
  751. teradataml/data/nermem_sports_train.csv +50 -50
  752. teradataml/data/nertrainer_example.json +6 -6
  753. teradataml/data/ngrams_example.json +6 -6
  754. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Aggregate Functions using SQLAlchemy.ipynb +1455 -1455
  755. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Arithmetic Functions Using SQLAlchemy.ipynb +1993 -1993
  756. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Bit-Byte Manipulation Functions using SQLAlchemy.ipynb +1492 -1492
  757. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Built-in functions using SQLAlchemy.ipynb +536 -536
  758. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Regular Expressions Using SQLAlchemy.ipynb +570 -570
  759. teradataml/data/notebooks/sqlalchemy/Teradata Vantage String Functions Using SQLAlchemy.ipynb +2559 -2559
  760. teradataml/data/notebooks/sqlalchemy/Teradata Vantage Window Aggregate Functions using SQLAlchemy.ipynb +2911 -2911
  761. teradataml/data/notebooks/sqlalchemy/Using Generic SQLAlchemy ClauseElements teradataml DataFrame assign method.ipynb +698 -698
  762. teradataml/data/notebooks/sqlalchemy/teradataml filtering using SQLAlchemy ClauseElements.ipynb +784 -784
  763. teradataml/data/npath_example.json +23 -23
  764. teradataml/data/ntree_example.json +14 -14
  765. teradataml/data/numeric_strings.csv +4 -4
  766. teradataml/data/numerics.csv +4 -4
  767. teradataml/data/ocean_buoy.csv +17 -17
  768. teradataml/data/ocean_buoy2.csv +17 -17
  769. teradataml/data/ocean_buoys.csv +27 -27
  770. teradataml/data/ocean_buoys2.csv +10 -10
  771. teradataml/data/ocean_buoys_nonpti.csv +28 -28
  772. teradataml/data/ocean_buoys_seq.csv +29 -29
  773. teradataml/data/onehot_encoder_train.csv +4 -0
  774. teradataml/data/openml_example.json +92 -0
  775. teradataml/data/optional_event_table.csv +4 -4
  776. teradataml/data/orders1.csv +11 -11
  777. teradataml/data/orders1_12.csv +12 -12
  778. teradataml/data/orders_ex.csv +4 -4
  779. teradataml/data/pack_example.json +8 -8
  780. teradataml/data/package_tracking.csv +19 -19
  781. teradataml/data/package_tracking_pti.csv +18 -18
  782. teradataml/data/pagerank_example.json +13 -13
  783. teradataml/data/paragraphs_input.csv +6 -6
  784. teradataml/data/pathanalyzer_example.json +7 -7
  785. teradataml/data/pathgenerator_example.json +7 -7
  786. teradataml/data/phrases.csv +7 -7
  787. teradataml/data/pivot_example.json +8 -8
  788. teradataml/data/pivot_input.csv +22 -22
  789. teradataml/data/playerRating.csv +31 -31
  790. teradataml/data/postagger_example.json +6 -6
  791. teradataml/data/posttagger_output.csv +44 -44
  792. teradataml/data/production_data.csv +16 -16
  793. teradataml/data/production_data2.csv +7 -7
  794. teradataml/data/randomsample_example.json +31 -31
  795. teradataml/data/randomwalksample_example.json +8 -8
  796. teradataml/data/rank_table.csv +6 -6
  797. teradataml/data/ref_mobile_data.csv +4 -4
  798. teradataml/data/ref_mobile_data_dense.csv +2 -2
  799. teradataml/data/ref_url.csv +17 -17
  800. teradataml/data/restaurant_reviews.csv +7 -7
  801. teradataml/data/river_data.csv +145 -145
  802. teradataml/data/roc_example.json +7 -7
  803. teradataml/data/roc_input.csv +101 -101
  804. teradataml/data/rule_inputs.csv +6 -6
  805. teradataml/data/rule_table.csv +2 -2
  806. teradataml/data/sales.csv +7 -7
  807. teradataml/data/sales_transaction.csv +501 -501
  808. teradataml/data/salesdata.csv +342 -342
  809. teradataml/data/sample_cities.csv +2 -2
  810. teradataml/data/sample_shapes.csv +10 -10
  811. teradataml/data/sample_streets.csv +2 -2
  812. teradataml/data/sampling_example.json +15 -15
  813. teradataml/data/sax_example.json +8 -8
  814. teradataml/data/scale_attributes.csv +3 -0
  815. teradataml/data/scale_example.json +74 -23
  816. teradataml/data/scale_housing.csv +11 -11
  817. teradataml/data/scale_housing_test.csv +6 -6
  818. teradataml/data/scale_input_part_sparse.csv +31 -0
  819. teradataml/data/scale_input_partitioned.csv +16 -0
  820. teradataml/data/scale_input_sparse.csv +11 -0
  821. teradataml/data/scale_parameters.csv +3 -0
  822. teradataml/data/scale_stat.csv +11 -11
  823. teradataml/data/scalebypartition_example.json +13 -13
  824. teradataml/data/scalemap_example.json +13 -13
  825. teradataml/data/scalesummary_example.json +12 -12
  826. teradataml/data/score_category.csv +101 -101
  827. teradataml/data/score_summary.csv +4 -4
  828. teradataml/data/script_example.json +9 -9
  829. teradataml/data/scripts/deploy_script.py +84 -0
  830. teradataml/data/scripts/mapper.R +20 -0
  831. teradataml/data/scripts/mapper.py +15 -15
  832. teradataml/data/scripts/mapper_replace.py +15 -15
  833. teradataml/data/scripts/sklearn/__init__.py +0 -0
  834. teradataml/data/scripts/sklearn/sklearn_fit.py +171 -0
  835. teradataml/data/scripts/sklearn/sklearn_fit_predict.py +127 -0
  836. teradataml/data/scripts/sklearn/sklearn_function.template +108 -0
  837. teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +148 -0
  838. teradataml/data/scripts/sklearn/sklearn_neighbors.py +143 -0
  839. teradataml/data/scripts/sklearn/sklearn_score.py +119 -0
  840. teradataml/data/scripts/sklearn/sklearn_transform.py +171 -0
  841. teradataml/data/seeds.csv +10 -10
  842. teradataml/data/sentenceextractor_example.json +6 -6
  843. teradataml/data/sentiment_extract_input.csv +11 -11
  844. teradataml/data/sentiment_train.csv +16 -16
  845. teradataml/data/sentiment_word.csv +20 -20
  846. teradataml/data/sentiment_word_input.csv +19 -19
  847. teradataml/data/sentimentextractor_example.json +24 -24
  848. teradataml/data/sentimenttrainer_example.json +8 -8
  849. teradataml/data/sequence_table.csv +10 -10
  850. teradataml/data/seriessplitter_example.json +7 -7
  851. teradataml/data/sessionize_example.json +17 -17
  852. teradataml/data/sessionize_table.csv +116 -116
  853. teradataml/data/setop_test1.csv +24 -24
  854. teradataml/data/setop_test2.csv +22 -22
  855. teradataml/data/soc_nw_edges.csv +10 -10
  856. teradataml/data/soc_nw_vertices.csv +7 -7
  857. teradataml/data/souvenir_timeseries.csv +167 -167
  858. teradataml/data/sparse_iris_attribute.csv +5 -5
  859. teradataml/data/sparse_iris_test.csv +121 -121
  860. teradataml/data/sparse_iris_train.csv +601 -601
  861. teradataml/data/star1.csv +6 -6
  862. teradataml/data/state_transition.csv +5 -5
  863. teradataml/data/stock_data.csv +53 -53
  864. teradataml/data/stock_movement.csv +11 -11
  865. teradataml/data/stock_vol.csv +76 -76
  866. teradataml/data/stop_words.csv +8 -8
  867. teradataml/data/store_sales.csv +37 -37
  868. teradataml/data/stringsimilarity_example.json +7 -7
  869. teradataml/data/strsimilarity_input.csv +13 -13
  870. teradataml/data/students.csv +101 -101
  871. teradataml/data/svm_iris_input_test.csv +121 -121
  872. teradataml/data/svm_iris_input_train.csv +481 -481
  873. teradataml/data/svm_iris_model.csv +7 -7
  874. teradataml/data/svmdense_example.json +9 -9
  875. teradataml/data/svmdensepredict_example.json +18 -18
  876. teradataml/data/svmsparse_example.json +7 -7
  877. teradataml/data/svmsparsepredict_example.json +13 -13
  878. teradataml/data/svmsparsesummary_example.json +7 -7
  879. teradataml/data/target_mobile_data.csv +13 -13
  880. teradataml/data/target_mobile_data_dense.csv +5 -5
  881. teradataml/data/templatedata.csv +1201 -1201
  882. teradataml/data/templates/open_source_ml.json +9 -0
  883. teradataml/data/teradataml_example.json +150 -1
  884. teradataml/data/test_classification.csv +101 -0
  885. teradataml/data/test_loan_prediction.csv +53 -53
  886. teradataml/data/test_pacf_12.csv +37 -37
  887. teradataml/data/test_prediction.csv +101 -0
  888. teradataml/data/test_regression.csv +101 -0
  889. teradataml/data/test_river2.csv +109 -109
  890. teradataml/data/text_inputs.csv +6 -6
  891. teradataml/data/textchunker_example.json +7 -7
  892. teradataml/data/textclassifier_example.json +6 -6
  893. teradataml/data/textclassifier_input.csv +7 -7
  894. teradataml/data/textclassifiertrainer_example.json +6 -6
  895. teradataml/data/textmorph_example.json +5 -5
  896. teradataml/data/textparser_example.json +15 -15
  897. teradataml/data/texttagger_example.json +11 -11
  898. teradataml/data/texttokenizer_example.json +6 -6
  899. teradataml/data/texttrainer_input.csv +11 -11
  900. teradataml/data/tf_example.json +6 -6
  901. teradataml/data/tfidf_example.json +13 -13
  902. teradataml/data/tfidf_input1.csv +201 -201
  903. teradataml/data/tfidf_train.csv +6 -6
  904. teradataml/data/time_table1.csv +535 -535
  905. teradataml/data/time_table2.csv +14 -14
  906. teradataml/data/timeseriesdata.csv +1601 -1601
  907. teradataml/data/timeseriesdatasetsd4.csv +105 -105
  908. teradataml/data/titanic.csv +892 -892
  909. teradataml/data/token_table.csv +696 -696
  910. teradataml/data/train_multiclass.csv +101 -0
  911. teradataml/data/train_regression.csv +101 -0
  912. teradataml/data/train_regression_multiple_labels.csv +101 -0
  913. teradataml/data/train_tracking.csv +27 -27
  914. teradataml/data/transformation_table.csv +5 -5
  915. teradataml/data/transformation_table_new.csv +1 -1
  916. teradataml/data/tv_spots.csv +16 -16
  917. teradataml/data/twod_climate_data.csv +117 -117
  918. teradataml/data/uaf_example.json +475 -475
  919. teradataml/data/univariatestatistics_example.json +8 -8
  920. teradataml/data/unpack_example.json +9 -9
  921. teradataml/data/unpivot_example.json +9 -9
  922. teradataml/data/unpivot_input.csv +8 -8
  923. teradataml/data/us_air_pass.csv +36 -36
  924. teradataml/data/us_population.csv +624 -624
  925. teradataml/data/us_states_shapes.csv +52 -52
  926. teradataml/data/varmax_example.json +17 -17
  927. teradataml/data/vectordistance_example.json +25 -25
  928. teradataml/data/ville_climatedata.csv +121 -121
  929. teradataml/data/ville_tempdata.csv +12 -12
  930. teradataml/data/ville_tempdata1.csv +12 -12
  931. teradataml/data/ville_temperature.csv +11 -11
  932. teradataml/data/waveletTable.csv +1605 -1605
  933. teradataml/data/waveletTable2.csv +1605 -1605
  934. teradataml/data/weightedmovavg_example.json +8 -8
  935. teradataml/data/wft_testing.csv +5 -5
  936. teradataml/data/wine_data.csv +1600 -0
  937. teradataml/data/word_embed_input_table1.csv +5 -5
  938. teradataml/data/word_embed_input_table2.csv +4 -4
  939. teradataml/data/word_embed_model.csv +22 -22
  940. teradataml/data/words_input.csv +13 -13
  941. teradataml/data/xconvolve_complex_left.csv +6 -6
  942. teradataml/data/xconvolve_complex_leftmulti.csv +6 -6
  943. teradataml/data/xgboost_example.json +35 -35
  944. teradataml/data/xgboostpredict_example.json +31 -31
  945. teradataml/data/ztest_example.json +16 -0
  946. teradataml/dataframe/copy_to.py +1769 -1698
  947. teradataml/dataframe/data_transfer.py +2812 -2745
  948. teradataml/dataframe/dataframe.py +17630 -16946
  949. teradataml/dataframe/dataframe_utils.py +1875 -1740
  950. teradataml/dataframe/fastload.py +794 -603
  951. teradataml/dataframe/indexer.py +424 -424
  952. teradataml/dataframe/setop.py +1179 -1166
  953. teradataml/dataframe/sql.py +10174 -6432
  954. teradataml/dataframe/sql_function_parameters.py +439 -388
  955. teradataml/dataframe/sql_functions.py +652 -652
  956. teradataml/dataframe/sql_interfaces.py +220 -220
  957. teradataml/dataframe/vantage_function_types.py +674 -630
  958. teradataml/dataframe/window.py +693 -692
  959. teradataml/dbutils/__init__.py +3 -3
  960. teradataml/dbutils/dbutils.py +1167 -1150
  961. teradataml/dbutils/filemgr.py +267 -267
  962. teradataml/gen_ai/__init__.py +2 -2
  963. teradataml/gen_ai/convAI.py +472 -472
  964. teradataml/geospatial/__init__.py +3 -3
  965. teradataml/geospatial/geodataframe.py +1105 -1094
  966. teradataml/geospatial/geodataframecolumn.py +392 -387
  967. teradataml/geospatial/geometry_types.py +925 -925
  968. teradataml/hyperparameter_tuner/__init__.py +1 -1
  969. teradataml/hyperparameter_tuner/optimizer.py +3783 -2993
  970. teradataml/hyperparameter_tuner/utils.py +281 -187
  971. teradataml/lib/aed_0_1.dll +0 -0
  972. teradataml/lib/libaed_0_1.dylib +0 -0
  973. teradataml/lib/libaed_0_1.so +0 -0
  974. teradataml/libaed_0_1.dylib +0 -0
  975. teradataml/libaed_0_1.so +0 -0
  976. teradataml/opensource/__init__.py +1 -0
  977. teradataml/opensource/sklearn/__init__.py +1 -0
  978. teradataml/opensource/sklearn/_class.py +255 -0
  979. teradataml/opensource/sklearn/_sklearn_wrapper.py +1715 -0
  980. teradataml/opensource/sklearn/_wrapper_utils.py +268 -0
  981. teradataml/opensource/sklearn/constants.py +54 -0
  982. teradataml/options/__init__.py +130 -124
  983. teradataml/options/configure.py +358 -336
  984. teradataml/options/display.py +176 -176
  985. teradataml/plot/__init__.py +2 -2
  986. teradataml/plot/axis.py +1388 -1388
  987. teradataml/plot/constants.py +15 -15
  988. teradataml/plot/figure.py +398 -398
  989. teradataml/plot/plot.py +760 -760
  990. teradataml/plot/query_generator.py +83 -83
  991. teradataml/plot/subplot.py +216 -216
  992. teradataml/scriptmgmt/UserEnv.py +3791 -3761
  993. teradataml/scriptmgmt/__init__.py +3 -3
  994. teradataml/scriptmgmt/lls_utils.py +1719 -1604
  995. teradataml/series/series.py +532 -532
  996. teradataml/series/series_utils.py +71 -71
  997. teradataml/table_operators/Apply.py +949 -917
  998. teradataml/table_operators/Script.py +1718 -1982
  999. teradataml/table_operators/TableOperator.py +1255 -1616
  1000. teradataml/table_operators/__init__.py +2 -3
  1001. teradataml/table_operators/apply_query_generator.py +262 -262
  1002. teradataml/table_operators/query_generator.py +507 -507
  1003. teradataml/table_operators/table_operator_query_generator.py +460 -460
  1004. teradataml/table_operators/table_operator_util.py +631 -639
  1005. teradataml/table_operators/templates/dataframe_apply.template +184 -184
  1006. teradataml/table_operators/templates/dataframe_map.template +176 -176
  1007. teradataml/table_operators/templates/script_executor.template +170 -170
  1008. teradataml/utils/dtypes.py +684 -684
  1009. teradataml/utils/internal_buffer.py +84 -84
  1010. teradataml/utils/print_versions.py +205 -205
  1011. teradataml/utils/utils.py +410 -410
  1012. teradataml/utils/validators.py +2277 -2115
  1013. {teradataml-17.20.0.7.dist-info → teradataml-20.0.0.1.dist-info}/METADATA +346 -45
  1014. teradataml-20.0.0.1.dist-info/RECORD +1056 -0
  1015. {teradataml-17.20.0.7.dist-info → teradataml-20.0.0.1.dist-info}/WHEEL +1 -1
  1016. {teradataml-17.20.0.7.dist-info → teradataml-20.0.0.1.dist-info}/zip-safe +1 -1
  1017. teradataml/analytics/mle/AdaBoost.py +0 -651
  1018. teradataml/analytics/mle/AdaBoostPredict.py +0 -564
  1019. teradataml/analytics/mle/Antiselect.py +0 -342
  1020. teradataml/analytics/mle/Arima.py +0 -641
  1021. teradataml/analytics/mle/ArimaPredict.py +0 -477
  1022. teradataml/analytics/mle/Attribution.py +0 -1070
  1023. teradataml/analytics/mle/Betweenness.py +0 -658
  1024. teradataml/analytics/mle/Burst.py +0 -711
  1025. teradataml/analytics/mle/CCM.py +0 -600
  1026. teradataml/analytics/mle/CCMPrepare.py +0 -324
  1027. teradataml/analytics/mle/CFilter.py +0 -460
  1028. teradataml/analytics/mle/ChangePointDetection.py +0 -572
  1029. teradataml/analytics/mle/ChangePointDetectionRT.py +0 -477
  1030. teradataml/analytics/mle/Closeness.py +0 -737
  1031. teradataml/analytics/mle/ConfusionMatrix.py +0 -420
  1032. teradataml/analytics/mle/Correlation.py +0 -477
  1033. teradataml/analytics/mle/Correlation2.py +0 -573
  1034. teradataml/analytics/mle/CoxHazardRatio.py +0 -679
  1035. teradataml/analytics/mle/CoxPH.py +0 -556
  1036. teradataml/analytics/mle/CoxSurvival.py +0 -478
  1037. teradataml/analytics/mle/CumulativeMovAvg.py +0 -363
  1038. teradataml/analytics/mle/DTW.py +0 -623
  1039. teradataml/analytics/mle/DWT.py +0 -564
  1040. teradataml/analytics/mle/DWT2D.py +0 -599
  1041. teradataml/analytics/mle/DecisionForest.py +0 -716
  1042. teradataml/analytics/mle/DecisionForestEvaluator.py +0 -363
  1043. teradataml/analytics/mle/DecisionForestPredict.py +0 -561
  1044. teradataml/analytics/mle/DecisionTree.py +0 -830
  1045. teradataml/analytics/mle/DecisionTreePredict.py +0 -528
  1046. teradataml/analytics/mle/ExponentialMovAvg.py +0 -418
  1047. teradataml/analytics/mle/FMeasure.py +0 -402
  1048. teradataml/analytics/mle/FPGrowth.py +0 -734
  1049. teradataml/analytics/mle/FrequentPaths.py +0 -695
  1050. teradataml/analytics/mle/GLM.py +0 -558
  1051. teradataml/analytics/mle/GLML1L2.py +0 -547
  1052. teradataml/analytics/mle/GLML1L2Predict.py +0 -519
  1053. teradataml/analytics/mle/GLMPredict.py +0 -529
  1054. teradataml/analytics/mle/HMMDecoder.py +0 -945
  1055. teradataml/analytics/mle/HMMEvaluator.py +0 -901
  1056. teradataml/analytics/mle/HMMSupervised.py +0 -521
  1057. teradataml/analytics/mle/HMMUnsupervised.py +0 -572
  1058. teradataml/analytics/mle/Histogram.py +0 -561
  1059. teradataml/analytics/mle/IDWT.py +0 -476
  1060. teradataml/analytics/mle/IDWT2D.py +0 -493
  1061. teradataml/analytics/mle/IdentityMatch.py +0 -763
  1062. teradataml/analytics/mle/Interpolator.py +0 -918
  1063. teradataml/analytics/mle/KMeans.py +0 -485
  1064. teradataml/analytics/mle/KNN.py +0 -627
  1065. teradataml/analytics/mle/KNNRecommender.py +0 -488
  1066. teradataml/analytics/mle/KNNRecommenderPredict.py +0 -581
  1067. teradataml/analytics/mle/LAR.py +0 -439
  1068. teradataml/analytics/mle/LARPredict.py +0 -478
  1069. teradataml/analytics/mle/LDA.py +0 -548
  1070. teradataml/analytics/mle/LDAInference.py +0 -492
  1071. teradataml/analytics/mle/LDATopicSummary.py +0 -464
  1072. teradataml/analytics/mle/LevenshteinDistance.py +0 -450
  1073. teradataml/analytics/mle/LinReg.py +0 -433
  1074. teradataml/analytics/mle/LinRegPredict.py +0 -438
  1075. teradataml/analytics/mle/MinHash.py +0 -544
  1076. teradataml/analytics/mle/Modularity.py +0 -587
  1077. teradataml/analytics/mle/NEREvaluator.py +0 -410
  1078. teradataml/analytics/mle/NERExtractor.py +0 -595
  1079. teradataml/analytics/mle/NERTrainer.py +0 -458
  1080. teradataml/analytics/mle/NGrams.py +0 -570
  1081. teradataml/analytics/mle/NPath.py +0 -634
  1082. teradataml/analytics/mle/NTree.py +0 -549
  1083. teradataml/analytics/mle/NaiveBayes.py +0 -462
  1084. teradataml/analytics/mle/NaiveBayesPredict.py +0 -513
  1085. teradataml/analytics/mle/NaiveBayesTextClassifier.py +0 -607
  1086. teradataml/analytics/mle/NaiveBayesTextClassifier2.py +0 -531
  1087. teradataml/analytics/mle/NaiveBayesTextClassifierPredict.py +0 -799
  1088. teradataml/analytics/mle/NamedEntityFinder.py +0 -529
  1089. teradataml/analytics/mle/NamedEntityFinderEvaluator.py +0 -414
  1090. teradataml/analytics/mle/NamedEntityFinderTrainer.py +0 -396
  1091. teradataml/analytics/mle/POSTagger.py +0 -417
  1092. teradataml/analytics/mle/Pack.py +0 -411
  1093. teradataml/analytics/mle/PageRank.py +0 -535
  1094. teradataml/analytics/mle/PathAnalyzer.py +0 -426
  1095. teradataml/analytics/mle/PathGenerator.py +0 -367
  1096. teradataml/analytics/mle/PathStart.py +0 -464
  1097. teradataml/analytics/mle/PathSummarizer.py +0 -470
  1098. teradataml/analytics/mle/Pivot.py +0 -471
  1099. teradataml/analytics/mle/ROC.py +0 -425
  1100. teradataml/analytics/mle/RandomSample.py +0 -637
  1101. teradataml/analytics/mle/RandomWalkSample.py +0 -490
  1102. teradataml/analytics/mle/SAX.py +0 -779
  1103. teradataml/analytics/mle/SVMDense.py +0 -677
  1104. teradataml/analytics/mle/SVMDensePredict.py +0 -536
  1105. teradataml/analytics/mle/SVMDenseSummary.py +0 -437
  1106. teradataml/analytics/mle/SVMSparse.py +0 -557
  1107. teradataml/analytics/mle/SVMSparsePredict.py +0 -553
  1108. teradataml/analytics/mle/SVMSparseSummary.py +0 -435
  1109. teradataml/analytics/mle/Sampling.py +0 -549
  1110. teradataml/analytics/mle/Scale.py +0 -565
  1111. teradataml/analytics/mle/ScaleByPartition.py +0 -496
  1112. teradataml/analytics/mle/ScaleMap.py +0 -378
  1113. teradataml/analytics/mle/ScaleSummary.py +0 -320
  1114. teradataml/analytics/mle/SentenceExtractor.py +0 -363
  1115. teradataml/analytics/mle/SentimentEvaluator.py +0 -432
  1116. teradataml/analytics/mle/SentimentExtractor.py +0 -578
  1117. teradataml/analytics/mle/SentimentTrainer.py +0 -405
  1118. teradataml/analytics/mle/SeriesSplitter.py +0 -641
  1119. teradataml/analytics/mle/Sessionize.py +0 -475
  1120. teradataml/analytics/mle/SimpleMovAvg.py +0 -397
  1121. teradataml/analytics/mle/StringSimilarity.py +0 -425
  1122. teradataml/analytics/mle/TF.py +0 -389
  1123. teradataml/analytics/mle/TFIDF.py +0 -504
  1124. teradataml/analytics/mle/TextChunker.py +0 -414
  1125. teradataml/analytics/mle/TextClassifier.py +0 -399
  1126. teradataml/analytics/mle/TextClassifierEvaluator.py +0 -413
  1127. teradataml/analytics/mle/TextClassifierTrainer.py +0 -565
  1128. teradataml/analytics/mle/TextMorph.py +0 -494
  1129. teradataml/analytics/mle/TextParser.py +0 -623
  1130. teradataml/analytics/mle/TextTagger.py +0 -530
  1131. teradataml/analytics/mle/TextTokenizer.py +0 -502
  1132. teradataml/analytics/mle/UnivariateStatistics.py +0 -488
  1133. teradataml/analytics/mle/Unpack.py +0 -526
  1134. teradataml/analytics/mle/Unpivot.py +0 -438
  1135. teradataml/analytics/mle/VarMax.py +0 -776
  1136. teradataml/analytics/mle/VectorDistance.py +0 -762
  1137. teradataml/analytics/mle/WeightedMovAvg.py +0 -400
  1138. teradataml/analytics/mle/XGBoost.py +0 -842
  1139. teradataml/analytics/mle/XGBoostPredict.py +0 -627
  1140. teradataml/analytics/mle/__init__.py +0 -123
  1141. teradataml/analytics/mle/json/adaboost_mle.json +0 -135
  1142. teradataml/analytics/mle/json/adaboostpredict_mle.json +0 -85
  1143. teradataml/analytics/mle/json/antiselect_mle.json +0 -34
  1144. teradataml/analytics/mle/json/antiselect_mle_mle.json +0 -34
  1145. teradataml/analytics/mle/json/arima_mle.json +0 -172
  1146. teradataml/analytics/mle/json/arimapredict_mle.json +0 -52
  1147. teradataml/analytics/mle/json/attribution_mle_mle.json +0 -143
  1148. teradataml/analytics/mle/json/betweenness_mle.json +0 -97
  1149. teradataml/analytics/mle/json/burst_mle.json +0 -140
  1150. teradataml/analytics/mle/json/ccm_mle.json +0 -124
  1151. teradataml/analytics/mle/json/ccmprepare_mle.json +0 -14
  1152. teradataml/analytics/mle/json/cfilter_mle.json +0 -93
  1153. teradataml/analytics/mle/json/changepointdetection_mle.json +0 -92
  1154. teradataml/analytics/mle/json/changepointdetectionrt_mle.json +0 -78
  1155. teradataml/analytics/mle/json/closeness_mle.json +0 -104
  1156. teradataml/analytics/mle/json/confusionmatrix_mle.json +0 -79
  1157. teradataml/analytics/mle/json/correlation_mle.json +0 -86
  1158. teradataml/analytics/mle/json/correlationreduce_mle.json +0 -49
  1159. teradataml/analytics/mle/json/coxhazardratio_mle.json +0 -89
  1160. teradataml/analytics/mle/json/coxph_mle.json +0 -98
  1161. teradataml/analytics/mle/json/coxsurvival_mle.json +0 -79
  1162. teradataml/analytics/mle/json/cumulativemovavg_mle.json +0 -34
  1163. teradataml/analytics/mle/json/decisionforest_mle.json +0 -167
  1164. teradataml/analytics/mle/json/decisionforestevaluator_mle.json +0 -33
  1165. teradataml/analytics/mle/json/decisionforestpredict_mle_mle.json +0 -74
  1166. teradataml/analytics/mle/json/decisiontree_mle.json +0 -194
  1167. teradataml/analytics/mle/json/decisiontreepredict_mle_mle.json +0 -86
  1168. teradataml/analytics/mle/json/dtw_mle.json +0 -97
  1169. teradataml/analytics/mle/json/dwt2d_mle.json +0 -116
  1170. teradataml/analytics/mle/json/dwt_mle.json +0 -101
  1171. teradataml/analytics/mle/json/exponentialmovavg_mle.json +0 -55
  1172. teradataml/analytics/mle/json/fmeasure_mle.json +0 -58
  1173. teradataml/analytics/mle/json/fpgrowth_mle.json +0 -159
  1174. teradataml/analytics/mle/json/frequentpaths_mle.json +0 -129
  1175. teradataml/analytics/mle/json/glm_mle.json +0 -111
  1176. teradataml/analytics/mle/json/glml1l2_mle.json +0 -106
  1177. teradataml/analytics/mle/json/glml1l2predict_mle.json +0 -57
  1178. teradataml/analytics/mle/json/glmpredict_mle_mle.json +0 -74
  1179. teradataml/analytics/mle/json/histogram_mle.json +0 -100
  1180. teradataml/analytics/mle/json/hmmdecoder_mle.json +0 -192
  1181. teradataml/analytics/mle/json/hmmevaluator_mle.json +0 -206
  1182. teradataml/analytics/mle/json/hmmsupervised_mle.json +0 -91
  1183. teradataml/analytics/mle/json/hmmunsupervised_mle.json +0 -114
  1184. teradataml/analytics/mle/json/identitymatch_mle.json +0 -88
  1185. teradataml/analytics/mle/json/idwt2d_mle.json +0 -73
  1186. teradataml/analytics/mle/json/idwt_mle.json +0 -66
  1187. teradataml/analytics/mle/json/interpolator_mle.json +0 -151
  1188. teradataml/analytics/mle/json/kmeans_mle.json +0 -97
  1189. teradataml/analytics/mle/json/knn_mle.json +0 -141
  1190. teradataml/analytics/mle/json/knnrecommender_mle.json +0 -111
  1191. teradataml/analytics/mle/json/knnrecommenderpredict_mle.json +0 -75
  1192. teradataml/analytics/mle/json/lar_mle.json +0 -78
  1193. teradataml/analytics/mle/json/larpredict_mle.json +0 -69
  1194. teradataml/analytics/mle/json/lda_mle.json +0 -130
  1195. teradataml/analytics/mle/json/ldainference_mle.json +0 -78
  1196. teradataml/analytics/mle/json/ldatopicsummary_mle.json +0 -64
  1197. teradataml/analytics/mle/json/levenshteindistance_mle.json +0 -92
  1198. teradataml/analytics/mle/json/linreg_mle.json +0 -42
  1199. teradataml/analytics/mle/json/linregpredict_mle.json +0 -56
  1200. teradataml/analytics/mle/json/minhash_mle.json +0 -113
  1201. teradataml/analytics/mle/json/modularity_mle.json +0 -91
  1202. teradataml/analytics/mle/json/naivebayespredict_mle_mle.json +0 -85
  1203. teradataml/analytics/mle/json/naivebayesreduce_mle.json +0 -52
  1204. teradataml/analytics/mle/json/naivebayestextclassifierpredict_mle_mle.json +0 -147
  1205. teradataml/analytics/mle/json/naivebayestextclassifiertrainer2_mle.json +0 -108
  1206. teradataml/analytics/mle/json/naivebayestextclassifiertrainer_mle.json +0 -102
  1207. teradataml/analytics/mle/json/namedentityfinder_mle.json +0 -84
  1208. teradataml/analytics/mle/json/namedentityfinderevaluatorreduce_mle.json +0 -43
  1209. teradataml/analytics/mle/json/namedentityfindertrainer_mle.json +0 -64
  1210. teradataml/analytics/mle/json/nerevaluator_mle.json +0 -54
  1211. teradataml/analytics/mle/json/nerextractor_mle.json +0 -87
  1212. teradataml/analytics/mle/json/nertrainer_mle.json +0 -89
  1213. teradataml/analytics/mle/json/ngrams_mle.json +0 -137
  1214. teradataml/analytics/mle/json/ngramsplitter_mle_mle.json +0 -137
  1215. teradataml/analytics/mle/json/npath@coprocessor_mle.json +0 -73
  1216. teradataml/analytics/mle/json/ntree@coprocessor_mle.json +0 -123
  1217. teradataml/analytics/mle/json/pack_mle.json +0 -58
  1218. teradataml/analytics/mle/json/pack_mle_mle.json +0 -58
  1219. teradataml/analytics/mle/json/pagerank_mle.json +0 -81
  1220. teradataml/analytics/mle/json/pathanalyzer_mle.json +0 -63
  1221. teradataml/analytics/mle/json/pathgenerator_mle.json +0 -40
  1222. teradataml/analytics/mle/json/pathstart_mle.json +0 -62
  1223. teradataml/analytics/mle/json/pathsummarizer_mle.json +0 -72
  1224. teradataml/analytics/mle/json/pivoting_mle.json +0 -71
  1225. teradataml/analytics/mle/json/postagger_mle.json +0 -51
  1226. teradataml/analytics/mle/json/randomsample_mle.json +0 -131
  1227. teradataml/analytics/mle/json/randomwalksample_mle.json +0 -85
  1228. teradataml/analytics/mle/json/roc_mle.json +0 -73
  1229. teradataml/analytics/mle/json/sampling_mle.json +0 -75
  1230. teradataml/analytics/mle/json/sax_mle.json +0 -154
  1231. teradataml/analytics/mle/json/scale_mle.json +0 -93
  1232. teradataml/analytics/mle/json/scalebypartition_mle.json +0 -89
  1233. teradataml/analytics/mle/json/scalemap_mle.json +0 -44
  1234. teradataml/analytics/mle/json/scalesummary_mle.json +0 -14
  1235. teradataml/analytics/mle/json/sentenceextractor_mle.json +0 -41
  1236. teradataml/analytics/mle/json/sentimentevaluator_mle.json +0 -43
  1237. teradataml/analytics/mle/json/sentimentextractor_mle.json +0 -100
  1238. teradataml/analytics/mle/json/sentimenttrainer_mle.json +0 -68
  1239. teradataml/analytics/mle/json/seriessplitter_mle.json +0 -133
  1240. teradataml/analytics/mle/json/sessionize_mle_mle.json +0 -62
  1241. teradataml/analytics/mle/json/simplemovavg_mle.json +0 -48
  1242. teradataml/analytics/mle/json/stringsimilarity_mle.json +0 -50
  1243. teradataml/analytics/mle/json/stringsimilarity_mle_mle.json +0 -50
  1244. teradataml/analytics/mle/json/svmdense_mle.json +0 -165
  1245. teradataml/analytics/mle/json/svmdensepredict_mle.json +0 -95
  1246. teradataml/analytics/mle/json/svmdensesummary_mle.json +0 -58
  1247. teradataml/analytics/mle/json/svmsparse_mle.json +0 -148
  1248. teradataml/analytics/mle/json/svmsparsepredict_mle_mle.json +0 -103
  1249. teradataml/analytics/mle/json/svmsparsesummary_mle.json +0 -57
  1250. teradataml/analytics/mle/json/textchunker_mle.json +0 -40
  1251. teradataml/analytics/mle/json/textclassifier_mle.json +0 -51
  1252. teradataml/analytics/mle/json/textclassifierevaluator_mle.json +0 -43
  1253. teradataml/analytics/mle/json/textclassifiertrainer_mle.json +0 -103
  1254. teradataml/analytics/mle/json/textmorph_mle.json +0 -63
  1255. teradataml/analytics/mle/json/textparser_mle.json +0 -166
  1256. teradataml/analytics/mle/json/texttagger_mle.json +0 -81
  1257. teradataml/analytics/mle/json/texttokenizer_mle.json +0 -91
  1258. teradataml/analytics/mle/json/tf_mle.json +0 -33
  1259. teradataml/analytics/mle/json/tfidf_mle.json +0 -34
  1260. teradataml/analytics/mle/json/univariatestatistics_mle.json +0 -81
  1261. teradataml/analytics/mle/json/unpack_mle.json +0 -91
  1262. teradataml/analytics/mle/json/unpack_mle_mle.json +0 -91
  1263. teradataml/analytics/mle/json/unpivoting_mle.json +0 -63
  1264. teradataml/analytics/mle/json/varmax_mle.json +0 -176
  1265. teradataml/analytics/mle/json/vectordistance_mle.json +0 -179
  1266. teradataml/analytics/mle/json/weightedmovavg_mle.json +0 -48
  1267. teradataml/analytics/mle/json/xgboost_mle.json +0 -178
  1268. teradataml/analytics/mle/json/xgboostpredict_mle.json +0 -104
  1269. teradataml/analytics/sqle/Antiselect.py +0 -321
  1270. teradataml/analytics/sqle/Attribution.py +0 -603
  1271. teradataml/analytics/sqle/DecisionForestPredict.py +0 -408
  1272. teradataml/analytics/sqle/GLMPredict.py +0 -430
  1273. teradataml/analytics/sqle/MovingAverage.py +0 -543
  1274. teradataml/analytics/sqle/NGramSplitter.py +0 -548
  1275. teradataml/analytics/sqle/NPath.py +0 -632
  1276. teradataml/analytics/sqle/NaiveBayesTextClassifierPredict.py +0 -515
  1277. teradataml/analytics/sqle/Pack.py +0 -388
  1278. teradataml/analytics/sqle/SVMSparsePredict.py +0 -464
  1279. teradataml/analytics/sqle/Sessionize.py +0 -390
  1280. teradataml/analytics/sqle/StringSimilarity.py +0 -400
  1281. teradataml/analytics/sqle/Unpack.py +0 -503
  1282. teradataml/analytics/sqle/json/antiselect_sqle.json +0 -21
  1283. teradataml/analytics/sqle/json/attribution_sqle.json +0 -92
  1284. teradataml/analytics/sqle/json/decisionforestpredict_sqle.json +0 -48
  1285. teradataml/analytics/sqle/json/glmpredict_sqle.json +0 -48
  1286. teradataml/analytics/sqle/json/h2opredict_sqle.json +0 -63
  1287. teradataml/analytics/sqle/json/movingaverage_sqle.json +0 -58
  1288. teradataml/analytics/sqle/json/naivebayestextclassifierpredict_sqle.json +0 -76
  1289. teradataml/analytics/sqle/json/ngramsplitter_sqle.json +0 -126
  1290. teradataml/analytics/sqle/json/npath_sqle.json +0 -67
  1291. teradataml/analytics/sqle/json/pack_sqle.json +0 -47
  1292. teradataml/analytics/sqle/json/pmmlpredict_sqle.json +0 -55
  1293. teradataml/analytics/sqle/json/sessionize_sqle.json +0 -43
  1294. teradataml/analytics/sqle/json/stringsimilarity_sqle.json +0 -39
  1295. teradataml/analytics/sqle/json/svmsparsepredict_sqle.json +0 -74
  1296. teradataml/analytics/sqle/json/unpack_sqle.json +0 -80
  1297. teradataml/catalog/model_cataloging.py +0 -980
  1298. teradataml/config/mlengine_alias_definitions_v1.0 +0 -118
  1299. teradataml/config/mlengine_alias_definitions_v1.1 +0 -127
  1300. teradataml/config/mlengine_alias_definitions_v1.3 +0 -129
  1301. teradataml/table_operators/sandbox_container_util.py +0 -643
  1302. teradataml-17.20.0.7.dist-info/RECORD +0 -1280
  1303. {teradataml-17.20.0.7.dist-info → teradataml-20.0.0.1.dist-info}/top_level.txt +0 -0
@@ -1,1740 +1,1875 @@
- # -*- coding: utf-8 -*-
- """
-
- Unpublished work.
- Copyright (c) 2018 by Teradata Corporation. All rights reserved.
- TERADATA CORPORATION CONFIDENTIAL AND TRADE SECRET
-
- Primary Owner: mark.sandan@teradata.com
- Secondary Owner:
-
- This file implements util functions of data frame.
- """
-
- import numbers
- import pandas as pd
- from collections import OrderedDict
-
- from teradataml.common.utils import UtilFuncs
- from teradataml.common.aed_utils import AedUtils
- from teradataml.common.constants import AEDConstants, PTITableConstants, \
-     SQLPattern, PythonTypes
- from teradataml.common.sqlbundle import SQLBundle
- from teradataml.common.exceptions import TeradataMlException
- from teradataml.common.messages import Messages
- from teradataml.common.messagecodes import MessageCodes
-
- from teradataml.context.context import get_context, get_connection
- from teradataml.context.context import _get_current_databasename
- from teradataml.dbutils.dbutils import _execute_query_and_generate_pandas_df
-
- from teradataml.options.display import display
- from teradataml.options.configure import configure
- from teradataml.utils.utils import execute_sql
-
- from teradatasqlalchemy.types import FLOAT, NUMBER, DECIMAL, PERIOD_TIMESTAMP
- from teradatasqlalchemy.dialect import preparer, dialect as td_dialect
- import teradataml.dataframe as tdmldf
-
- from sqlalchemy.sql import select
- from sqlalchemy.sql.expression import text
- from sqlalchemy import table, column, func
- from datetime import datetime, date, time
- from decimal import Decimal
-
- # TODO - Need to write unit testcases for these functions
- class DataFrameUtils():
-
-     @staticmethod
-     def _execute_node_return_db_object_name(nodeid, metaexpression = None):
-         """
-         Fetches queries and view names from the AED node and creates views from the queries.
-         Additionally inspects the metaexpression for consistency.
-
-         PARAMETERS:
-             nodeid: nodeid to execute
-             metaexpression: (optional) updated _metaexpr to validate
-
-         EXAMPLES:
-             _execute_node_return_db_object_name(nodeid)
-             _execute_node_return_db_object_name(nodeid, metaexpr)
-
-         RETURNS:
-             Top level view name.
-
-         """
-         aed_obj = AedUtils()
-         if not aed_obj._aed_is_node_executed(nodeid):
-
-             view_query_node_type_list = aed_obj._aed_get_exec_query(nodeid)
-             view_names, queries, node_query_types, node_ids = view_query_node_type_list
-
-             # Executing Nodes / Creating Views
-             for index in range(len(queries) - 1, -1, -1):
-                 is_persist = False
-                 if metaexpression and metaexpression._is_persist:
-                     is_persist = True
-
-                 try:
-                     if node_query_types[index] == AEDConstants.AED_QUERY_NODE_TYPE_ML_QUERY_MULTI_OUTPUT.value or \
-                             ("OUT TABLE " in queries[index] and SQLPattern.SQLMR.value.match(queries[index])) or \
-                             is_persist:
-                         # TODO:: OR condition in above needs to be removed once AED support is added.
-                         UtilFuncs._create_table(view_names[index], queries[index])
-
-                     elif node_query_types[index] in ['groupby', 'groupbytime']:
-                         # If query_type is either groupby or groupbytime, get its parent
-                         # nodeid and execute queries for the same
-                         parent_nodeid = aed_obj._aed_get_parent_nodeids(nodeid)[0]
-                         DataFrameUtils._execute_node_return_db_object_name(parent_nodeid)
-
-                     elif node_query_types[index] == AEDConstants.AED_QUERY_NODE_TYPE_REFERENCE.value:
-                         # Reference nodes - To be ignored.
-                         pass
-
-                     else:
-                         UtilFuncs._create_view(view_names[index], queries[index])
-
-                     # Updating Node Status for executed Node
-                     aed_obj._aed_update_node_state_single(node_ids[index], AEDConstants.AED_NODE_EXECUTED.value)
-
-                 except Exception as emsg:
-                     # TODO:: Append node execution details to emsg.
-                     # Node description, such as nodeType or node operation, should be added
-                     # here in 'emsg' to give away more information about where exactly
-                     # node execution failed.
-                     raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_EXEC_SQL_FAILED, str(emsg)),
-                                               MessageCodes.TDMLDF_EXEC_SQL_FAILED)
-
-         # Setting New Table name retrieved to TDML DF
-         result_table_view_name = aed_obj._aed_get_tablename(nodeid)
-         # validate the metaexpression
-         if configure._validate_metaexpression:
-             DataFrameUtils._validate_metaexpression(result_table_view_name, metaexpression)
-
-         return result_table_view_name
-
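The loop above materializes the AED query list from the deepest dependency up to the top-level node, so every view or table exists before anything that selects from it. A minimal standalone sketch of that ordering, with a hypothetical query list and a print-only create_view stand-in (not part of the package):

    # Each entry may reference names that appear later in the list,
    # which is why execution walks the list in reverse.
    queries = [("v_top", "SELECT a FROM v_mid"),        # hypothetical
               ("v_mid", "SELECT a FROM base_table")]   # hypothetical

    def create_view(name, query):
        # Stand-in for UtilFuncs._create_view; only shows the order.
        print("CREATE VIEW {} AS ({})".format(name, query))

    for name, query in reversed(queries):
        create_view(name, query)   # v_mid is created first, then v_top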
116
-
117
- @staticmethod
118
- def _validate_metaexpression(result_table_view_name, metaexpression):
119
- """
120
- Inspects the metaexpression for consistency with the underlying table/view
121
-
122
- PARAMETERS:
123
- result_table_view_name: a string representing the table/view name to check column metadata
124
- metaexpression: the metaexpr of the DataFrame to compare against the result_table_view_name
125
-
126
- EXAMPLES:
127
- _validate_metaexpression('t1', df._metaexpr)
128
- _execute_node_return_db_object_name(nodeid, metaexpr)
129
-
130
- RETURNS:
131
- None
132
- Outputs RuntimeWarnings if mismatches are found
133
-
134
- """
135
- # metaexpression should have already been updated
136
- if metaexpression is not None:
137
-
138
- name = lambda x: x[0]
139
- type_ = lambda x: x[1]
140
-
141
- # compare sorted by name of column
142
- df = sorted(UtilFuncs._describe_column(DataFrameUtils._get_metadata_from_table(result_table_view_name)), key = lambda x: x[0])
143
- meta = sorted(metaexpression.c, key = lambda x: x.name)
144
-
145
- # check length
146
- if len(df) == len(meta):
147
- for i in range(len(df)):
148
-
149
- # map Teradata type to python type
150
- meta_type = UtilFuncs._teradata_type_to_python_type(meta[i].type)
151
-
152
- # compare column names and types
153
- if meta[i].name != name(df[i]) or meta_type != type_(df[i]):
154
- err_msg = "[Mismatch when checking %s]\n\t[Table/View] %s %s\n\t[MetaExpression] %s %s (mapped from => %s)\n"
155
- raise RuntimeError(err_msg % (result_table_view_name,
156
- name(df[i]), type_(df[i]),
157
- meta[i].name, meta_type, meta[i].type))
158
- else:
159
- err_msg = "[Length mismatch when checking %s]\nSource Table/View has length %s but MetaExpression has length %s"
160
- raise RuntimeError(err_msg % (result_table_view_name, len(df), len(meta)))
161
-
162
- @staticmethod
163
- def _get_dataframe_print_string(table_name, index_label, orderby=None, undropped_index=None):
164
- """
165
- Builds string output for teradataml DataFrame
166
-
167
- PARAMETERS:
168
- table_name - Name of the database table to read from.
169
- index_label - String/List specifying column to use as index.
170
- orderby - order expression to sort returned rows
171
-
172
- EXAMPLES:
173
- _get_dataframe_print_string('table_name', None, None)
174
-
175
- RETURNS:
176
- String representation of a pandas DataFrame.
177
-
178
- """
179
- read_query = SQLBundle._build_top_n_print_query(table_name, display.max_rows, orderby)
180
-
181
- if index_label is not None:
182
- pandas_df = _execute_query_and_generate_pandas_df(read_query, index=index_label)
183
- else:
184
- pandas_df = _execute_query_and_generate_pandas_df(read_query)
185
-
186
- return pandas_df.to_string()
187
-
188
- @staticmethod
189
- def _get_pprint_dtypes(column_names_and_types, null_count=False):
190
- """
191
- returns a string containing the column names and types.
192
- If null_count is not None, the string will also contain
193
- the number of non-null values for each column.
194
-
195
- PARAMETERS:
196
- column_names_and_types - List of column names and types.
197
- null_count(optional) - List of the non-null count for each column.
198
-
199
- EXAMPLES:
200
- >>>print(_get_pprint_dtypes(column_names_and_types)
201
- accounts str
202
- Feb float
203
- Jan int
204
- Mar int
205
- Apr int
206
- datetime str
207
-
208
- >>>print(_get_pprint_dtypes(column_names_and_types, null_count)
209
- accounts 3 non-null str
210
- Feb 3 non-null float
211
- Jan 3 non-null int
212
- Mar 3 non-null int
213
- Apr 3 non-null int
214
- datetime 3 non-null str
215
-
216
- RAISES:
217
-
218
- """
219
-
220
- col_names = [i[0] for i in column_names_and_types]
221
- col_types = [i[1] for i in column_names_and_types]
222
- max_col_names = len(max(col_names, key=len)) + 4
223
- max_col_types = len(max(col_types, key=len))
224
- dtypes_string = ""
225
- if not null_count:
226
- for colname, coltype in column_names_and_types:
227
- dtypes_string += "{0: <{name_width}}{1: >{type_width}}\n".format(colname, coltype,
228
- name_width=max_col_names,
229
- type_width=max_col_types)
230
- else:
231
- null_count = [i[2] for i in column_names_and_types]
232
- max_null_count = len(str(max(null_count, key=len)))
233
- for colname, coltype, num_nulls in column_names_and_types:
234
- dtypes_string += "{0: <{name_width}}{1: <{count_width}} non-null {2: <{type_width}}\n".format(colname,
235
- num_nulls,
236
- coltype,
237
- name_width=max_col_names,
238
- count_width=max_null_count,
239
- type_width=max_col_types)
240
- # Remove last new line character.
241
- dtypes_string = dtypes_string[:-1]
242
- return dtypes_string
243
-
244
- @staticmethod
245
- def _get_metadata_from_table(table_name):
246
- """
247
- Retrieves column metadata by executing a HELP COLUMN command.
248
-
249
- PARAMETERS:
250
- table_name - The table name or view name.
251
-
252
- RETURNS:
253
- returns the result set (column information) from HELP COLUMN.
254
-
255
- RAISES:
256
- Database error if an error occurred while executing the HELP COLUMN.
257
-
258
- EXAMPLES:
259
- df = DataFrame.from_table('mytab')
260
- metadata = _get_metadata_from_table(df._table_name)
261
- """
262
- # Construct HELP COLUMN command.
263
- help_col_sql = SQLBundle._build_help_column(table_name)
264
- # Execute HELP COLUMN command.
265
- return UtilFuncs._execute_query(help_col_sql)
266
-
267
- @staticmethod
268
- def _extract_select_string(select_expression):
269
- """
270
- Takes in a string/list representing a Pandas selection clause of any of the forms (only):
271
- a) "col1" or 'col1'
272
- b) ["col 1"] or ['col 1']
273
- c) ["col1", "col2", "col3"] or ['col1', 'col2', 'col3']
274
- d) [['col1', 'col2', 'col3']] or [["col1", "col2", "col3"]]
275
-
276
- And returns a list with column strings representing the selection of the form:
277
- a) ['col1']
278
- b) ['col 1']
279
- c) ['col1','col2','col3']
280
- d) ['col1','col2','col3']
281
-
282
- Column Names ("col1", "col2"..) are Strings representing database table Columns.
283
- All Standard Teradata Data-Types for columns supported: INTEGER, VARCHAR(5), FLOAT.
284
-
285
- PARAMETERS:
286
- selection_expression - Expression representing column selection
287
- Type - String or List of Strings or List of List (Single level only)
288
- Required - Yes
289
-
290
- EXAMPLES:
291
- UtilFuncs._extract_select_string([['col1', 'col2']])
292
- UtilFuncs._extract_select_string("col1")
293
- UtilFuncs._extract_select_string(["col1"])
294
- UtilFuncs._extract_select_string(["col1","col2","col3"])
295
-
296
- RETURNS:
297
- List of Strings representing column names.
298
-
299
- RAISES:
300
- TeradataMlException
301
- """
302
- tdp = preparer(td_dialect)
303
- column_list = []
304
-
305
- # Single String column
306
- if isinstance(select_expression, str):
307
- # Error handling - Empty String
308
- if select_expression == "":
309
- raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
310
- MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
311
- else:
312
- column_list.append(tdp.quote("{0}".format(select_expression.strip())))
313
-
314
- # Error Handling - [], [""], [None], ["None"], ['col1', None], ['col1', '']
315
- elif isinstance(select_expression, list) and (len(select_expression) == 0 or
316
- any(element in [None, "None", ""] for element in select_expression)):
317
- raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
318
- MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
319
-
320
- # List - ["col1"] or ["col1", "col2", "col3"]
321
- elif isinstance(select_expression, list) and all(isinstance(element, str) for element in select_expression):
322
- if len(select_expression) == 1:
323
- column_list.append(tdp.quote("{0}".format(select_expression[0].strip())))
324
- else:
325
- column_list = [tdp.quote("{0}".format(element.strip())) for element in select_expression]
326
-
327
- # List of List (Single level only - Pandas Syntax) - [["col1", "col2", "col3"]]
328
- elif isinstance(select_expression, list) and isinstance(select_expression[0], list):
329
- # Error Handling - [[]], [[""]], [[None]], [['col1', None]], [['col1', "None"]], ["col1", ""]
330
- if len(select_expression[0]) == 0 or any(element in [None, "None", ""] for element in select_expression[0]):
331
- raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
332
- MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
333
-
334
- else:
335
- column_list = [tdp.quote("{0}".format(element.strip())) for element in select_expression[0]]
336
-
337
- # Any other Format - Raise Format Exception
338
- else:
339
- raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_INVALID_FORMAT),
340
- MessageCodes.TDMLDF_SELECT_INVALID_FORMAT)
341
- return column_list
342
-
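A condensed, dependency-free sketch of the normalization performed by _extract_select_string, substituting naive double-quoting for the teradatasqlalchemy preparer (illustrative only, with error handling reduced to a single check):

    def extract_select_sketch(expr):
        # Unwrap the single-level nested-list form: [["c1", "c2"]] -> ["c1", "c2"].
        if isinstance(expr, list) and expr and isinstance(expr[0], list):
            expr = expr[0]
        cols = [expr] if isinstance(expr, str) else list(expr)
        if not cols or any(c in (None, "None", "") for c in cols):
            raise ValueError("selection must name at least one column")
        return ['"{}"'.format(c.strip()) for c in cols]

    # extract_select_sketch("col1")                 -> ['"col1"']
    # extract_select_sketch([["col1", "col 2"]])    -> ['"col1"', '"col 2"']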
-     @staticmethod
-     def _get_primary_index_from_table(table_name):
-         """
-         Retrieves the primary index by executing a HELP INDEX command.
-         PARAMETERS:
-             table_name - The table name or volatile table name.
-         RETURNS:
-             Returns a list containing the primary index columns from HELP INDEX.
-             If there is no primary index (NoPI table), returns None.
-         RAISES:
-             Database error if an error occurred while executing the HELP INDEX.
-         EXAMPLES:
-             df = DataFrame.from_table('mytab')
-             index_labels = DataFrameUtils._get_primary_index_from_table(df._table_name)
-         """
-         # Construct HELP INDEX command.
-         help_index_sql = SQLBundle._build_help_index(table_name)
-
-         # Execute HELP INDEX command.
-         rows = UtilFuncs._execute_query(help_index_sql)
-         index_labels = []
-         for row in rows:
-             # row[1] specifies whether the index is Primary or Secondary.
-             if row[1].rstrip() == 'P':
-                 # row[2] specifies a string of comma separated column names that form the primary index
-                 if "," in row[2]:
-                     index_cols = row[2].split(',')
-                 else:
-                     index_cols = [row[2]]
-                 for index_col in index_cols:
-                     # Since the TD_TIMEBUCKET column in PTI tables is not functionally available, it can be ignored
-                     # from the index information as well (else a warning is generated by SQLAlchemy).
-                     # row[12] corresponds to the 'Timebucket' column in the results of the 'help index' SQL command,
-                     # which is available only when the version supports PTI tables.
-                     if index_col == PTITableConstants.TD_TIMEBUCKET.value and len(row) > 12 and row[12] is not None:
-                         continue
-                     else:
-                         index_labels.append(index_col)
-
-         if len(index_labels) > 0:
-             return index_labels
-         else:
-             return None
-
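A compact illustration of the primary-index extraction above, using fabricated HELP INDEX rows (real rows carry many more fields, including the timebucket column handled above):

    # Fabricated rows: (index_number, index_kind, column_names)
    rows = [(1, 'P ', 'accounts,txn_date'),
            (2, 'S ', 'region')]

    index_labels = [col
                    for _, kind, cols in rows
                    if kind.rstrip() == 'P'        # primary index rows only
                    for col in cols.split(',')]
    # -> ['accounts', 'txn_date']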
-     @staticmethod
-     def __validate_sort_type_raise_exception(sort_col_type):
-         """
-         Raises a TeradataMlException for an invalid/incorrect
-         "sort_col_type" encountered in the "_validate_sort_col_type" function.
-
-         PARAMETERS:
-             sort_col_type: The sort column type.
-
-         RETURNS:
-             None
-
-         RAISES:
-             TeradataMlException
-
-         EXAMPLES:
-             df_utils.__validate_sort_type_raise_exception(PythonTypes.PY_STRING_TYPE.value)
-         """
-         msg = Messages.get_message(MessageCodes.TDMLDF_DROP_INVALID_INDEX_TYPE).format(sort_col_type)
-         raise TeradataMlException(msg, MessageCodes.TDMLDF_DROP_INVALID_INDEX_TYPE)
-
-     @staticmethod
-     def _validate_sort_col_type(sort_col_type, sort_col_values):
-         """
-         Validates a list of sort column values against the sort column type.
-
-         PARAMETERS:
-             sort_col_type - The sort column type.
-             sort_col_values - A single value or list-like values.
-
-         RETURNS:
-             None
-
-         RAISES:
-             TeradataMlException
-
-         EXAMPLES:
-             df_utils._validate_sort_col_type(PythonTypes.PY_STRING_TYPE.value, ["Jan", "Feb"])
-             df_utils._validate_sort_col_type(PythonTypes.PY_STRING_TYPE.value, "Jan")
-             df_utils._validate_sort_col_type(PythonTypes.PY_INT_TYPE.value, [1, 2])
-         """
-         if isinstance(sort_col_values, list):
-             if sort_col_type == PythonTypes.PY_STRING_TYPE.value:
-                 if not all(isinstance(i, str) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_FLOAT_TYPE.value:
-                 if not all(isinstance(i, float) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DECIMAL_TYPE.value:
-                 if not all(isinstance(i, Decimal) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DATETIME_TYPE.value:
-                 if not all(isinstance(i, datetime) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_TIME_TYPE.value:
-                 if not all(isinstance(i, time) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DATE_TYPE.value:
-                 if not all(isinstance(i, date) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_BYTES_TYPE.value:
-                 if not all(isinstance(i, bytes) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             else:  # numeric type
-                 if not all(isinstance(i, numbers.Integral) for i in sort_col_values):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-         elif isinstance(sort_col_values, (tuple, dict)):
-             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_DROP_ARGS),
-                                       MessageCodes.TDMLDF_DROP_ARGS)
-         else:
-             if sort_col_type == PythonTypes.PY_STRING_TYPE.value:
-                 if not isinstance(sort_col_values, str):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_FLOAT_TYPE.value:
-                 if not isinstance(sort_col_values, float):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DECIMAL_TYPE.value:
-                 if not isinstance(sort_col_values, Decimal):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DATETIME_TYPE.value:
-                 if not isinstance(sort_col_values, datetime):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_TIME_TYPE.value:
-                 if not isinstance(sort_col_values, time):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_DATE_TYPE.value:
-                 if not isinstance(sort_col_values, date):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             elif sort_col_type == PythonTypes.PY_BYTES_TYPE.value:
-                 if not isinstance(sort_col_values, bytes):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-             else:  # numeric type
-                 if not isinstance(sort_col_values, numbers.Integral):
-                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
-
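The chain above dispatches on a type-name string to a per-value isinstance check; a table-driven sketch of the same idea (the name strings here are hypothetical abbreviations, not the actual PythonTypes values):

    import numbers
    from datetime import datetime, date, time
    from decimal import Decimal

    _SORT_TYPE_CHECKS = {              # hypothetical name -> expected type
        "str": str, "float": float, "decimal": Decimal,
        "datetime": datetime, "time": time, "date": date, "bytes": bytes,
    }

    def validate_sort_values_sketch(type_name, values):
        # Unknown names fall back to the integral check, as in the chain above.
        expected = _SORT_TYPE_CHECKS.get(type_name, numbers.Integral)
        values = values if isinstance(values, list) else [values]
        if not all(isinstance(v, expected) for v in values):
            raise TypeError("sort values do not match {}".format(type_name))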
-     @staticmethod
-     def _get_required_columns_types_from_metaexpr(metaexpr, col_list = None):
-         """
-         Retrieves column names and types from a meta expression. To get types for only
-         some columns, pass those columns to the 'col_list' argument.
-
-         PARAMETERS:
-             metaexpr - Meta expression from which columns and types are to be retrieved.
-             col_list - Column list for which to get types.
-
-         RETURNS:
-             Dictionary: key as column name and datatype as value.
-
-         EXAMPLES:
-             df = DataFrame.from_table('mytab')
-             metadata = _get_required_columns_types_from_metaexpr(df._metaexpr)
-         """
-
-         if isinstance(col_list, str):
-             col_list = [col_list]
-
-         if col_list is not None and not isinstance(col_list, list):
-             return None
-
-         meta_cols = metaexpr.t.c
-         meta_columns = [c.name for c in meta_cols]
-         col_names = []
-         col_types = []
-
-         # When column list to retrieve is not provided, return meta-data for all columns.
-         if col_list is None:
-             for col_name in meta_columns:
-                 col_names.append(meta_cols[col_name].name)
-                 col_types.append(meta_cols[col_name].type)
-
-         # Return meta-data for only requested columns otherwise.
-         else:
-             for col_name in col_list:
-                 if DataFrameUtils._check_column_exists(col_name, meta_columns):
-                     # _metaexpr saves columns without quotes, so unquoting.
-                     unquoted_col_name = col_name.replace('"', "")
-                     col_names.append(meta_cols[unquoted_col_name].name)
-                     col_types.append(meta_cols[unquoted_col_name].type)
-
-         return OrderedDict(zip(col_names, col_types))
-
-     @staticmethod
-     def _check_column_exists(column_name, df_columns):
-         """
-         Checks whether the provided column is present in the list of columns.
-         Note:
-             It is the calling function's responsibility to send the column and column list in the proper case.
-             By default the lookup is case-sensitive. For a case-insensitive lookup,
-             send the column_name and df_columns list in lower case.
-
-         PARAMETERS:
-             column_name - Column name to check for.
-             df_columns - List of columns in which to check.
-
-         RETURNS:
-             True if the column exists, otherwise False.
-
-         EXAMPLES:
-             df = DataFrame.from_table('mytab')
-             metadata = _check_column_exists("col1", df.columns)
-         """
-         unquoted_df_columns = [column.replace('"', "") for column in df_columns]
-         if column_name.replace('"', "") in unquoted_df_columns:
-             return True
-         else:
-             return False
-
-     @staticmethod
-     def _validate_agg_function(func, col_names):
-         """
-         Internal function to validate column names against actual
-         column names passed as parameter, and aggregate operations
-         against valid aggregate operations.
-
-         PARAMETERS:
-             func - (Required) Specifies the function(s) to be
-                 applied on teradataml DataFrame columns.
-                 Acceptable formats for function(s) are string,
-                 dictionary or list of strings/functions.
-                 Accepted combinations are:
-                     1. String function name
-                     2. List of string functions
-                     3. Dictionary of column names -> string function
-                        (or list of string functions)
-             col_names - List. Names of the columns in the DataFrame.
-
-         RETURNS:
-             operations - dict of columns -> aggregate operations
-                 Unified dictionary, similar to func, even for string and
-                 list of strings or functions.
-
-         RAISES:
-             1. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
-                operation(s) received in parameter 'func' is/are
-                invalid.
-
-                Possible Value :
-                Invalid aggregate operation(s): minimum, counter.
-                Valid aggregate operation(s): count, max, mean, min,
-                std, sum.
-
-             2. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
-                specified in 'func' is not present in the dataframe.
-
-                Possible Value :
-                Invalid column(s) given in parameter func: col1.
-                Valid column(s) : A, B, C, D.
-
-         EXAMPLES:
-             Let the dataframe contain 2 columns, col1 and col2.
-
-             VALID EXAMPLES:
-                 1. operations = DataFrameUtils._validate_agg_function(
-                        'mean', ['col1', 'col2'])
-
-                 2. operations = DataFrameUtils._validate_agg_function(
-                        ['mean', 'min'], ['col1', 'col2'])
-
-                 3. operations = DataFrameUtils._validate_agg_function(
-                        {'col1' : ['mean', 'min'], 'col2' : 'count'},
-                        ['col1', 'col2'])
-
-             INVALID EXAMPLES:
-                 1. operations = DataFrameUtils._validate_agg_function(
-                        'counter', ['col1', 'col2'])
-
-                 2. operations = DataFrameUtils._validate_agg_function(
-                        {'col1' : ['mean', 'min'], 'col55' : 'count'},
-                        ['col1', 'col2'])
-         """
-         operations = OrderedDict()
-
-         valid_aggregate_operations = UtilFuncs._get_valid_aggregate_operations()
-
-         if isinstance(func, str):
-             for column in col_names:
-                 operations[column] = [func]
-         elif isinstance(func, list):
-             for column in col_names:
-                 operations[column] = func
-         else:
-             for column in func:
-                 if isinstance(func[column], str):
-                     func[column] = [func[column]]  # Converts a string inside the dict to a list
-             operations = func
-
-         given_columns = operations.keys()
-         invalid_columns = []
-         all_operations = []
-         for col in given_columns:
-             all_operations.extend(operations[col])
-             if col not in col_names:
-                 invalid_columns.append(col)
-         if len(invalid_columns) > 0:  # If any of the columns specified is not present in the dataframe
-             col_names.sort()
-             invalid_columns.sort()
-             msg = Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN). \
-                 format(", ".join(invalid_columns), 'func', ", ".join(col_names))
-             raise TeradataMlException(msg, MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN)
-
-         all_operations = list(set(all_operations))
-         invalid_aggregates = []
-         for operation in all_operations:
-             if operation not in valid_aggregate_operations \
-                     and operation not in UtilFuncs._get_valid_time_series_aggregate_operations():
-                 invalid_aggregates.append(operation)
-         if len(invalid_aggregates) > 0:  # If any of the aggregate operations specified is not valid
-             # To raise the error message, let's add the other time series aggregate operations that can be
-             # used with the DataFrame.agg() method.
-             valid_aggregate_operations = valid_aggregate_operations + ['first', 'last', 'mode']
-             valid_aggregate_operations.sort()
-             invalid_aggregates.sort()
-             msg = Messages.get_message(MessageCodes.TDMLDF_INVALID_AGGREGATE_OPERATION). \
-                 format(", ".join(invalid_aggregates), ", ".join(valid_aggregate_operations))
-             raise TeradataMlException(msg, MessageCodes.TDMLDF_INVALID_AGGREGATE_OPERATION)
-
-         return operations
-
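A condensed restatement of the normalization performed above, showing how every accepted shape of 'func' collapses to a column -> list-of-operations mapping (validation omitted; sketch only):

    from collections import OrderedDict

    def normalize_agg_sketch(func, col_names):
        if isinstance(func, str):
            return OrderedDict((c, [func]) for c in col_names)
        if isinstance(func, list):
            return OrderedDict((c, list(func)) for c in col_names)
        # dict: wrap any bare string operation into a single-item list
        return OrderedDict((c, [ops] if isinstance(ops, str) else list(ops))
                           for c, ops in func.items())

    # normalize_agg_sketch('mean', ['col1', 'col2'])
    #     -> {'col1': ['mean'], 'col2': ['mean']}
    # normalize_agg_sketch({'col1': ['mean', 'min'], 'col2': 'count'}, ['col1', 'col2'])
    #     -> {'col1': ['mean', 'min'], 'col2': ['count']}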
664
- @staticmethod
665
- def _generate_aggregate_column_expression(df, column, operation, describe_op, tdp, **kwargs):
666
- """
667
- Function generate the aggregate column expression for the provided column
668
- and aggregate function.
669
-
670
- PARAMETERS:
671
- df:
672
- Required Argument.
673
- Specifies teradataml DataFrame which is to be used to get the
674
- desired aggregate column expression.
675
- Types: teradataml DataFrame
676
-
677
- column:
678
- Required Argument.
679
- Specifies the column name for which desired aggregate operation is
680
- to be used.
681
- Types: str
682
-
683
- operation:
684
- Required Argument.
685
- Specifies the aggregate operation.
686
- Types: str
687
-
688
- describe_op:
689
- Required Argument.
690
- Specifies a boolean flag, that will decide whether the aggregate
691
- operation is being performed for DataFrame.describe() or not.
692
- Types: bool
693
-
694
- tdp:
695
- Required Argument.
696
- Specifies a TeradataIdentifierPreparer object. It is required for
697
- quoting.
698
- Types: TeradataIdentifierPreparer
699
-
700
- kwargs:
701
- Specifies miscellaneous keyword arguments that can be passed to
702
- aggregate functions.
703
-
704
- RAISES:
705
- AttributeError - In case ColumnExpression does not have desired aggregate
706
- function implemnted.
707
-
708
- RETURNS:
709
- A boolean stating whether column is supported or not, New column name,
710
- New column type, A string representing column aggregate expression,
711
- invalid column information in case column has unsupported type for an
712
- aggregate operation.
713
-
714
- EXAMPLES:
715
- column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str = \
716
- DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=func,
717
- describe_op=describe_op, percentile=percentile,
718
- tdp=tdp, **kwargs)
719
- """
720
- try:
721
- key_to_process = ""
722
- # quote column names same as that of the Teradata reserved keywords.
723
- if "sort_columns" in kwargs:
724
- key_to_process = "sort_columns"
725
- elif "sort_column" in kwargs:
726
- key_to_process = "sort_column"
727
-
728
- if key_to_process:
729
- quoted_columns = UtilFuncs._process_for_teradata_keyword(kwargs[key_to_process])
730
- kwargs[key_to_process] = quoted_columns
731
-
732
- func_expression = getattr(df[column], operation)(describe_op=describe_op, **kwargs)
733
- new_column_name = column if describe_op else "{1}_{0}".format(column, operation)
734
- # column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str
735
- return True, new_column_name, NUMBER() if describe_op else func_expression.type, \
736
- func_expression.compile_label(new_column_name), None
737
- except AttributeError:
738
- # We are here means, provided operation is invalid and is not supported.
739
- # This if for internal purpose only.
740
- # Validation of operations for "agg" should be done in "agg" only.
741
- raise RuntimeError("Invalid aggregate function: {}".format(operation))
742
- except RuntimeError:
743
- # We are here means, column does not support the provided operation.
744
- # We will ignore this and add the column to invalid column list.
745
- # invalid_columns[operation].append("({0} - {1})".format(column, column_type)) OR
746
- # We will raise Generic message, mentioning DF does not have any column with type
747
- # supported to perform an operation.
748
- if describe_op:
749
- return True, tdp.quote(column), NUMBER(), 'null as {}'.format(tdp.quote(column)), None
750
- else:
751
- return False, None, None, None, "({0} - {1})".format(column, df[column].type)
752
- except Exception:
753
- raise
754
-
755
-     @staticmethod
-     def _construct_sql_expression_for_aggregations(df, column_names, column_types, func, percentile=.5,
-                                                    describe_op=False, **kwargs):
-         """
-         Internal function to create and return the SQL expression
-         corresponding to the given operation, column_names and
-         column_types.
-
-         Column_types are used to check whether all the datatypes are
-         valid types for the given operation; an exception is thrown if they
-         are not.
-
-         PARAMETERS:
-             df:
-                 Required Argument.
-                 Specifies the teradataml DataFrame which is to be used to get the desired
-                 aggregate column expression.
-                 Types: teradataml DataFrame
-
-             column_names:
-                 Required Argument.
-                 Specifies the column names for which the desired aggregate operation is
-                 to be executed.
-                 Types: List of strings
-
-             column_types:
-                 Required Argument.
-                 Specifies the respective column types for the column names.
-                 Types: List of teradatasqlalchemy types
-
-             func:
-                 Required Argument.
-                 Specifies the aggregate function(s) to be applied on teradataml
-                 DataFrame columns.
-                 Types: string, dictionary or list of strings/functions.
-                 Accepted combinations are:
-                     1. String function name
-                     2. List of functions
-                     3. Dictionary containing column name as key and aggregate
-                        function name (string or list of strings) as value
-
-             percentile:
-                 Optional Argument.
-                 Specifies a value between 0 and 1 that can only be used with func = 'percentile'.
-                 The default is .5, which returns the 50th percentile.
-                 Types: float
-
-             describe_op:
-                 Optional Argument.
-                 Specifies a boolean flag that decides whether the aggregate operation being
-                 performed is for DataFrame.describe() or not.
-                 Types: bool
-
-             kwargs:
-                 Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
-
-         RETURNS:
-             a) SQL expression, such as
-                1. 'min(col1) as min_col1, min(col2) as min_col2' if
-                   col1 and col2 are the columns in the DataFrame and the
-                   operation is 'min'
-                2. 'max(col1) as max_col1, max(col2) as max_col2' if
-                   col1 and col2 are the columns in the DataFrame and the
-                   operation is 'max'
-                3. 'min(col1) as min_col1, stddev_samp(col2) as
-                   std_col2' if col1, col2 are the columns in the
-                   DataFrame and the operations are min, std.
-                etc...
-             b) new columns' names (e.g. min_col1, min_col2 ...)
-             c) new columns' types
-
-         RAISES:
-             TeradataMLException
-             1. TDMLDF_AGGREGATE_COMBINED_ERR - If the provided
-                aggregate operations do not support specified columns.
-
-                Possible Value:
-                No results. Below is/are the error message(s):
-                All selected columns [(col1 - VARCHAR)] is/are
-                unsupported for 'sum' operation.
-
-             2. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
-                operation(s) received in parameter 'func' is/are
-                invalid.
-
-                Possible Value:
-                Invalid aggregate operation(s): minimum, counter.
-                Valid aggregate operation(s): count, max, mean, min,
-                std, sum.
-
-             3. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
-                specified in func is not present in the dataframe.
-
-                Possible Value:
-                Invalid column(s) given in parameter func: col1.
-                Valid column(s): A, B, C, D.
-
-         EXAMPLES:
-             col_names, col_types = \
-                 df_utils._get_column_names_and_types_from_metaexpr(
-                     self._metaexpr)
-             expr, new_col_names, new_col_types = \
-                 df_utils._construct_sql_expression_for_aggregations(
-                     df, col_names, col_types, 'min')
-
-             expr1, new_col_names1, new_col_types1 = \
-                 df_utils._construct_sql_expression_for_aggregations(
-                     df, col_names, col_types, ['min', 'sum'])
-
-             expr2, new_col_names2, new_col_types2 = \
-                 df_utils._construct_sql_expression_for_aggregations(
-                     df, col_names, col_types, {'col1' : ['min', 'sum'],
-                     'col2' : 'mean'})
-
-         """
-
-         # e.g. of column_types: [VARCHAR(length=13), INTEGER(), VARCHAR(length=60), VARCHAR(length=5),
-         #                        FLOAT(precision=0)]
-
-         # e.g. the types of each column are <class 'teradatasqlalchemy.types.VARCHAR'>,
-         # <class 'teradatasqlalchemy.types.INTEGER'>, <class 'teradatasqlalchemy.types.FLOAT'>,
-         # <class 'teradatasqlalchemy.types.INTERVAL_MINUTE_TO_SECOND'> etc..
-
-         # If the function is a time series aggregate, we process the aggregation differently.
-         if not isinstance(func, str):
-             # If func is not an instance of string, the call is from DataFrame.agg()
-             # and is made to process multiple functions.
-             # We process this differently, as we need to map and serialize the
-             # column names and the aggregate functions that operate on them.
-             # If we have just one function to be executed on the complete DataFrame, then we don't need
-             # this extra processing. Also, if the call is from DataFrame.agg(), the time series aggregate
-             # check is not required, as special Time Series aggregate functions cannot be used in
-             # DataFrame.agg().
-             return DataFrameUtils._construct_sql_expression_for_aggregations_for_agg(df, column_names, column_types,
-                                                                                      func, percentile, describe_op,
-                                                                                      **kwargs)
-
-         as_time_series_aggregate = False
-         if "as_time_series_aggregate" in kwargs.keys():
-             as_time_series_aggregate = kwargs["as_time_series_aggregate"]
-
-         if as_time_series_aggregate and func in ['bottom', 'bottom with ties', 'delta_t', 'mad', 'top',
-                                                  'top with ties']:
-             return DataFrameUtils._construct_sql_expression_for_time_series_aggregations(df, column_names,
-                                                                                          column_types, func, **kwargs)
-
-         tdp = preparer(td_dialect)
-
-         # This variable is used to decide whether the DataFrame has all columns unsupported
-         # for the provided operations.
-         all_unsupported_columns = True
-         valid_columns = []
-         invalid_columns = []
-         new_column_names = []
-         new_column_types = []
-         for column in column_names:
-             column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str = \
-                 DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=func,
-                                                                      describe_op=describe_op, percentile=percentile,
-                                                                      tdp=tdp, **kwargs)
-
-             if column_supported:
-                 all_unsupported_columns = False
-                 new_column_names.append(new_column_name)
-                 new_column_types.append(new_column_type)
-                 valid_columns.append(column_aggr_expr)
-             else:
-                 invalid_columns.append("({0} - {1})".format(column, df[column].type))
-
-         if all_unsupported_columns:
-             error_msgs = []
-             invalid_columns.sort()  # Helps in catching the columns in lexicographic order
-             error = MessageCodes.TDMLDF_AGGREGATE_UNSUPPORTED.value.format(", ".join(invalid_columns),
-                                                                            func)
-             error_msgs.append(error)
-
-             if len(valid_columns) == 0:  # No supported columns in the given list of columns
-                 raise TeradataMlException(Messages.get_message(
-                     MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs)),
-                     MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
-
-         # Quote column names same as that of the Teradata reserved keywords.
-         quote_column_name = [UtilFuncs._process_for_teradata_keyword(col) for col in column_names]
-
-         # Actual columns should be retained if "drop_columns" is set to False.
-         if kwargs.get("drop_columns") is False:
-             valid_columns = quote_column_name + valid_columns
-             new_column_names = column_names + new_column_names
-             new_column_types = column_types + new_column_types
-
-         aggregate_expr = ", ".join(valid_columns)
-         return aggregate_expr, new_column_names, new_column_types
-
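
The assembly this helper performs can be illustrated standalone. The following is a minimal sketch, not the teradataml implementation; the names build_aggregate_select and SQL_FUNC_MAP are hypothetical. It only shows how per-column expressions of the form func("col") as "func_col" are joined into the comma-separated aggregate_expr returned above.

    # Simplified illustration of the expression assembly; not the teradataml implementation.
    SQL_FUNC_MAP = {"mean": "avg", "std": "stddev_samp", "min": "min", "max": "max", "sum": "sum"}

    def build_aggregate_select(columns, func):
        """Return ('avg("a") as "mean_a", ...', ['mean_a', ...]) for the given columns."""
        sql_func = SQL_FUNC_MAP[func]
        exprs, new_names = [], []
        for col in columns:
            new_name = "{0}_{1}".format(func, col)
            exprs.append('{0}("{1}") as "{2}"'.format(sql_func, col, new_name))
            new_names.append(new_name)
        return ", ".join(exprs), new_names

    expr, names = build_aggregate_select(["Feb", "Jan"], "mean")
    # expr == 'avg("Feb") as "mean_Feb", avg("Jan") as "mean_Jan"'
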
-     @staticmethod
-     def _construct_sql_expression_for_aggregations_for_agg(df, column_names, column_types, func, percentile=.5,
-                                                            describe_op=False, **kwargs):
-         """
-         Internal function to create and return the SQL expression
-         corresponding to the given operation, column_names and
-         column_types.
-
-         Column_types are used to check whether all the datatypes are
-         valid types for the given operation; an exception is thrown if they
-         are not.
-
-         PARAMETERS:
-             df:
-                 Required Argument.
-                 Specifies the teradataml DataFrame which is to be used to get the desired
-                 aggregate column expression.
-                 Types: teradataml DataFrame
-
-             column_names:
-                 Required Argument.
-                 Specifies the column names for which the desired aggregate operation is
-                 to be executed.
-                 Types: List of strings
-
-             column_types:
-                 Required Argument.
-                 Specifies the respective column types for the column names.
-                 Types: List of teradatasqlalchemy types
-
-             func:
-                 Required Argument.
-                 Specifies the aggregate function(s) to be applied on teradataml
-                 DataFrame columns.
-                 Types: string, dictionary or list of strings/functions.
-                 Accepted combinations are:
-                     1. String function name
-                     2. List of functions
-                     3. Dictionary containing column name as key and aggregate
-                        function name (string or list of strings) as value
-
-             percentile:
-                 Optional Argument.
-                 Specifies a value between 0 and 1 that can only be used with func = 'percentile'.
-                 The default is .5, which returns the 50th percentile.
-                 Types: float
-
-             describe_op:
-                 Optional Argument.
-                 Specifies a boolean flag that decides whether the aggregate operation being
-                 performed is for DataFrame.describe() or not.
-                 Types: bool
-
-             kwargs:
-                 Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
-
-         RETURNS:
-             a) SQL expression, such as
-                1. 'min(col1) as min_col1, min(col2) as min_col2' if
-                   col1 and col2 are the columns in the DataFrame and the
-                   operation is 'min'
-                2. 'max(col1) as max_col1, max(col2) as max_col2' if
-                   col1 and col2 are the columns in the DataFrame and the
-                   operation is 'max'
-                3. 'min(col1) as min_col1, stddev_samp(col2) as
-                   std_col2' if col1, col2 are the columns in the
-                   DataFrame and the operations are min, std.
-                etc...
-             b) new columns' names (e.g. min_col1, min_col2 ...)
-             c) new columns' types
-
-         RAISES:
-             TeradataMLException
-             1. TDMLDF_AGGREGATE_COMBINED_ERR - If the provided
-                aggregate operations do not support specified columns.
-
-                Possible Value:
-                No results. Below is/are the error message(s):
-                All selected columns [(col1 - VARCHAR)] is/are
-                unsupported for 'sum' operation.
-
-             2. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
-                operation(s) received in parameter 'func' is/are
-                invalid.
-
-                Possible Value:
-                Invalid aggregate operation(s): minimum, counter.
-                Valid aggregate operation(s): count, max, mean, min,
-                std, sum.
-
-             3. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
-                specified in func is not present in the dataframe.
-
-                Possible Value:
-                Invalid column(s) given in parameter func: col1.
-                Valid column(s): A, B, C, D.
-
-         EXAMPLES:
-             col_names, col_types = \
-                 df_utils._get_column_names_and_types_from_metaexpr(
-                     self._metaexpr)
-             expr, new_col_names, new_col_types = \
-                 df_utils._construct_sql_expression_for_aggregations_for_agg(
-                     df, col_names, col_types, 'min')
-
-             expr1, new_col_names1, new_col_types1 = \
-                 df_utils._construct_sql_expression_for_aggregations_for_agg(
-                     df, col_names, col_types, ['min', 'sum'])
-
-             expr2, new_col_names2, new_col_types2 = \
-                 df_utils._construct_sql_expression_for_aggregations_for_agg(
-                     df, col_names, col_types, {'col1' : ['min', 'sum'],
-                     'col2' : 'mean'})
-
-         """
-         # If the function is a time series aggregate, we process the aggregation differently.
-         # Also, one is not supposed to pass the below time series aggregates to DataFrame.agg():
-         #     ['bottom', 'bottom with ties', 'delta_t', 'mad', 'top', 'top with ties']
-         # Thus, no extra processing is required for time series aggregates over here.
-
-         # 'operations' contains a dict of columns -> list of aggregate operations
-         operations = DataFrameUtils._validate_agg_function(func, column_names)
-
-         all_valid_columns = []
-         all_invalid_columns = {}
-         all_new_column_names = []
-         all_new_column_types = []
-
-         # For each column, the value is True if there is at least one valid operation (operation on valid datatype)
-         column_supported = {}
-         tdp = preparer(td_dialect)
-         for column in operations:
-             column_supported[column] = False
-             valid_columns = []
-             invalid_columns = {}
-             new_column_names = []
-             new_column_types = []
-             for operation in operations[column]:
-                 is_colop_supported, new_col, new_coltype, column_aggr_expr, invalid_column_info = \
-                     DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=operation,
-                                                                          describe_op=describe_op, percentile=percentile,
-                                                                          tdp=tdp, **kwargs)
-                 if is_colop_supported:
-                     column_supported[column] = is_colop_supported
-                     new_column_names.append(new_col)
-                     new_column_types.append(new_coltype)
-                     valid_columns.append(column_aggr_expr)
-                 else:
-                     if operation in invalid_columns:
-                         invalid_columns[operation].append(invalid_column_info)
-                     else:
-                         invalid_columns[operation] = [invalid_column_info]
-
-             all_valid_columns.extend(valid_columns)
-             all_new_column_names.extend(new_column_names)
-             all_new_column_types.extend(new_column_types)
-
-             for operation in invalid_columns:
-                 if operation in all_invalid_columns:
-                     all_invalid_columns[operation].extend(invalid_columns[operation])
-                 else:
-                     all_invalid_columns[operation] = invalid_columns[operation]
-
-         unsupported_columns = [col for col in column_supported if not column_supported[col]]
-         unsupported_columns.sort()  # Helps in catching the columns in lexicographic order
-
-         error_msgs = []
-         for operation in sorted(all_invalid_columns):
-             all_invalid_columns[operation].sort()  # Helps in catching the columns in
-                                                    # lexicographic order
-             error = MessageCodes.TDMLDF_AGGREGATE_UNSUPPORTED.value.format(
-                 ", ".join(all_invalid_columns[operation]), operation)
-             error_msgs.append(error)
-
-         if not all(column_supported[oper] for oper in column_supported):
-             new_msg = MessageCodes.TDMLDF_AGGREGATE_AGG_DICT_ERR.value.format(", ".join(unsupported_columns))
-             error_msgs.append(new_msg)
-             msg = Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs))
-             raise TeradataMlException(msg, MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
-
-         elif len(all_valid_columns) == 0:  # No supported columns in the given list of columns
-             raise TeradataMlException(Messages.get_message(
-                 MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs)),
-                 MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
-
-         aggregate_expr = ", ".join(all_valid_columns)
-         return aggregate_expr, all_new_column_names, all_new_column_types
-
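
DataFrame.agg() relies on _validate_agg_function (shown later in this diff) to unify the three accepted shapes of func into a dictionary of column -> list of operations. A minimal sketch of that normalization, assuming only the three documented shapes of func, might look like:

    # Hypothetical sketch of the func normalization; teradataml performs this
    # inside _validate_agg_function along with validation.
    def normalize_func(func, column_names):
        """Return a dict mapping each column to a list of operation names."""
        if isinstance(func, str):
            return {col: [func] for col in column_names}
        if isinstance(func, list):
            return {col: list(func) for col in column_names}
        # dict: values may be a single name or a list of names
        return {col: ([ops] if isinstance(ops, str) else list(ops))
                for col, ops in func.items()}

    normalize_func({'col1': ['min', 'sum'], 'col2': 'mean'}, ['col1', 'col2'])
    # {'col1': ['min', 'sum'], 'col2': ['mean']}
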
-     @staticmethod
-     def _construct_sql_expression_for_time_series_aggregations(df, column_names, column_types, func, **kwargs):
-         """
-         Internal function to create and return the SQL expression
-         corresponding to the given time series function, column_names and
-         column_types.
-
-         Column_types are used to check whether all the datatypes are
-         valid types for the given operation; an exception is thrown if they
-         are not.
-
-         NOTE:
-             This function should be used only for time series aggregates.
-
-         PARAMETERS:
-             df:
-                 Required Argument.
-                 Specifies the teradataml DataFrame which is to be used to get the desired
-                 aggregate column expression.
-                 Types: teradataml DataFrame
-
-             column_names:
-                 Required Argument.
-                 Specifies the column names for which the desired aggregate operation is
-                 to be executed.
-                 Types: List of strings
-
-             column_types:
-                 Required Argument.
-                 Specifies the respective column types for the column names.
-                 Types: List of teradatasqlalchemy types
-
-             func:
-                 Required Argument.
-                 Specifies the aggregate function(s) to be applied on teradataml
-                 DataFrame columns. For Time Series aggregates it is usually a string.
-                 Types: str
-
-             kwargs:
-                 Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
-
-         RETURNS:
-             a) SQL expression, such as
-                1. 'bottom(2, "col1") as "bottom2col1"' if
-                   col1 and col2 are the columns in the DataFrame and the
-                   operation is 'bottom'
-                etc...
-             b) new columns' names (e.g. bottom2col1 ...)
-             c) new columns' types
-
-         RAISES:
-             None.
-
-         EXAMPLES:
-             colname_to_numvalues = {"col1" : 2, "col2": 3}
-             kwargs = {"colname_to_numvalues": colname_to_numvalues}
-             aggregate_expr, column_names, column_types = \
-                 df_utils._construct_sql_expression_for_time_series_aggregations(df, column_names, column_types,
-                                                                                 func, **kwargs)
-
-         """
-
-         # e.g. of column_types: [VARCHAR(length=13), INTEGER(), VARCHAR(length=60), VARCHAR(length=5),
-         #                        FLOAT(precision=0)]
-
-         # e.g. the types of each column are <class 'teradatasqlalchemy.types.VARCHAR'>,
-         # <class 'teradatasqlalchemy.types.INTEGER'>, <class 'teradatasqlalchemy.types.FLOAT'>,
-         # <class 'teradatasqlalchemy.types.INTERVAL_MINUTE_TO_SECOND'> etc..
-
-         col_names_and_types = dict(zip(column_names, column_types))
-         tdp = preparer(td_dialect)
-
-         select_columns = []
-         new_column_names = []
-         new_column_types = []
-         if func in ["bottom", "bottom with ties", "top", "top with ties"]:
-             # Processing for bottom and top.
-             # Function name to be used in column aliasing.
-             column_alias_func = func.replace(" ", "_")
-             bottom_col_val = kwargs["colname_to_numvalues"]
-             for column in sorted(list(bottom_col_val.keys())):
-                 new_col_name = "{2}{0}{1}".format(bottom_col_val[column], column, column_alias_func)
-                 quoted_parent_column_name = tdp.quote("{0}".format(column))
-                 quoted_new_column_name = tdp.quote(new_col_name)
-                 select_columns.append("{0}({1}, {2}) as {3}".format(func, bottom_col_val[column],
-                                                                     quoted_parent_column_name, quoted_new_column_name))
-                 new_column_names.append(new_col_name)
-                 new_column_types.append(col_names_and_types[column])
-
-         if func == "delta_t":
-             # Argument processing for DELTA-T
-             new_column_names.append("delta_t_td_timecode")
-             quoted_new_column_name = tdp.quote(new_column_names[0])
-             new_column_types.append(PERIOD_TIMESTAMP)
-             select_columns.append("{0}((WHERE {1}), (WHERE {2})) as {3}".format(func, kwargs["start_condition"],
-                                                                                 kwargs["end_condition"],
-                                                                                 quoted_new_column_name))
-
-         if func == 'mad':
-             # Processing for Median Absolute Deviation.
-             # Function name to be used in column aliasing.
-             column_alias_func = func.replace(" ", "_")
-             bottom_col_val = kwargs["colname_to_numvalues"]
-             for column in sorted(list(bottom_col_val.keys())):
-                 new_col_name = "{2}{0}{1}".format(bottom_col_val[column], column, column_alias_func)
-                 quoted_parent_column_name = tdp.quote("{0}".format(column))
-                 quoted_new_column_name = tdp.quote(new_col_name)
-                 select_columns.append("{0}({1}, {2}) as {3}".format(func, bottom_col_val[column],
-                                                                     quoted_parent_column_name, quoted_new_column_name))
-                 new_column_names.append(new_col_name)
-                 if type(col_names_and_types[column]) in [DECIMAL, NUMBER]:
-                     # If the column type is DECIMAL or NUMBER, then the output column type should also be the same.
-                     # Otherwise, it is FLOAT.
-                     new_column_types.append(col_names_and_types[column])
-                 else:
-                     new_column_types.append(FLOAT())
-
-         if "default_constant_for_columns" in kwargs.keys():
-             column_names = kwargs["default_constant_for_columns"]
-             column_types = [col_names_and_types[column] for column in column_names]
-             if len(column_names) > 0:
-                 aggregate_expr, all_new_column_names, all_new_column_types = \
-                     DataFrameUtils._construct_sql_expression_for_aggregations(df=df, column_names=column_names,
-                                                                               column_types=column_types, func=func,
-                                                                               )
-                 aggregate_expr_default_column_list = [col.strip() for col in aggregate_expr.split(",")]
-                 select_columns = select_columns + aggregate_expr_default_column_list
-                 new_column_names = new_column_names + all_new_column_names
-                 new_column_types = new_column_types + all_new_column_types
-
-         aggregate_expr = ", ".join(select_columns)
-         return aggregate_expr, new_column_names, new_column_types
-
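
A condensed, standalone illustration of the 'bottom'/'top' expression construction above (illustrative only; quoting via tdp.quote is replaced with literal double quotes), for func = "bottom" and kwargs = {"colname_to_numvalues": {"col1": 2}}:

    func = "bottom"
    colname_to_numvalues = {"col1": 2}
    select_columns = []
    for col in sorted(colname_to_numvalues):
        n = colname_to_numvalues[col]
        alias = "{0}{1}{2}".format(func.replace(" ", "_"), n, col)
        select_columns.append('{0}({1}, "{2}") as "{3}"'.format(func, n, col, alias))
    # select_columns == ['bottom(2, "col1") as "bottom2col1"']
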
-     @staticmethod
-     def _construct_describe_query(df, metaexpr, percentiles, function_label, groupby_column_list=None,
-                                   include=None, is_time_series_aggregate=False, verbose=False, distinct=False,
-                                   statistics=None, **kwargs):
-         """
-         Internal function to create the SQL query for describe().
-
-         PARAMETERS:
-             df:
-                 Required Argument.
-                 Specifies the teradataml DataFrame we are collecting statistics for.
-                 Types: teradataml DataFrame
-
-             metaexpr:
-                 Required Argument.
-                 Specifies the meta expression for the dataframe.
-                 Types: _MetaExpression
-
-             percentiles:
-                 Required Argument.
-                 Specifies a list of values between 0 and 1.
-                 Types: List of floats
-
-             function_label:
-                 Required Argument.
-                 Specifies a string value used as the label for the aggregate function column.
-                 Types: str
-
-             groupby_column_list:
-                 Optional Argument.
-                 Specifies the group by columns for the dataframe.
-                 Default Values: None.
-                 Types: str or List of strings (str)
-
-             include:
-                 Optional Argument.
-                 Specifies a string that must be "all" or None. If "all", then all columns will be included.
-                 Otherwise, only numeric columns are used for collecting statistics.
-                 Default Values: None.
-                 Types: str
-
-             is_time_series_aggregate:
-                 Optional Argument.
-                 Specifies a flag stating whether the describe operation is a time series aggregate or not.
-                 Default Values: False.
-                 Types: bool
-
-             verbose:
-                 Optional Argument.
-                 Specifies a flag stating whether the DESCRIBE VERBOSE option for time series aggregate is to be
-                 performed or not.
-                 Default Values: False.
-                 Types: bool
-
-             distinct:
-                 Optional Argument.
-                 Specifies a flag that decides whether to consider duplicate rows in the calculation or not.
-                 Default Values: False
-                 Types: bool
-
-             statistics:
-                 Optional Argument.
-                 Specifies the list of aggregate operations to be used in place of the default
-                 operators. Used only when include is None.
-                 Default Values: None.
-                 Types: list of str
-
-             kwargs:
-                 Optional Arguments.
-                 Keyword arguments for time series aggregate functions.
-
-         RETURNS:
-             A SQL query like:
-                 select 'count' as "func", cast(count("Feb") as Number) as "Feb", cast(count(accounts) as Number) as accounts from "PYUSER"."salesview"
-                 union all
-                 select 'mean' as "func", cast(avg("Feb") as Number) as "Feb", null as accounts from "PYUSER"."salesview"
-                 union all
-                 select 'std' as "func", cast(stddev_samp("Feb") as Number) as "Feb", null as accounts from "PYUSER"."salesview"
-                 union all
-                 select 'min' as "func", cast(min("Feb") as Number) as "Feb", cast(min(accounts) as Number) as accounts from "PYUSER"."salesview"
-                 union all
-                 select '25%' as "func", percentile_cont(0.25) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
-                 union all
-                 select '50%' as "func", percentile_cont(0.5) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
-                 union all
-                 select '75%' as "func", percentile_cont(0.75) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
-                 union all
-                 select 'max' as "func", cast(max("Feb") as Number) as "Feb", cast(max(accounts) as Number) as accounts from "PYUSER"."salesview"
-
-         RAISES:
-             TeradataMLException
-
-         EXAMPLES:
-             agg_query = \
-                 df_utils._construct_describe_query(df, df._metaexpr, [.25, .5, .75], "func", groupby_column_list)
-             agg_query = \
-                 df_utils._construct_describe_query(df, df._metaexpr, [.3, .6], "func", groupby_column_list, include="all")
-
-         """
-         table_name = df._table_name
-         operators = ["count", "mean", "std", "min", "percentile", "max"]
-         all_operators = ["count", "unique", "mean", "std", "min", "percentile", "max"]
-
-         if is_time_series_aggregate and verbose:
-             # Time Series Aggregate Operators for Vantage DESCRIBE function with verbose
-             operators = ['max', 'mean', 'median', 'min', 'mode', "percentile", 'std']
-         elif is_time_series_aggregate and not verbose:
-             # Time Series Aggregate Operators for Vantage DESCRIBE function.
-             operators = ['max', 'mean', 'min', 'std']
-
-         col_names = []
-         col_types = []
-         sel_agg_stmts = []
-         tdp = preparer(td_dialect)
-         quoted_function_label = tdp.quote(function_label)
-
-         if include is not None and include == 'all' and not is_time_series_aggregate:
-             operators = all_operators
-
-         if include is None and statistics is not None:
-             operators = statistics
-
-         table_name, sel_groupby, groupby = DataFrameUtils()._process_groupby_clause(table_name, groupby_column_list,
-                                                                                     is_time_series_aggregate, **kwargs)
-
-         for col in metaexpr.c:
-             if (include is None and type(col.type) in UtilFuncs()._get_numeric_datatypes()) or include == 'all' or statistics is not None:
-                 if not (groupby is not None and col.name in groupby_column_list):
-                     col_names.append(col.name)
-                     col_types.append(col.type)
-
-         if len(col_names) == 0:
-             raise TeradataMlException(
-                 Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR,
-                                      "The DataFrame does not contain numeric columns"),
-                 MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
-
-         for op in operators:
-             if op == "percentile":
-                 for p in percentiles:
-                     agg_expr, new_col_names, new_col_types = \
-                         DataFrameUtils._construct_sql_expression_for_aggregations(df,
-                             col_names, col_types, op, percentile=p, describe_op=True, distinct=distinct,
-                             as_time_series_aggregate=is_time_series_aggregate)
-                     sel_agg_stmts.append("SELECT \n\t{4} \n\tcast('{0}%' as varchar(6)) as \"{1}\", {2} from {3} ".format(
-                         int(p*100), quoted_function_label, agg_expr, table_name, sel_groupby))
-             else:
-                 agg_expr, new_col_names, new_col_types = \
-                     DataFrameUtils._construct_sql_expression_for_aggregations(df,
-                         col_names, col_types, op, describe_op=True, distinct=distinct,
-                         as_time_series_aggregate=is_time_series_aggregate)
-                 sel_agg_stmts.append("SELECT \n\t{4} \n\tcast('{0}' as varchar(6)) as \"{1}\", \n\t{2} \nfrom \n\t{3} ".format(
-                     op, quoted_function_label, agg_expr, table_name, sel_groupby))
-         return " \nunion all\n ".join(sel_agg_stmts)
-
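
The stitching of one SELECT per statistic into a single UNION ALL query can be illustrated standalone. This is a simplified, hypothetical skeleton (a single hard-coded column and table, and only the cast-based branch), not the actual implementation:

    # Illustrative skeleton of the describe-query assembly above.
    stats = ["count", "mean", "min", "max"]
    table_name = '"PYUSER"."salesview"'   # hypothetical table
    selects = []
    for op in stats:
        sql_func = "avg" if op == "mean" else op
        agg_expr = 'cast({0}("Feb") as Number) as "Feb"'.format(sql_func)
        selects.append('SELECT cast(\'{0}\' as varchar(6)) as "func", {1} from {2}'.format(
            op, agg_expr, table_name))
    query = " \nunion all\n ".join(selects)
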
-     @staticmethod
-     def _process_groupby_clause(table_name, groupby_column_list, is_time_series_aggregate, **kwargs):
-         """
-         Internal function used to process and generate the GROUP BY or GROUP BY TIME clause required for
-         the query to be run for the describe operation.
-
-         PARAMETERS:
-             table_name:
-                 Required Argument.
-                 Specifies the table name to be used for forming the describe query.
-                 Types: str
-
-             groupby_column_list:
-                 Required Argument.
-                 Specifies the list of column names involved in the Group By.
-                 Types: List of Strings.
-
-             is_time_series_aggregate:
-                 Required Argument.
-                 Specifies a boolean stating whether the GROUP BY clause to be formed is for a
-                 Time series aggregate or not.
-                 Types: bool
-
-             kwargs:
-                 Optional Arguments.
-                 Keyword arguments for time series aggregate functions.
-
-         RETURNS:
-             1. Table Name appended with the GROUP BY clause.
-             2. Column projection string for the GROUP BY columns.
-             3. Group By Clause.
-
-         RAISES:
-             None.
-
-         EXAMPLES:
-             table_name, sel_groupby, groupby = DataFrameUtils()._process_groupby_clause(table_name, groupby_column_list,
-                                                                                         is_time_series_aggregate, **kwargs)
-
-         """
-         sel_groupby = ""
-         grp_by_clause = None
-
-         if is_time_series_aggregate:
-             # For a time series aggregate, timebucket_duration is a must, so it will always be present in kwargs.
-             grp_by_clause = "GROUP BY TIME ({0}".format(kwargs['timebucket_duration'])
-
-             # Add columns in value expression to GROUP BY TIME
-             if 'value_expression' in kwargs and \
-                     kwargs['value_expression'] is not None and \
-                     len(kwargs['value_expression']) > 0:
-                 grp_by_clause = "{0} and {1}".format(grp_by_clause, ", ".join(kwargs['value_expression']))
-
-             # Complete the parenthesis for GROUP BY TIME
-             grp_by_clause = "{0})".format(grp_by_clause)
-
-             # Add Time code column information.
-             if 'timecode_column' in kwargs and \
-                     kwargs['timecode_column'] is not None and \
-                     len(kwargs['timecode_column']) > 0:
-                 if 'sequence_column' in kwargs and \
-                         kwargs['sequence_column'] is not None and \
-                         len(kwargs['sequence_column']) > 0:
-                     grp_by_clause = "{0} USING TIMECODE({1}, {2})".format(grp_by_clause, kwargs['timecode_column'],
-                                                                           kwargs['sequence_column'])
-                 else:
-                     grp_by_clause = "{0} USING TIMECODE({1})".format(grp_by_clause, kwargs['timecode_column'])
-
-             # Add Fill information
-             if 'fill' in kwargs and kwargs['fill'] is not None and len(kwargs['fill']) > 0:
-                 grp_by_clause = "{0} FILL({1})".format(grp_by_clause, kwargs['fill'])
-
-         else:
-             if groupby_column_list is not None:
-                 grp_by_clause = "GROUP BY {0}".format(",".join(groupby_column_list))
-
-         if grp_by_clause is not None:
-             table_name = "{0} \n{1}".format(table_name, grp_by_clause)
-             tdp = preparer(td_dialect)
-             for g in groupby_column_list:
-                 if is_time_series_aggregate:
-                     if g == "TIMECODE_RANGE":
-                         g = "$TD_TIMECODE_RANGE"
-
-                     if "GROUP BY TIME" in g:
-                         g = "$TD_GROUP_BY_TIME"
-
-                 quoted_name = tdp.quote(g)
-                 sel_groupby += "{0}, ".format(quoted_name)
-
-         return table_name, sel_groupby, grp_by_clause
-
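
Tracing the time series branch end to end helps: the clause is grown in place by repeated string formatting. A minimal sketch with hypothetical kwargs values:

    kwargs = {"timebucket_duration": "MINUTES(10)",
              "value_expression": ["region"],
              "timecode_column": "TD_TIMECODE",
              "fill": "NULLS"}
    clause = "GROUP BY TIME ({0}".format(kwargs["timebucket_duration"])
    if kwargs.get("value_expression"):
        clause = "{0} and {1}".format(clause, ", ".join(kwargs["value_expression"]))
    clause = "{0})".format(clause)
    if kwargs.get("timecode_column"):
        clause = "{0} USING TIMECODE({1})".format(clause, kwargs["timecode_column"])
    if kwargs.get("fill"):
        clause = "{0} FILL({1})".format(clause, kwargs["fill"])
    # clause == 'GROUP BY TIME (MINUTES(10) and region) USING TIMECODE(TD_TIMECODE) FILL(NULLS)'
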
-     @staticmethod
-     def _get_column_names_and_types_from_metaexpr(metaexpr):
-         """
-         Internal function to return column names and respective types
-         given _metaexpr.
-
-         PARAMETERS:
-             metaexpr:
-                 Required Argument.
-                 Dataframe's metaexpr. It is used to get column names and types.
-                 Types: MetaExpression
-
-         RETURNS:
-             Two lists - one for column names and another for column types
-
-         RAISES:
-             None
-
-         EXAMPLES:
-             dfUtils._get_column_names_and_types_from_metaexpr(
-                 df._metaexpr)
-         """
-         # Constructing New Column names & Types for selected columns ONLY using Parent _metaexpr
-         col_names = []
-         col_types = []
-         for c in metaexpr.c:
-             col_names.append(c.name)
-             col_types.append(c.type)
-
-         return col_names, col_types
-
-     @staticmethod
-     def _insert_all_from_table(to_table_name, from_table_name, column_list, schema_name,
-                                temporary=False):
-         """
-         Inserts all records from one table into the second, using columns ordered by the column list.
-
-         PARAMETERS:
-             to_table_name   - String specifying the name of the SQL table to insert to.
-             from_table_name - String specifying the name of the SQL table to insert from.
-             column_list     - List of strings specifying the column names used in the insertion.
-             schema_name     - Name of the database schema to insert table data into.
-             temporary       - Specifies whether to create Vantage tables as permanent or volatile.
-                               Default: False
-                               Note: When True:
-                                     1. volatile tables are created, and
-                                     2. schema_name is ignored.
-                               When False, permanent tables are created.
-
-         RETURNS:
-             None
-
-         RAISES:
-             Database error if an error occurred while executing the insert command.
-
-         EXAMPLES:
-             df_utils._insert_all_from_table('table1_name', 'table2_name', ['col1', 'col2', 'col3'], None)
-         """
-         tdp = preparer(td_dialect)
-
-         # Construct INSERT command.
-         column_order_string = ', '.join([tdp.quote("{0}".format(element)) for element in column_list])
-
-         if schema_name:
-             full_to_table_name = tdp.quote(schema_name) + "." + tdp.quote(to_table_name)
-         elif temporary:
-             full_to_table_name = tdp.quote(to_table_name)
-         else:
-             full_to_table_name = tdp.quote(_get_current_databasename()) + "." + tdp.quote(
-                 to_table_name)
-
-         insert_sql = SQLBundle._build_insert_from_table_query(full_to_table_name, from_table_name, column_order_string)
-
-         # Execute INSERT command.
-         return UtilFuncs._execute_ddl_statement(insert_sql)
-
-     @staticmethod
-     def _dataframe_has_column(data, column):
-         """
-         Function to check whether the given column name is present in the given DataFrame or not.
-         This function is currently used only for Analytics wrappers.
-
-         PARAMETERS:
-             data   - teradataml DataFrame to check against for column existence.
-             column - Column name (a string).
-
-         RAISES:
-             None
-
-         EXAMPLES:
-             DataFrameUtils._dataframe_has_column(data, col)
-         """
-         if column in [c.name for c in data._metaexpr.c]:
-             return True
-
-         return False
-
-     @staticmethod
-     def _get_row_count(table_name):
-         """
-         Function to return the row count of a teradataml Dataframe.
-         This function is used currently to determine the shape/size of a dataframe.
-
-         PARAMETERS:
-             table_name - Name of the table to get the row count for.
-
-         RAISES:
-             TeradataMlException (TDMLDF_INFO_ERROR)
-
-         EXAMPLES:
-             DataFrameUtils._get_row_count(table_name)
-         """
-         # Construct COUNT(*) Query
-         try:
-             row_count_query = SQLBundle._build_nrows_print_query(table_name)
-             res = execute_sql(row_count_query)
-             return res.fetchone()[0]
-
-         except TeradataMlException:
-             raise
-
-         except Exception as err:
-             # TODO Better handle the level of information being presented to the user with logging
-             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR) + str(err),
-                                       MessageCodes.TDMLDF_INFO_ERROR) from err
-
-     @staticmethod
-     def _get_scalar_value(table_name):
-         """
-         Function to return the only 1x1 (scalar) value from a teradataml Dataframe.
-
-         PARAMETERS:
-             table_name - Name of the table to get the value from.
-
-         RAISES:
-             TeradataMlException (TDMLDF_INFO_ERROR)
-
-         EXAMPLES:
-             DataFrameUtils._get_scalar_value(table_name)
-         """
-         # Construct the base Query
-         try:
-             select_query = SQLBundle._build_base_query(table_name)
-             res = execute_sql(select_query)
-             return res.fetchone()[0]
-
-         except TeradataMlException:
-             raise
-
-         except Exception as err:
-             # TODO Better handle the level of information being presented to the user with logging
-             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR) + str(err),
-                                       MessageCodes.TDMLDF_INFO_ERROR) from err
-
-     @staticmethod
-     def _get_sorted_nrow(df, n, sort_col, asc=True):
-         """
-         Internal utility function that returns a teradataml DataFrame containing n rows
-         of the DataFrame, sorted on the given sort column.
-
-         PARAMETERS:
-             df: teradataml DataFrame
-             n: Specifies the number of rows to select.
-                Type: int
-             sort_col: The column to sort on.
-                Type: str
-             asc: (optional) - Specifies the sort order.
-                If True, sort in ascending order.
-                If False, sort in descending order.
-                The default value is True.
-                Type: boolean
-
-         RETURNS:
-             teradataml DataFrame
-
-         EXAMPLES:
-             DataFrameUtils._get_sorted_nrow(df, 10, "col1")
-             DataFrameUtils._get_sorted_nrow(df, 20, "col1", asc=True)
-             DataFrameUtils._get_sorted_nrow(df, 30, "col1", asc=False)
-
-         """
-         # TODO: implement and use this in teradatasqlalchemy
-         tdp = preparer(td_dialect)
-         aed_utils = AedUtils()
-
-         sort_order = "asc"
-         if not asc:
-             sort_order = "desc"
-
-         quoted_cols = [tdp.quote(c) for c in df.columns]
-         sel_cols_str = ",".join(quoted_cols)
-         sel_row_num = "row_number() over (order by \"{0}\" {1}) - 1 as tdml_row_num, {2}".format(sort_col, sort_order, sel_cols_str)
-         filter_str = "tdml_row_num < {0}".format(n)
-         sel_nodeid = aed_utils._aed_select(df._nodeid, sel_row_num)
-         fil_nodeid = aed_utils._aed_filter(sel_nodeid, filter_str)
-         sel2_nodeid = aed_utils._aed_select(fil_nodeid, sel_cols_str)
-         col_names, col_types = __class__._get_column_names_and_types_from_metaexpr(df._metaexpr)
-         new_metaexpr = UtilFuncs._get_metaexpr_using_columns(df._nodeid, zip(col_names, col_types))
-         # Call the function from_node from the appropriate class, either DataFrame or GeoDataFrame
-         new_df = df.__class__._from_node(sel2_nodeid, new_metaexpr, df._index_label)
-         new_df._orderby = df._orderby
-         new_df._metaexpr._n_rows = n
-         return new_df
-
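
The projection and filter strings built above are what drive the generated SQL. A small reconstruction (illustrative only; column names are hypothetical and quoting is hard-coded):

    sort_col, sort_order, n = "id", "asc", 10
    sel_cols_str = ",".join('"{0}"'.format(c) for c in ["id", "Feb", "Jan"])
    sel_row_num = 'row_number() over (order by "{0}" {1}) - 1 as tdml_row_num, {2}'.format(
        sort_col, sort_order, sel_cols_str)
    filter_str = "tdml_row_num < {0}".format(n)
    # The node tree then selects sel_row_num, filters on filter_str, and
    # re-selects the original columns, dropping tdml_row_num.
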
-     @staticmethod
-     def _get_database_names(connection, schema_name):
-         """
-         Function to return a list of valid database names for a given sqlalchemy connection.
-         This function is used to determine whether the database used is valid in user APIs such as copy_to_sql.
-
-         PARAMETERS:
-             connection: Required Argument.
-                 A SQLAlchemy connection object.
-
-             schema_name: Required Argument.
-                 String specifying the requested schema name.
-
-         RAISES:
-             TeradataMlException (TDMLDF_INFO_ERROR)
-
-         EXAMPLES:
-             DataFrameUtils._get_database_names(get_connection(), schema_name)
-         """
-         # TODO: implement and use this in teradatasqlalchemy
-         table_obj = table('databasesV', column('databasename'), schema='dbc')
-         stmt = select(text(str(func.lower(table_obj.c.databasename)) + ' as databasename')).where(
-             text('databasename (NOT CASESPECIFIC) = {} (NOT CASESPECIFIC)'.format(':schema_name')))
-         stmt = text(str(stmt))
-         stmt = stmt.bindparams(schema_name=schema_name)
-         res = connection.execute(stmt).fetchall()
-         return [name.databasename for name in res]
+ # -*- coding: utf-8 -*-
+ """
+
+ Unpublished work.
+ Copyright (c) 2018 by Teradata Corporation. All rights reserved.
+ TERADATA CORPORATION CONFIDENTIAL AND TRADE SECRET
+
+ Primary Owner: mark.sandan@teradata.com
+ Secondary Owner:
+
+ This file implements utility functions for DataFrame.
+ """
+
+ import numbers
+ import pandas as pd
+ from collections import OrderedDict
+
+ from teradataml.common.utils import UtilFuncs
+ from teradataml.common.aed_utils import AedUtils
+ from teradataml.common.constants import AEDConstants, PTITableConstants, \
+     SQLPattern, PythonTypes
+ from teradataml.common.sqlbundle import SQLBundle
+ from teradataml.common.exceptions import TeradataMlException
+ from teradataml.common.messages import Messages
+ from teradataml.common.messagecodes import MessageCodes
+
+ from teradataml.context.context import get_context, get_connection
+ from teradataml.context.context import _get_current_databasename
+ from teradataml.dbutils.dbutils import _execute_query_and_generate_pandas_df
+
+ from teradataml.options.display import display
+ from teradataml.options.configure import configure
+ from teradataml.utils.utils import execute_sql
+
+ from teradatasqlalchemy.types import FLOAT, NUMBER, DECIMAL, PERIOD_TIMESTAMP
+ from teradatasqlalchemy.dialect import preparer, dialect as td_dialect
+ import teradataml.dataframe as tdmldf
+ from teradataml.dataframe.sql_interfaces import ColumnExpression
+
+ from sqlalchemy.sql import select
+ from sqlalchemy.sql.expression import text
+ from sqlalchemy import table, column, func
+ from datetime import datetime, date, time
+ from decimal import Decimal
+
+ # TODO - Need to write unit testcases for these functions
+ class DataFrameUtils():
+
+     @staticmethod
+     def _execute_node_return_db_object_name(nodeid, metaexpression=None):
+         """
+         Fetches queries and view names from the AED node and creates views from the queries.
+         Additionally inspects the metaexpression for consistency.
+
+         PARAMETERS:
+             nodeid: nodeid to execute
+             metaexpression: (optional) updated _metaexpr to validate
+
+         EXAMPLES:
+             _execute_node_return_db_object_name(nodeid)
+             _execute_node_return_db_object_name(nodeid, metaexpr)
+
+         RETURNS:
+             Top level view name.
+
+         """
+         aed_obj = AedUtils()
+         if not aed_obj._aed_is_node_executed(nodeid):
+             view_query_node_type_list = aed_obj._aed_get_exec_query(nodeid)
+             view_names, queries, node_query_types, node_ids = view_query_node_type_list
+
+             # Executing Nodes / Creating Views
+             for index in range(len(queries) - 1, -1, -1):
+                 is_persist = False
+                 if metaexpression and metaexpression._is_persist:
+                     is_persist = True
+
+                 try:
+                     if node_query_types[index] == AEDConstants.AED_QUERY_NODE_TYPE_ML_QUERY_MULTI_OUTPUT.value or \
+                        ("OUT TABLE " in queries[index] and SQLPattern.SQLMR.value.match(queries[index])) or \
+                        is_persist:
+                         # TODO:: OR condition in above needs to be removed once AED support is added.
+                         UtilFuncs._create_table(view_names[index], queries[index])
+
+                     elif node_query_types[index] in ['groupby', 'groupbytime']:
+                         # If the query type is either groupby or groupbytime, get its parent
+                         # nodeid and execute queries for the same.
+                         parent_nodeid = aed_obj._aed_get_parent_nodeids(nodeid)[0]
+                         DataFrameUtils._execute_node_return_db_object_name(parent_nodeid)
+
+                     elif node_query_types[index] == AEDConstants.AED_QUERY_NODE_TYPE_REFERENCE.value:
+                         # Reference nodes - To be ignored.
+                         pass
+
+                     else:
+                         UtilFuncs._create_view(view_names[index], queries[index])
+
+                     # Updating Node Status for executed Node
+                     aed_obj._aed_update_node_state_single(node_ids[index], AEDConstants.AED_NODE_EXECUTED.value)
+
+                 except Exception as emsg:
+                     # TODO:: Append node execution details to emsg.
+                     # Node description, such as nodeType or node operation, should be added
+                     # here in 'emsg' to give away more information on where exactly
+                     # node execution failed.
+                     raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_EXEC_SQL_FAILED, str(emsg)),
+                                               MessageCodes.TDMLDF_EXEC_SQL_FAILED)
+
+         # Setting New Table name retrieved to TDML DF
+         result_table_view_name = aed_obj._aed_get_tablename(nodeid)
+         # validate the metaexpression
+         if configure._validate_metaexpression:
+             DataFrameUtils._validate_metaexpression(result_table_view_name, metaexpression)
+
+         return result_table_view_name
+
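
The loop above walks the pending queries from the last element to the first, so the deepest dependency is created before anything that references it. A toy illustration of that bottom-up order:

    queries = ["create top-level view v1", "create view v2", "create view v3 (deepest dependency)"]
    for index in range(len(queries) - 1, -1, -1):
        print(queries[index])   # prints v3, then v2, then v1: dependencies first
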
+     @staticmethod
+     def _validate_metaexpression(result_table_view_name, metaexpression):
+         """
+         Inspects the metaexpression for consistency with the underlying table/view.
+
+         PARAMETERS:
+             result_table_view_name: a string representing the table/view name to check column metadata
+             metaexpression: the metaexpr of the DataFrame to compare against the result_table_view_name
+
+         EXAMPLES:
+             _validate_metaexpression('t1', df._metaexpr)
+
+         RETURNS:
+             None
+
+         RAISES:
+             RuntimeError if mismatches are found
+
+         """
+         # metaexpression should have already been updated
+         if metaexpression is not None:
+             name = lambda x: x[0]
+             type_ = lambda x: x[1]
+
+             # compare sorted by name of column
+             df = sorted(UtilFuncs._describe_column(DataFrameUtils._get_metadata_from_table(result_table_view_name)), key=lambda x: x[0])
+             meta = sorted(metaexpression.c, key=lambda x: x.name)
+
+             # check length
+             if len(df) == len(meta):
+                 for i in range(len(df)):
+                     # map Teradata type to python type
+                     meta_type = UtilFuncs._teradata_type_to_python_type(meta[i].type)
+
+                     # compare column names and types
+                     if meta[i].name != name(df[i]) or meta_type != type_(df[i]):
+                         err_msg = "[Mismatch when checking %s]\n\t[Table/View] %s %s\n\t[MetaExpression] %s %s (mapped from => %s)\n"
+                         raise RuntimeError(err_msg % (result_table_view_name,
+                                                       name(df[i]), type_(df[i]),
+                                                       meta[i].name, meta_type, meta[i].type))
+             else:
+                 err_msg = "[Length mismatch when checking %s]\nSource Table/View has length %s but MetaExpression has length %s"
+                 raise RuntimeError(err_msg % (result_table_view_name, len(df), len(meta)))
+
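
The core of the check is a pairwise comparison of two name-sorted column lists. A minimal, self-contained sketch of the same idea (hypothetical literal data in place of the HELP COLUMN results and the metaexpression):

    table_cols = sorted([("Feb", "float"), ("accounts", "str")])
    meta_cols = sorted([("accounts", "str"), ("Feb", "float")])
    if len(table_cols) != len(meta_cols):
        raise RuntimeError("length mismatch")
    for (t_name, t_type), (m_name, m_type) in zip(table_cols, meta_cols):
        if t_name != m_name or t_type != m_type:
            raise RuntimeError("mismatch: {0} vs {1}".format((t_name, t_type), (m_name, m_type)))
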
+     @staticmethod
+     def _get_dataframe_print_string(table_name, index_label, orderby=None, undropped_index=None):
+         """
+         Builds string output for teradataml DataFrame.
+
+         PARAMETERS:
+             table_name - Name of the database table to read from.
+             index_label - String/List specifying column to use as index.
+             orderby - order expression to sort returned rows
+
+         EXAMPLES:
+             _get_dataframe_print_string('table_name', None, None)
+
+         RETURNS:
+             String representation of a pandas DataFrame.
+
+         """
+         read_query = SQLBundle._build_top_n_print_query(table_name, display.max_rows, orderby)
+
+         if index_label is not None:
+             pandas_df = _execute_query_and_generate_pandas_df(read_query, index=index_label)
+         else:
+             pandas_df = _execute_query_and_generate_pandas_df(read_query)
+
+         return pandas_df.to_string()
+
+     @staticmethod
+     def _get_pprint_dtypes(column_names_and_types, null_count=False):
+         """
+         Returns a string containing the column names and types.
+         If null_count is True, the string will also contain
+         the number of non-null values for each column.
+
+         PARAMETERS:
+             column_names_and_types - List of column names and types.
+             null_count (optional)  - Specifies whether to include the non-null count
+                                      for each column; when True, each entry in
+                                      column_names_and_types also carries that count.
+
+         EXAMPLES:
+             >>> print(_get_pprint_dtypes(column_names_and_types))
+             accounts      str
+             Feb         float
+             Jan           int
+             Mar           int
+             Apr           int
+             datetime      str
+
+             >>> print(_get_pprint_dtypes(column_names_and_types, null_count=True))
+             accounts    3 non-null str
+             Feb         3 non-null float
+             Jan         3 non-null int
+             Mar         3 non-null int
+             Apr         3 non-null int
+             datetime    3 non-null str
+
+         RAISES:
+
+         """
+         col_names = [i[0] for i in column_names_and_types]
+         col_types = [i[1] for i in column_names_and_types]
+         max_col_names = len(max(col_names, key=len)) + 4
+         max_col_types = len(max(col_types, key=len))
+         dtypes_string = ""
+         if not null_count:
+             for colname, coltype in column_names_and_types:
+                 dtypes_string += "{0: <{name_width}}{1: >{type_width}}\n".format(colname, coltype,
+                                                                                  name_width=max_col_names,
+                                                                                  type_width=max_col_types)
+         else:
+             null_count = [i[2] for i in column_names_and_types]
+             max_null_count = len(str(max(null_count, key=len)))
+             for colname, coltype, num_nulls in column_names_and_types:
+                 dtypes_string += "{0: <{name_width}}{1: <{count_width}} non-null {2: <{type_width}}\n".format(colname,
+                                                                                                               num_nulls,
+                                                                                                               coltype,
+                                                                                                               name_width=max_col_names,
+                                                                                                               count_width=max_null_count,
+                                                                                                               type_width=max_col_types)
+         # Remove last new line character.
+         dtypes_string = dtypes_string[:-1]
+         return dtypes_string
+
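
The width computation pads every name to the longest name plus four spaces and right-aligns the types. A condensed, standalone version of the no-null-count branch:

    column_names_and_types = [("accounts", "str"), ("Feb", "float"), ("Jan", "int")]
    name_width = len(max((c[0] for c in column_names_and_types), key=len)) + 4
    type_width = len(max((c[1] for c in column_names_and_types), key=len))
    lines = ["{0: <{nw}}{1: >{tw}}".format(n, t, nw=name_width, tw=type_width)
             for n, t in column_names_and_types]
    print("\n".join(lines))
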
+     @staticmethod
+     def _get_metadata_from_table(table_name):
+         """
+         Retrieves column metadata by executing a HELP COLUMN command.
+
+         PARAMETERS:
+             table_name - The table name or view name.
+
+         RETURNS:
+             Returns the result set (column information) from HELP COLUMN.
+
+         RAISES:
+             Database error if an error occurred while executing the HELP COLUMN.
+
+         EXAMPLES:
+             df = DataFrame.from_table('mytab')
+             metadata = _get_metadata_from_table(df._table_name)
+         """
+         # Construct HELP COLUMN command.
+         help_col_sql = SQLBundle._build_help_column(table_name)
+         # Execute HELP COLUMN command.
+         return UtilFuncs._execute_query(help_col_sql)
+
+     @staticmethod
+     def _extract_select_string(select_expression):
+         """
+         Takes in a string/list representing a Pandas selection clause of any of the forms (only):
+             a) "col1" or 'col1'
+             b) ["col 1"] or ['col 1']
+             c) ["col1", "col2", "col3"] or ['col1', 'col2', 'col3']
+             d) [['col1', 'col2', 'col3']] or [["col1", "col2", "col3"]]
+
+         And returns a list with column strings representing the selection of the form:
+             a) ['col1']
+             b) ['col 1']
+             c) ['col1','col2','col3']
+             d) ['col1','col2','col3']
+
+         Column Names ("col1", "col2"..) are Strings representing database table Columns.
+         All standard Teradata data types for columns are supported, e.g. INTEGER, VARCHAR(5), FLOAT.
+
+         PARAMETERS:
+             select_expression - Expression representing column selection
+                                 Type - String or List of Strings or List of List (Single level only)
+                                 Required - Yes
+
+         EXAMPLES:
+             DataFrameUtils._extract_select_string([['col1', 'col2']])
+             DataFrameUtils._extract_select_string("col1")
+             DataFrameUtils._extract_select_string(["col1"])
+             DataFrameUtils._extract_select_string(["col1","col2","col3"])
+
+         RETURNS:
+             List of Strings representing column names.
+
+         RAISES:
+             TeradataMlException
+         """
+         tdp = preparer(td_dialect)
+         column_list = []
+
+         # Single String column
+         if isinstance(select_expression, str):
+             # Error handling - Empty String
+             if select_expression == "":
+                 raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
+                                           MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
+             else:
+                 column_list.append(tdp.quote("{0}".format(select_expression.strip())))
+
+         # Error Handling - [], [""], [None], ["None"], ['col1', None], ['col1', '']
+         elif isinstance(select_expression, list) and (len(select_expression) == 0 or
+                 any(element in [None, "None", ""] for element in select_expression)):
+             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
+                                       MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
+
+         # List - ["col1"] or ["col1", "col2", "col3"]
+         elif isinstance(select_expression, list) and all(isinstance(element, str) for element in select_expression):
+             if len(select_expression) == 1:
+                 column_list.append(tdp.quote("{0}".format(select_expression[0].strip())))
+             else:
+                 column_list = [tdp.quote("{0}".format(element.strip())) for element in select_expression]
+
+         # List of List (Single level only - Pandas Syntax) - [["col1", "col2", "col3"]]
+         elif isinstance(select_expression, list) and isinstance(select_expression[0], list):
+             # Error Handling - [[]], [[""]], [[None]], [['col1', None]], [['col1', "None"]], ["col1", ""]
+             if len(select_expression[0]) == 0 or any(element in [None, "None", ""] for element in select_expression[0]):
+                 raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY),
+                                           MessageCodes.TDMLDF_SELECT_NONE_OR_EMPTY)
+
+             else:
+                 column_list = [tdp.quote("{0}".format(element.strip())) for element in select_expression[0]]
+
+         # Any other Format - Raise Format Exception
+         else:
+             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_SELECT_INVALID_FORMAT),
+                                       MessageCodes.TDMLDF_SELECT_INVALID_FORMAT)
+         return column_list
+
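
Stripped of quoting and error handling, the branching above reduces to a small normalization. A hypothetical condensed equivalent (normalize_selection is illustrative, not part of teradataml):

    def normalize_selection(expr):
        """Condensed sketch of the accepted-shape handling above (no validation)."""
        if isinstance(expr, str):
            return [expr.strip()]
        if expr and isinstance(expr[0], list):   # [["col1", "col2"]]
            expr = expr[0]
        return [e.strip() for e in expr]

    normalize_selection([["col1", "col2"]])   # ['col1', 'col2']
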
+     @staticmethod
+     def _get_primary_index_from_table(table_name):
+         """
+         Retrieves the primary index by executing a HELP INDEX command.
+
+         PARAMETERS:
+             table_name - The table name or volatile table name.
+
+         RETURNS:
+             Returns a list containing the primary index columns from HELP INDEX.
+             If there is no primary index (NoPI table), then returns None.
+
+         RAISES:
+             Database error if an error occurred while executing the HELP INDEX.
+
+         EXAMPLES:
+             df = DataFrame.from_table('mytab')
+             index_labels = DataFrameUtils._get_primary_index_from_table(df._table_name)
+         """
+         # Construct HELP INDEX command.
+         help_index_sql = SQLBundle._build_help_index(table_name)
+
+         # Execute HELP INDEX command.
+         rows = UtilFuncs._execute_query(help_index_sql)
+         index_labels = []
+         for row in rows:
+             # row[1] specifies whether the Index is 'Primary or Secondary?'
+             if row[1].rstrip() == 'P':
+                 # row[2] specifies a string of comma separated column names that form the primary index
+                 if "," in row[2]:
+                     index_cols = row[2].split(',')
+                 else:
+                     index_cols = [row[2]]
+                 for index_col in index_cols:
+                     # Since the TD_TIMEBUCKET column in PTI tables is not functionally available, it can be ignored
+                     # from the index information as well (else a warning is generated by SQLAlchemy).
+                     # row[12] corresponds to the 'Timebucket' column in the results of the 'help index' SQL command,
+                     # which is available only when the version supports PTI tables.
+                     if index_col == PTITableConstants.TD_TIMEBUCKET.value and len(row) > 12 and row[12] is not None:
+                         continue
+                     else:
+                         index_labels.append(index_col)
+
+         if len(index_labels) > 0:
+             return index_labels
+         else:
+             return None
+
+     @staticmethod
+     def __validate_sort_type_raise_exception(sort_col_type):
+         """
+         Function to raise TeradataMlException for errors encountered for an invalid/incorrect
+         "sort_col_type" in the "_validate_sort_col_type" function.
+
+         PARAMETERS:
+             sort_col_type: The sort column type.
+
+         RETURNS:
+             None
+
+         RAISES:
+             TeradataMlException
+
+         EXAMPLES:
+             df_utils.__validate_sort_type_raise_exception(PythonTypes.PY_STRING_TYPE.value)
+         """
+         msg = Messages.get_message(MessageCodes.TDMLDF_DROP_INVALID_INDEX_TYPE).format(sort_col_type)
+         raise TeradataMlException(msg, MessageCodes.TDMLDF_DROP_INVALID_INDEX_TYPE)
+
+     @staticmethod
+     def _validate_sort_col_type(sort_col_type, sort_col_values):
+         """
+         Validates a list of sort column values with the sort column type.
+
+         PARAMETERS:
+             sort_col_type - The sort column type.
+             sort_col_values - A single value or list-like values
+
+         RETURNS:
+             None
+
+         RAISES:
+             TeradataMlException
+
+         EXAMPLES:
+             df_utils._validate_sort_col_type(PythonTypes.PY_STRING_TYPE.value, ["Jan", "Feb"])
+             df_utils._validate_sort_col_type(PythonTypes.PY_STRING_TYPE.value, "Jan")
+             df_utils._validate_sort_col_type(PythonTypes.PY_INT_TYPE.value, [1, 2])
+         """
+         if isinstance(sort_col_values, list):
+             if sort_col_type == PythonTypes.PY_STRING_TYPE.value:
+                 if not all(isinstance(i, str) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_FLOAT_TYPE.value:
+                 if not all(isinstance(i, float) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DECIMAL_TYPE.value:
+                 if not all(isinstance(i, Decimal) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DATETIME_TYPE.value:
+                 if not all(isinstance(i, datetime) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_TIME_TYPE.value:
+                 if not all(isinstance(i, time) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DATE_TYPE.value:
+                 if not all(isinstance(i, date) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_BYTES_TYPE.value:
+                 if not all(isinstance(i, bytes) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             else:  # numeric type
+                 if not all(isinstance(i, numbers.Integral) for i in sort_col_values):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+         elif isinstance(sort_col_values, (tuple, dict)):
+             raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_DROP_ARGS),
+                                       MessageCodes.TDMLDF_DROP_ARGS)
+         else:
+             if sort_col_type == PythonTypes.PY_STRING_TYPE.value:
+                 if not isinstance(sort_col_values, str):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_FLOAT_TYPE.value:
+                 if not isinstance(sort_col_values, float):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DECIMAL_TYPE.value:
+                 if not isinstance(sort_col_values, Decimal):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DATETIME_TYPE.value:
+                 if not isinstance(sort_col_values, datetime):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_TIME_TYPE.value:
+                 if not isinstance(sort_col_values, time):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_DATE_TYPE.value:
+                 if not isinstance(sort_col_values, date):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             elif sort_col_type == PythonTypes.PY_BYTES_TYPE.value:
+                 if not isinstance(sort_col_values, bytes):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+             else:  # numeric type
+                 if not isinstance(sort_col_values, numbers.Integral):
+                     DataFrameUtils.__validate_sort_type_raise_exception(sort_col_type)
+
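
The long if/elif chain above maps a type-name string to an isinstance check. A table-driven sketch of the same validation (illustrative; the CHECKS keys are assumed type-name strings and may not match the actual PythonTypes enum values):

    import numbers
    from datetime import datetime, date, time
    from decimal import Decimal

    # Assumed mapping of type-name string -> Python type to check with isinstance.
    CHECKS = {"str": str, "float": float, "decimal.Decimal": Decimal,
              "datetime.datetime": datetime, "datetime.time": time,
              "datetime.date": date, "bytes": bytes, "int": numbers.Integral}

    def values_match_type(type_name, values):
        expected = CHECKS.get(type_name, numbers.Integral)   # numeric fallback, as above
        values = values if isinstance(values, list) else [values]
        return all(isinstance(v, expected) for v in values)
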
+    def _get_required_columns_types_from_metaexpr(metaexpr, col_list=None):
+        """
+        Retrieves column names and types from a meta expression. To get types for
+        only a subset of columns, pass those columns in the 'col_list' argument.
+
+        PARAMETERS:
+            metaexpr - Meta expression from which columns and types are to be retrieved.
+            col_list - Column list for which types are to be retrieved.
+
+        RETURNS:
+            Dictionary with column name as key and datatype as value.
+
+        EXAMPLES:
+            df = DataFrame.from_table('mytab')
+            metadata = DataFrameUtils._get_required_columns_types_from_metaexpr(df._metaexpr)
+        """
+
+        if isinstance(col_list, str):
+            col_list = [col_list]
+
+        if col_list is not None and not isinstance(col_list, list):
+            return None
+
+        meta_cols = metaexpr.t.c
+        meta_columns = [c.name for c in meta_cols]
+        col_names = []
+        col_types = []
+
+        # When the column list to retrieve is not provided, return metadata for all columns.
+        if col_list is None:
+            for col_name in meta_columns:
+                col_names.append(meta_cols[col_name].name)
+                col_types.append(meta_cols[col_name].type)
+
+        # Otherwise return metadata for only the requested columns.
+        else:
+            for col_name in col_list:
+                if DataFrameUtils._check_column_exists(col_name, meta_columns):
+                    # _metaexpr saves columns without quotes, so unquote first.
+                    unquoted_col_name = col_name.replace('"', "")
+                    col_names.append(meta_cols[unquoted_col_name].name)
+                    col_types.append(meta_cols[unquoted_col_name].type)
+
+        return OrderedDict(zip(col_names, col_types))
+
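The return value is simply an OrderedDict zipped from two parallel lists, preserving the metaexpr column order. A minimal illustration of the result's shape, with placeholder strings standing in for teradatasqlalchemy type objects:

    from collections import OrderedDict

    col_names = ["accounts", "Feb"]
    col_types = ["VARCHAR(length=20)", "FLOAT()"]  # placeholders for teradatasqlalchemy types
    metadata = OrderedDict(zip(col_names, col_types))
    print(metadata)
    # OrderedDict([('accounts', 'VARCHAR(length=20)'), ('Feb', 'FLOAT()')])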
+    @staticmethod
+    def _check_column_exists(column_name, df_columns):
+        """
+        Checks whether the provided column is present in the given list of columns.
+        Note:
+            It is the calling function's responsibility to send the column and the column
+            list in the proper case. By default the lookup is case-sensitive. For a
+            case-insensitive lookup, pass both column_name and df_columns in lower case.
+
+        PARAMETERS:
+            column_name - Column name to check for.
+            df_columns  - List of columns to check against.
+
+        RETURNS:
+            True if the column exists, otherwise False.
+
+        EXAMPLES:
+            df = DataFrame.from_table('mytab')
+            metadata = DataFrameUtils._check_column_exists("col1", df.columns)
+        """
+        unquoted_df_columns = [column.replace('"', "") for column in df_columns]
+        return column_name.replace('"', "") in unquoted_df_columns
+
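Because both sides are unquoted before comparison, quoted and unquoted spellings of the same name compare equal. A standalone restatement of the lookup, runnable without a Vantage connection:

    def column_exists(column_name, df_columns):
        # Same unquoting as above: '"col1"' and 'col1' compare equal.
        unquoted = [c.replace('"', "") for c in df_columns]
        return column_name.replace('"', "") in unquoted

    assert column_exists('"col1"', ["col1", "col2"])
    assert not column_exists("col3", ["col1", "col2"])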
+    @staticmethod
+    def _validate_agg_function(func, col_names):
+        """
+        Internal function to validate column names against the actual
+        column names passed as parameter, and aggregate operations
+        against the valid aggregate operations.
+
+        PARAMETERS:
+            func - (Required) Specifies the function(s) to be
+                applied on teradataml DataFrame columns.
+                Acceptable formats for function(s) are string,
+                dictionary or list of strings/functions.
+                Accepted combinations are:
+                    1. String function name
+                    2. List of string functions
+                    3. Dictionary of column names -> string function
+                       (or list of string functions)
+            col_names - List. Names of the columns in the DataFrame.
+
+        RETURNS:
+            operations - dict of columns -> aggregate operations.
+            A unified dictionary, similar to func, even when func is a
+            string or a list of strings or functions.
+
+        RAISES:
+            1. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
+               operation(s) received in parameter 'func' is/are invalid.
+
+               Possible Value:
+               Invalid aggregate operation(s): minimum, counter.
+               Valid aggregate operation(s): count, max, mean, min,
+               std, sum.
+
+            2. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
+               specified in 'func' is not present in the dataframe.
+
+               Possible Value:
+               Invalid column(s) given in parameter func: col1.
+               Valid column(s): A, B, C, D.
+
+        EXAMPLES:
+            Let the dataframe contain two columns, col1 and col2.
+
+            VALID EXAMPLES:
+                1. operations = DataFrameUtils._validate_agg_function(
+                       'mean', ['col1', 'col2'])
+
+                2. operations = DataFrameUtils._validate_agg_function(
+                       ['mean', 'min'], ['col1', 'col2'])
+
+                3. operations = DataFrameUtils._validate_agg_function(
+                       {'col1': ['mean', 'min'], 'col2': 'count'},
+                       ['col1', 'col2'])
+
+            INVALID EXAMPLES:
+                1. operations = DataFrameUtils._validate_agg_function(
+                       'counter', ['col1', 'col2'])
+
+                2. operations = DataFrameUtils._validate_agg_function(
+                       {'col1': ['mean', 'min'], 'col55': 'count'},
+                       ['col1', 'col2'])
+        """
+        operations = OrderedDict()
+
+        valid_aggregate_operations = UtilFuncs._get_valid_aggregate_operations()
+
+        if isinstance(func, str):
+            for column in col_names:
+                operations[column] = [func]
+        elif isinstance(func, list):
+            for column in col_names:
+                operations[column] = func
+        else:
+            for column in func:
+                if isinstance(func[column], str):
+                    func[column] = [func[column]]  # Convert a string inside the dict to a list.
+            operations = func
+
+        given_columns = operations.keys()
+        invalid_columns = []
+        all_operations = []
+        for col in given_columns:
+            all_operations.extend(operations[col])
+            if col not in col_names:
+                invalid_columns.append(col)
+        if len(invalid_columns) > 0:  # If any of the specified columns is not present in the dataframe.
+            col_names.sort()
+            invalid_columns.sort()
+            msg = Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN). \
+                format(", ".join(invalid_columns), 'func', ", ".join(col_names))
+            raise TeradataMlException(msg, MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN)
+
+        all_operations = list(set(all_operations))
+        invalid_aggregates = []
+        for operation in all_operations:
+            if operation not in valid_aggregate_operations \
+                    and operation not in UtilFuncs._get_valid_time_series_aggregate_operations():
+                invalid_aggregates.append(operation)
+        if len(invalid_aggregates) > 0:  # If any of the specified aggregate operations is not valid.
+            # For the error message, add the other time series aggregate operations that
+            # can be used with the DataFrame.agg() method.
+            valid_aggregate_operations = valid_aggregate_operations + ['first', 'last', 'mode']
+            valid_aggregate_operations.sort()
+            invalid_aggregates.sort()
+            msg = Messages.get_message(MessageCodes.TDMLDF_INVALID_AGGREGATE_OPERATION). \
+                format(", ".join(invalid_aggregates), ", ".join(valid_aggregate_operations))
+            raise TeradataMlException(msg, MessageCodes.TDMLDF_INVALID_AGGREGATE_OPERATION)
+
+        return operations
+
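Whatever shape 'func' arrives in, the normalization above always yields a dictionary mapping each column to a list of operation names. A pure-Python sketch of just that normalization step, with validation omitted:

    from collections import OrderedDict

    def normalize_func(func, col_names):
        if isinstance(func, str):
            return OrderedDict((c, [func]) for c in col_names)
        if isinstance(func, list):
            return OrderedDict((c, list(func)) for c in col_names)
        # dict: wrap any bare string values in a list.
        return OrderedDict((c, [ops] if isinstance(ops, str) else ops)
                           for c, ops in func.items())

    print(normalize_func('mean', ['col1', 'col2']))
    # OrderedDict([('col1', ['mean']), ('col2', ['mean'])])
    print(normalize_func({'col1': ['mean', 'min'], 'col2': 'count'}, ['col1', 'col2']))
    # OrderedDict([('col1', ['mean', 'min']), ('col2', ['count'])])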
+    @staticmethod
+    def _generate_aggregate_column_expression(df, column, operation, describe_op, tdp, **kwargs):
+        """
+        Function generates the aggregate column expression for the provided column
+        and aggregate function.
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame which is to be used to get the
+                desired aggregate column expression.
+                Types: teradataml DataFrame
+
+            column:
+                Required Argument.
+                Specifies the column name for which the desired aggregate operation
+                is to be used.
+                Types: str
+
+            operation:
+                Required Argument.
+                Specifies the aggregate operation.
+                Types: str
+
+            describe_op:
+                Required Argument.
+                Specifies a boolean flag that decides whether the aggregate
+                operation is being performed for DataFrame.describe() or not.
+                Types: bool
+
+            tdp:
+                Required Argument.
+                Specifies a TeradataIdentifierPreparer object. It is required for
+                quoting.
+                Types: TeradataIdentifierPreparer
+
+            kwargs:
+                Specifies miscellaneous keyword arguments that can be passed to
+                aggregate functions.
+
+        RAISES:
+            AttributeError - In case ColumnExpression does not have the desired
+            aggregate function implemented.
+
+        RETURNS:
+            A boolean stating whether the column is supported or not, the new column name,
+            the new column type, a string representing the column aggregate expression, and
+            invalid column information in case the column has an unsupported type for the
+            aggregate operation.
+
+        EXAMPLES:
+            column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str = \
+                DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=func,
+                                                                     describe_op=describe_op, percentile=percentile,
+                                                                     tdp=tdp, **kwargs)
+        """
+        try:
+            key_to_process = ""
+            # Quote column names that clash with Teradata reserved keywords.
+            if "sort_columns" in kwargs:
+                key_to_process = "sort_columns"
+            elif "sort_column" in kwargs:
+                key_to_process = "sort_column"
+
+            if key_to_process:
+                quoted_columns = UtilFuncs._process_for_teradata_keyword(kwargs[key_to_process])
+                kwargs[key_to_process] = quoted_columns
+
+            func_expression = getattr(df[column], operation)(describe_op=describe_op, **kwargs)
+            new_column_name = column if describe_op else "{1}_{0}".format(column, operation)
+            # column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str
+            return True, new_column_name, NUMBER() if describe_op else func_expression.type, \
+                func_expression.compile_label(new_column_name), None
+        except AttributeError:
+            # Reaching here means the provided operation is invalid and is not supported.
+            # This is for internal purposes only.
+            # Validation of operations for "agg" should be done in "agg" only.
+            raise RuntimeError("Invalid aggregate function: {}".format(operation))
+        except RuntimeError:
+            # Reaching here means the column does not support the provided operation.
+            # We ignore this and add the column to the invalid column list:
+            #     invalid_columns[operation].append("({0} - {1})".format(column, column_type))
+            # OR we raise a generic message stating the DataFrame does not have any column
+            # with a type supported for the operation.
+            if describe_op:
+                return True, tdp.quote(column), NUMBER(), 'null as {}'.format(tdp.quote(column)), None
+            else:
+                return False, None, None, None, "({0} - {1})".format(column, df[column].type)
+        except Exception:
+            raise
+
+    @staticmethod
+    def _construct_sql_expression_for_aggregations(df, column_names, column_types, func, percentile=.5,
+                                                   describe_op=False, **kwargs):
+        """
+        Internal function to create and return the sql expression
+        corresponding to the given operation, column_names and
+        column_types.
+
+        Column_types are used to check whether all the datatypes are
+        valid types for the given operation, and an exception is thrown
+        if they are not.
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame which is to be used to get the desired
+                aggregate column expression.
+                Types: teradataml DataFrame
+
+            column_names:
+                Required Argument.
+                Specifies the column names for which the desired aggregate operation is
+                to be executed.
+                Types: List of strings
+
+            column_types:
+                Required Argument.
+                Specifies the respective column types for the column names.
+                Types: List of teradatasqlalchemy types
+
+            func:
+                Required Argument.
+                Specifies the aggregate function(s) to be applied on teradataml
+                DataFrame columns.
+                Types: string, dictionary or list of strings/functions.
+                Accepted combinations are:
+                    1. String function name
+                    2. List of functions
+                    3. Dictionary containing column name as key and aggregate
+                       function name (string or list of strings) as value
+                    4. ColumnExpression built using the aggregate functions.
+                    5. List of ColumnExpressions built using the aggregate functions.
+
+            percentile:
+                Optional Argument.
+                Specifies a value between 0 and 1 that can only be used with func = 'percentile'.
+                The default is .5, which returns the 50th percentile.
+                Types: float
+
+            describe_op:
+                Optional Argument.
+                Specifies a boolean flag that decides whether the aggregate operation being
+                performed is for DataFrame.describe() or not.
+                Types: bool
+
+            kwargs:
+                Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
+
+        RETURNS:
+            a) sql expression, such as
+               1. 'min(col1) as min_col1, min(col2) as min_col2' if
+                  col1 and col2 are the columns in the DataFrame and the
+                  operation is 'min'
+               2. 'max(col1) as max_col1, max(col2) as max_col2' if
+                  col1 and col2 are the columns in the DataFrame and the
+                  operation is 'max'
+               3. 'min(col1) as min_col1, stddev_samp(col2) as std_col2'
+                  if col1, col2 are the columns in the DataFrame and the
+                  operations are min, std.
+               etc...
+            b) new columns' names (e.g. min_col1, min_col2 ...)
+            c) new columns' types
+
+        RAISES:
+            TeradataMLException
+            1. TDMLDF_AGGREGATE_COMBINED_ERR - If the provided
+               aggregate operations do not support the specified columns.
+
+               Possible Value:
+               No results. Below is/are the error message(s):
+               All selected columns [(col1 - VARCHAR)] is/are
+               unsupported for 'sum' operation.
+
+            2. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
+               operation(s) received in parameter 'func' is/are invalid.
+
+               Possible Value:
+               Invalid aggregate operation(s): minimum, counter.
+               Valid aggregate operation(s): count, max, mean, min,
+               std, sum.
+
+            3. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
+               specified in func is not present in the dataframe.
+
+               Possible Value:
+               Invalid column(s) given in parameter func: col1.
+               Valid column(s): A, B, C, D.
+
+        EXAMPLES:
+            col_names, col_types = \
+                df_utils._get_column_names_and_types_from_metaexpr(self._metaexpr)
+            expr, new_col_names, new_col_types = \
+                df_utils._construct_sql_expression_for_aggregations(
+                    df, col_names, col_types, 'min')
+
+            expr1, new_col_names1, new_col_types1 = \
+                df_utils._construct_sql_expression_for_aggregations(
+                    df, col_names, col_types, ['min', 'sum'])
+
+            expr2, new_col_names2, new_col_types2 = \
+                df_utils._construct_sql_expression_for_aggregations(
+                    df, col_names, col_types, {'col1': ['min', 'sum'],
+                                               'col2': 'mean'})
+        """
+
+        # e.g. of column_types: [VARCHAR(length=13), INTEGER(), VARCHAR(length=60), VARCHAR(length=5),
+        #                        FLOAT(precision=0)]
+
+        # e.g. of types of each column: <class 'teradatasqlalchemy.types.VARCHAR'>,
+        # <class 'teradatasqlalchemy.types.INTEGER'>, <class 'teradatasqlalchemy.types.FLOAT'>,
+        # <class 'teradatasqlalchemy.types.INTERVAL_MINUTE_TO_SECOND'> etc.
+
+        # If the function is a time series aggregate, we process the aggregation differently.
+        if not isinstance(func, str):
+            # If func is not an instance of string, the call is from DataFrame.agg()
+            # and is made to process multiple functions. We process this differently,
+            # as we need to map and serialize the column names and the aggregate
+            # functions that operate on them. If there is just one function to be
+            # executed on the complete DataFrame, this extra processing is not needed.
+            # Also, if the call is from DataFrame.agg(), the time series aggregate check
+            # is not required, as special Time Series aggregate functions cannot be used
+            # in DataFrame.agg().
+            return DataFrameUtils._construct_sql_expression_for_aggregations_for_agg(df, column_names, column_types,
+                                                                                     func, percentile, describe_op,
+                                                                                     **kwargs)
+
+        as_time_series_aggregate = False
+        if "as_time_series_aggregate" in kwargs.keys():
+            as_time_series_aggregate = kwargs["as_time_series_aggregate"]
+
+        if as_time_series_aggregate and func in ['bottom', 'bottom with ties', 'delta_t', 'mad', 'top',
+                                                 'top with ties']:
+            return DataFrameUtils._construct_sql_expression_for_time_series_aggregations(df, column_names,
+                                                                                         column_types, func,
+                                                                                         **kwargs)
+
+        tdp = preparer(td_dialect)
+
+        # This variable is used to decide whether the DataFrame has all columns unsupported
+        # for the provided operations.
+        all_unsupported_columns = True
+        valid_columns = []
+        invalid_columns = []
+        new_column_names = []
+        new_column_types = []
+        for column in column_names:
+            column_supported, new_column_name, new_column_type, column_aggr_expr, invalid_column_str = \
+                DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=func,
+                                                                     describe_op=describe_op, percentile=percentile,
+                                                                     tdp=tdp, **kwargs)
+            if column_supported:
+                all_unsupported_columns = False
+                new_column_names.append(new_column_name)
+                new_column_types.append(new_column_type)
+                valid_columns.append(column_aggr_expr)
+            else:
+                invalid_columns.append("({0} - {1})".format(column, df[column].type))
+
+        if all_unsupported_columns:
+            error_msgs = []
+            invalid_columns.sort()  # Helps in reporting the columns in lexicographic order.
+            error = MessageCodes.TDMLDF_AGGREGATE_UNSUPPORTED.value.format(", ".join(invalid_columns),
+                                                                           func)
+            error_msgs.append(error)
+
+            if len(valid_columns) == 0:  # No supported columns in the given list of columns.
+                raise TeradataMlException(Messages.get_message(
+                    MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs)),
+                    MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
+
+        # Quote column names that clash with Teradata reserved keywords.
+        quote_column_name = [UtilFuncs._process_for_teradata_keyword(col) for col in column_names]
+
+        # Actual columns should be retained if "drop_columns" is set to False.
+        if kwargs.get("drop_columns") is False:
+            valid_columns = quote_column_name + valid_columns
+            new_column_names = column_names + new_column_names
+            new_column_types = column_types + new_column_types
+
+        aggregate_expr = ", ".join(valid_columns)
+        return aggregate_expr, new_column_names, new_column_types
+
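For a single string function, the returned expression is a comma-joined projection of per-column aggregates. The real expression is compiled via ColumnExpression objects; this sketch only shows the target shape for func='min':

    # Illustrative only: the real expression is compiled by ColumnExpression.
    columns = ["col1", "col2"]
    aggregate_expr = ", ".join('min("{0}") as "min_{0}"'.format(c) for c in columns)
    print(aggregate_expr)
    # min("col1") as "min_col1", min("col2") as "min_col2"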
+    @staticmethod
+    def _construct_sql_expression_for_aggregations_for_agg(df, column_names, column_types, func, percentile=.5,
+                                                           describe_op=False, **kwargs):
+        """
+        Internal function to create and return the sql expression
+        corresponding to the given operation, column_names and
+        column_types.
+
+        Column_types are used to check whether all the datatypes are
+        valid types for the given operation, and an exception is thrown
+        if they are not.
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame which is to be used to get the desired
+                aggregate column expression.
+                Types: teradataml DataFrame
+
+            column_names:
+                Required Argument.
+                Specifies the column names for which the desired aggregate operation is
+                to be executed.
+                Types: List of strings
+
+            column_types:
+                Required Argument.
+                Specifies the respective column types for the column names.
+                Types: List of teradatasqlalchemy types
+
+            func:
+                Required Argument.
+                Specifies the aggregate function(s) to be applied on teradataml
+                DataFrame columns.
+                Types: string, dictionary or list of strings/functions.
+                Accepted combinations are:
+                    1. String function name
+                    2. List of functions
+                    3. Dictionary containing column name as key and aggregate
+                       function name (string or list of strings) as value
+                    4. ColumnExpression built using the aggregate functions.
+                    5. List of ColumnExpressions built using the aggregate functions.
+
+            percentile:
+                Optional Argument.
+                Specifies a value between 0 and 1 that can only be used with func = 'percentile'.
+                The default is .5, which returns the 50th percentile.
+                Types: float
+
+            describe_op:
+                Optional Argument.
+                Specifies a boolean flag that decides whether the aggregate operation being
+                performed is for DataFrame.describe() or not.
+                Types: bool
+
+            kwargs:
+                Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
+
+        RETURNS:
+            a) sql expression, such as
+               1. 'min(col1) as min_col1, min(col2) as min_col2' if
+                  col1 and col2 are the columns in the DataFrame and the
+                  operation is 'min'
+               2. 'max(col1) as max_col1, max(col2) as max_col2' if
+                  col1 and col2 are the columns in the DataFrame and the
+                  operation is 'max'
+               3. 'min(col1) as min_col1, stddev_samp(col2) as std_col2'
+                  if col1, col2 are the columns in the DataFrame and the
+                  operations are min, std.
+               etc...
+            b) new columns' names (e.g. min_col1, min_col2 ...)
+            c) new columns' types
+
+        RAISES:
+            TeradataMLException
+            1. TDMLDF_AGGREGATE_COMBINED_ERR - If the provided
+               aggregate operations do not support the specified columns.
+
+               Possible Value:
+               No results. Below is/are the error message(s):
+               All selected columns [(col1 - VARCHAR)] is/are
+               unsupported for 'sum' operation.
+
+            2. TDMLDF_INVALID_AGGREGATE_OPERATION - If the aggregate
+               operation(s) received in parameter 'func' is/are invalid.
+
+               Possible Value:
+               Invalid aggregate operation(s): minimum, counter.
+               Valid aggregate operation(s): count, max, mean, min,
+               std, sum.
+
+            3. TDMLDF_AGGREGATE_INVALID_COLUMN - If any of the columns
+               specified in func is not present in the dataframe.
+
+               Possible Value:
+               Invalid column(s) given in parameter func: col1.
+               Valid column(s): A, B, C, D.
+
+        EXAMPLES:
+            col_names, col_types = \
+                df_utils._get_column_names_and_types_from_metaexpr(self._metaexpr)
+            expr, new_col_names, new_col_types = \
+                df_utils._construct_sql_expression_for_aggregations_for_agg(
+                    df, col_names, col_types, 'min')
+
+            expr1, new_col_names1, new_col_types1 = \
+                df_utils._construct_sql_expression_for_aggregations_for_agg(
+                    df, col_names, col_types, ['min', 'sum'])
+
+            expr2, new_col_names2, new_col_types2 = \
+                df_utils._construct_sql_expression_for_aggregations_for_agg(
+                    df, col_names, col_types, {'col1': ['min', 'sum'],
+                                               'col2': 'mean'})
+        """
+        # If the function is a time series aggregate, we process the aggregation differently.
+        # Also, one is not supposed to pass the below time series aggregates to DataFrame.agg():
+        #     ['bottom', 'bottom with ties', 'delta_t', 'mad', 'top', 'top with ties']
+        # Thus, no extra processing is required for time series aggregates over here.
+
+        if isinstance(func, ColumnExpression) or (isinstance(func, list) and isinstance(func[0], ColumnExpression)):
+            column_agg_expr = []
+            new_column_names = []
+            new_column_types = []
+            if isinstance(func, ColumnExpression):
+                func = UtilFuncs._as_list(func)
+
+            # Validate that func is a list of ColumnExpressions.
+            for expr in func:
+                if not isinstance(expr, ColumnExpression):
+                    raise TeradataMlException(Messages.get_message(
+                        MessageCodes.UNSUPPORTED_DATATYPE, 'func',
+                        ['str, dict, ColumnExpression or list of values of type(s): str, ColumnExpression']),
+                        MessageCodes.UNSUPPORTED_DATATYPE)
+
+            for operations in func:
+                alias = operations.alias_name
+                column_agg_expr.append(operations.compile_label(alias))
+                new_column_names.append(alias)
+                new_column_types.append(operations.type)
+            aggregate_expr = ", ".join(column_agg_expr)
+            return aggregate_expr, new_column_names, new_column_types
+
+        # 'operations' contains a dict of columns -> list of aggregate operations.
+        operations = DataFrameUtils._validate_agg_function(func, column_names)
+
+        all_valid_columns = []
+        all_invalid_columns = {}
+        all_new_column_names = []
+        all_new_column_types = []
+
+        # For each column, the value is True if there is at least one valid operation
+        # (an operation on a valid datatype).
+        column_supported = {}
+        tdp = preparer(td_dialect)
+        for column in operations:
+            column_supported[column] = False
+            valid_columns = []
+            invalid_columns = {}
+            new_column_names = []
+            new_column_types = []
+            for operation in operations[column]:
+                is_colop_supported, new_col, new_coltype, column_aggr_expr, invalid_column_info = \
+                    DataFrameUtils._generate_aggregate_column_expression(df=df, column=column, operation=operation,
+                                                                         describe_op=describe_op,
+                                                                         percentile=percentile,
+                                                                         tdp=tdp, **kwargs)
+                if is_colop_supported:
+                    column_supported[column] = is_colop_supported
+                    new_column_names.append(new_col)
+                    new_column_types.append(new_coltype)
+                    valid_columns.append(column_aggr_expr)
+                else:
+                    if operation in invalid_columns:
+                        invalid_columns[operation].append(invalid_column_info)
+                    else:
+                        invalid_columns[operation] = [invalid_column_info]
+
+            all_valid_columns.extend(valid_columns)
+            all_new_column_names.extend(new_column_names)
+            all_new_column_types.extend(new_column_types)
+
+            for operation in invalid_columns:
+                if operation in all_invalid_columns:
+                    all_invalid_columns[operation].extend(invalid_columns[operation])
+                else:
+                    all_invalid_columns[operation] = invalid_columns[operation]
+
+        unsupported_columns = [col for col in column_supported if not column_supported[col]]
+        unsupported_columns.sort()  # Helps in reporting the columns in lexicographic order.
+
+        error_msgs = []
+        for operation in sorted(all_invalid_columns):
+            # Sorting helps in reporting the columns in lexicographic order.
+            all_invalid_columns[operation].sort()
+            error = MessageCodes.TDMLDF_AGGREGATE_UNSUPPORTED.value.format(
+                ", ".join(all_invalid_columns[operation]), operation)
+            error_msgs.append(error)
+
+        if not all(column_supported[oper] for oper in column_supported):
+            new_msg = MessageCodes.TDMLDF_AGGREGATE_AGG_DICT_ERR.value.format(", ".join(unsupported_columns))
+            error_msgs.append(new_msg)
+            msg = Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs))
+            raise TeradataMlException(msg, MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
+
+        elif len(all_valid_columns) == 0:  # No supported columns in the given list of columns.
+            raise TeradataMlException(Messages.get_message(
+                MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR).format("\n".join(error_msgs)),
+                MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
+
+        aggregate_expr = ", ".join(all_valid_columns)
+        return aggregate_expr, all_new_column_names, all_new_column_types
+
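The unsupported-column bookkeeping above reduces to grouping '(column - TYPE)' strings per failing operation. A compact equivalent of that merge using dict.setdefault:

    # Group invalid '(column - TYPE)' strings per failing operation.
    all_invalid_columns = {}
    failures = [("sum", "(col1 - VARCHAR)"), ("sum", "(col3 - CLOB)"), ("mean", "(col1 - VARCHAR)")]
    for operation, info in failures:
        all_invalid_columns.setdefault(operation, []).append(info)
    print(all_invalid_columns)
    # {'sum': ['(col1 - VARCHAR)', '(col3 - CLOB)'], 'mean': ['(col1 - VARCHAR)']}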
+    @staticmethod
+    def _construct_sql_expression_for_time_series_aggregations(df, column_names, column_types, func, **kwargs):
+        """
+        Internal function to create and return the sql expression
+        corresponding to the given time series function, column_names and
+        column_types.
+
+        Column_types are used to check whether all the datatypes are
+        valid types for the given operation, and an exception is thrown
+        if they are not.
+
+        NOTE:
+            This function should be used only for time series aggregates.
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame which is to be used to get the desired
+                aggregate column expression.
+                Types: teradataml DataFrame
+
+            column_names:
+                Required Argument.
+                Specifies the column names for which the desired aggregate operation is
+                to be executed.
+                Types: List of strings
+
+            column_types:
+                Required Argument.
+                Specifies the respective column types for the column names.
+                Types: List of teradatasqlalchemy types
+
+            func:
+                Required Argument.
+                Specifies the aggregate function(s) to be applied on teradataml
+                DataFrame columns. For Time Series aggregates it is usually a string.
+                Types: str
+
+            kwargs:
+                Specifies miscellaneous keyword arguments that can be passed to aggregate functions.
+
+        RETURNS:
+            a) sql expression, such as
+               1. 'bottom(2, "col1") as "bottom2col1"' if col1 is a column
+                  in the DataFrame and the operation is 'bottom'
+               etc...
+            b) new columns' names (e.g. bottom2col1 ...)
+            c) new columns' types
+
+        RAISES:
+            None.
+
+        EXAMPLES:
+            colname_to_numvalues = {"col1": 2, "col2": 3}
+            kwargs = {"colname_to_numvalues": colname_to_numvalues}
+            aggregate_expr, column_names, column_types = \
+                df_utils._construct_sql_expression_for_time_series_aggregations(df, column_names, column_types,
+                                                                                func, **kwargs)
+        """
+
+        # e.g. of column_types: [VARCHAR(length=13), INTEGER(), VARCHAR(length=60), VARCHAR(length=5),
+        #                        FLOAT(precision=0)]
+
+        # e.g. of types of each column: <class 'teradatasqlalchemy.types.VARCHAR'>,
+        # <class 'teradatasqlalchemy.types.INTEGER'>, <class 'teradatasqlalchemy.types.FLOAT'>,
+        # <class 'teradatasqlalchemy.types.INTERVAL_MINUTE_TO_SECOND'> etc.
+
+        col_names_and_types = dict(zip(column_names, column_types))
+        tdp = preparer(td_dialect)
+
+        select_columns = []
+        new_column_names = []
+        new_column_types = []
+        if func in ["bottom", "bottom with ties", "top", "top with ties"]:
+            # Processing for bottom and top.
+            # Function name to be used in column aliasing.
+            column_alias_func = func.replace(" ", "_")
+            bottom_col_val = kwargs["colname_to_numvalues"]
+            for column in sorted(list(bottom_col_val.keys())):
+                new_col_name = "{2}{0}{1}".format(bottom_col_val[column], column, column_alias_func)
+                quoted_parent_column_name = tdp.quote("{0}".format(column))
+                quoted_new_column_name = tdp.quote(new_col_name)
+                select_columns.append("{0}({1}, {2}) as {3}".format(func, bottom_col_val[column],
+                                                                    quoted_parent_column_name,
+                                                                    quoted_new_column_name))
+                new_column_names.append(new_col_name)
+                new_column_types.append(col_names_and_types[column])
+
+        if func == "delta_t":
+            # Argument processing for DELTA_T.
+            new_column_names.append("delta_t_td_timecode")
+            quoted_new_column_name = tdp.quote(new_column_names[0])
+            new_column_types.append(PERIOD_TIMESTAMP)
+            select_columns.append("{0}((WHERE {1}), (WHERE {2})) as {3}".format(func, kwargs["start_condition"],
+                                                                                kwargs["end_condition"],
+                                                                                quoted_new_column_name))
+
+        if func == 'mad':
+            # Processing for Median Absolute Deviation.
+            # Function name to be used in column aliasing.
+            column_alias_func = func.replace(" ", "_")
+            bottom_col_val = kwargs["colname_to_numvalues"]
+            for column in sorted(list(bottom_col_val.keys())):
+                new_col_name = "{2}{0}{1}".format(bottom_col_val[column], column, column_alias_func)
+                quoted_parent_column_name = tdp.quote("{0}".format(column))
+                quoted_new_column_name = tdp.quote(new_col_name)
+                select_columns.append("{0}({1}, {2}) as {3}".format(func, bottom_col_val[column],
+                                                                    quoted_parent_column_name,
+                                                                    quoted_new_column_name))
+                new_column_names.append(new_col_name)
+                if type(col_names_and_types[column]) in [DECIMAL, NUMBER]:
+                    # If the column type is DECIMAL or NUMBER, then the output column type
+                    # should be the same. Otherwise, it is FLOAT.
+                    new_column_types.append(col_names_and_types[column])
+                else:
+                    new_column_types.append(FLOAT())
+
+            if "default_constant_for_columns" in kwargs.keys():
+                column_names = kwargs["default_constant_for_columns"]
+                column_types = [col_names_and_types[column] for column in column_names]
+                if len(column_names) > 0:
+                    aggregate_expr, all_new_column_names, all_new_column_types = \
+                        DataFrameUtils._construct_sql_expression_for_aggregations(df=df, column_names=column_names,
+                                                                                  column_types=column_types,
+                                                                                  func=func)
+                    aggregate_expr_default_column_list = [col.strip() for col in aggregate_expr.split(",")]
+                    select_columns = select_columns + aggregate_expr_default_column_list
+                    new_column_names = new_column_names + all_new_column_names
+                    new_column_types = new_column_types + all_new_column_types
+
+        aggregate_expr = ", ".join(select_columns)
+        return aggregate_expr, new_column_names, new_column_types
+
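Per the docstring, a 'bottom' aggregate with colname_to_numvalues={'col1': 2} compiles to a projection item like the one below (quoting shown inline here; the preparer normally applies it):

    func, n, col = "bottom", 2, "col1"
    select_item = '{0}({1}, "{2}") as "{0}{1}{2}"'.format(func, n, col)
    print(select_item)  # bottom(2, "col1") as "bottom2col1"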
+    @staticmethod
+    def _invalid_describe_column(df, columns, metaexpr, groupby_column_list):
+        """
+        Internal function to validate whether the columns provided to describe() are correct,
+        when the DataFrame is the output of groupby or groupby_time.
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame we are collecting statistics for.
+                Types: teradataml DataFrame
+
+            columns:
+                Optional Argument.
+                Specifies the name(s) of the columns we are collecting statistics for.
+                Types: str or List of strings (str)
+
+            metaexpr:
+                Required Argument.
+                Specifies the meta expression for the dataframe.
+                Types: _MetaExpression
+
+            groupby_column_list:
+                Optional Argument.
+                Specifies the group by columns for the dataframe.
+                Default Values: None.
+                Types: str or List of strings (str)
+
+        RETURNS:
+            None
+
+        RAISES:
+            TeradataMlException
+        """
+        invalid_columns = [_column for _column in groupby_column_list if columns is not None
+                           and _column in columns]
+        if len(invalid_columns) > 0:
+            all_columns = [col.name for col in metaexpr.c]
+            valid_columns = [item for item in all_columns if item not in groupby_column_list]
+            msg = Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN). \
+                format(", ".join(invalid_columns), 'columns', ", ".join(valid_columns))
+            raise TeradataMlException(msg, MessageCodes.TDMLDF_AGGREGATE_INVALID_COLUMN)
+
+    @staticmethod
+    def _construct_describe_query(df, columns, metaexpr, percentiles, function_label, groupby_column_list=None,
+                                  include=None, is_time_series_aggregate=False, verbose=False, distinct=False,
+                                  statistics=None, **kwargs):
+        """
+        Internal function to create the sql query for describe().
+
+        PARAMETERS:
+            df:
+                Required Argument.
+                Specifies the teradataml DataFrame we are collecting statistics for.
+                Types: teradataml DataFrame
+
+            columns:
+                Optional Argument.
+                Specifies the name(s) of the columns we are collecting statistics for.
+                Types: str or List of strings (str)
+
+            metaexpr:
+                Required Argument.
+                Specifies the meta expression for the dataframe.
+                Types: _MetaExpression
+
+            percentiles:
+                Required Argument.
+                Specifies a list of values between 0 and 1.
+                Types: List of floats
+
+            function_label:
+                Required Argument.
+                Specifies a string value used as the label for the aggregate function column.
+                Types: str
+
+            groupby_column_list:
+                Optional Argument.
+                Specifies the group by columns for the dataframe.
+                Default Values: None.
+                Types: str or List of strings (str)
+
+            include:
+                Optional Argument.
+                Specifies a string that must be "all" or None. If "all", then all columns are
+                included. Otherwise, only numeric columns are used for collecting statistics.
+                Default Values: None.
+                Types: str
+
+            is_time_series_aggregate:
+                Optional Argument.
+                Specifies a flag stating whether the describe operation is a time series
+                aggregate or not.
+                Default Values: False.
+                Types: bool
+
+            verbose:
+                Optional Argument.
+                Specifies a flag stating whether the DESCRIBE VERBOSE option for time series
+                aggregates is to be performed or not.
+                Default Values: False.
+                Types: bool
+
+            distinct:
+                Optional Argument.
+                Specifies a flag that decides whether to consider duplicate rows in the
+                calculation or not.
+                Default Values: False
+                Types: bool
+
+            statistics:
+                Optional Argument.
+                Specifies the aggregate operations to be used in place of the default
+                operators; honored only when 'include' is None.
+                Default Values: None.
+                Types: list of strings (str)
+
+            kwargs:
+                Optional Arguments.
+                Keyword arguments for time series aggregate functions.
+
+        RETURNS:
+            A SQL query like:
+                select 'count' as "func", cast(count("Feb") as Number) as "Feb", cast(count(accounts) as Number) as accounts from "PYUSER"."salesview"
+                union all
+                select 'mean' as "func", cast(avg("Feb") as Number) as "Feb", null as accounts from "PYUSER"."salesview"
+                union all
+                select 'std' as "func", cast(stddev_samp("Feb") as Number) as "Feb", null as accounts from "PYUSER"."salesview"
+                union all
+                select 'min' as "func", cast(min("Feb") as Number) as "Feb", cast(min(accounts) as Number) as accounts from "PYUSER"."salesview"
+                union all
+                select '25%' as "func", percentile_cont(0.25) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
+                union all
+                select '50%' as "func", percentile_cont(0.5) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
+                union all
+                select '75%' as "func", percentile_cont(0.75) within group(order by cast("Feb" as Number) ) as "Feb", null as accounts from "PYUSER"."salesview"
+                union all
+                select 'max' as "func", cast(max("Feb") as Number) as "Feb", cast(max(accounts) as Number) as accounts from "PYUSER"."salesview"
+
+        RAISES:
+            TeradataMlException
+
+        EXAMPLES:
+            agg_query = \
+                df_utils._construct_describe_query(df, None, self._metaexpr, [.25, .5, .75], "func",
+                                                   self.groupby_column_list)
+            agg_query = \
+                df_utils._construct_describe_query(df, None, self._metaexpr, [.3, .6], "func",
+                                                   self.groupby_column_list, include="all")
+        """
+        table_name = df._table_name
+        operators = ["count", "mean", "std", "min", "percentile", "max"]
+        all_operators = ["count", "unique", "mean", "std", "min", "percentile", "max"]
+
+        if is_time_series_aggregate and verbose:
+            # Time Series Aggregate Operators for the Vantage DESCRIBE function with verbose.
+            operators = ['max', 'mean', 'median', 'min', 'mode', "percentile", 'std']
+        elif is_time_series_aggregate and not verbose:
+            # Time Series Aggregate Operators for the Vantage DESCRIBE function.
+            operators = ['max', 'mean', 'min', 'std']
+
+        col_names = []
+        col_types = []
+        sel_agg_stmts = []
+        tdp = preparer(td_dialect)
+        quoted_function_label = tdp.quote(function_label)
+
+        if include is not None and include == 'all' and not is_time_series_aggregate:
+            operators = all_operators
+
+        if include is None and statistics is not None:
+            operators = statistics
+
+        table_name, sel_groupby, groupby = DataFrameUtils()._process_groupby_clause(table_name, groupby_column_list,
+                                                                                    is_time_series_aggregate,
+                                                                                    **kwargs)
+
+        for col in metaexpr.c:
+            if (include is None and type(col.type) in UtilFuncs()._get_numeric_datatypes()) \
+                    or include == 'all' or statistics is not None:
+                if not (groupby is not None and col.name in groupby_column_list):
+                    if columns is None or col.name in columns:
+                        col_names.append(col.name)
+                        col_types.append(col.type)
+
+        if len(col_names) == 0:
+            raise TeradataMlException(
+                Messages.get_message(MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR,
+                                     "The DataFrame does not contain numeric columns"),
+                MessageCodes.TDMLDF_AGGREGATE_COMBINED_ERR)
+        for op in operators:
+            if op == "percentile":
+                for p in percentiles:
+                    agg_expr, new_col_names, new_col_types = \
+                        DataFrameUtils._construct_sql_expression_for_aggregations(
+                            df, col_names, col_types, op, percentile=p, describe_op=True, distinct=distinct,
+                            as_time_series_aggregate=is_time_series_aggregate)
+                    sel_agg_stmts.append("SELECT \n\t{4} \n\tcast('{0}%' as varchar(6)) as \"{1}\", {2} from {3} ".format(
+                        int(p * 100), quoted_function_label, agg_expr, table_name, sel_groupby))
+            else:
+                agg_expr, new_col_names, new_col_types = \
+                    DataFrameUtils._construct_sql_expression_for_aggregations(
+                        df, col_names, col_types, op, describe_op=True, distinct=distinct,
+                        as_time_series_aggregate=is_time_series_aggregate)
+                sel_agg_stmts.append("SELECT \n\t{4} \n\tcast('{0}' as varchar(6)) as \"{1}\", \n\t{2} \nfrom \n\t{3} ".format(
+                    op, quoted_function_label, agg_expr, table_name, sel_groupby))
+        return " \nunion all\n ".join(sel_agg_stmts)
+
+    @staticmethod
+    def _process_groupby_clause(table_name, groupby_column_list, is_time_series_aggregate, **kwargs):
+        """
+        Internal function used to process and generate the GROUP BY or GROUP BY TIME clause
+        required for the query to be run for the describe operation.
+
+        PARAMETERS:
+            table_name:
+                Required Argument.
+                Specifies the table name to be used for forming the describe query.
+                Types: str
+
+            groupby_column_list:
+                Required Argument.
+                Specifies the list of column names involved in the Group By.
+                Types: List of Strings.
+
+            is_time_series_aggregate:
+                Required Argument.
+                Specifies a boolean stating whether the GROUP BY clause to be formed is for a
+                time series aggregate or not.
+                Types: bool
+
+            kwargs:
+                Optional Arguments.
+                Keyword arguments for time series aggregate functions.
+
+        RETURNS:
+            1. Table name appended with the GROUP BY clause.
+            2. Column projection string for the GROUP BY columns.
+            3. The GROUP BY clause.
+
+        RAISES:
+            None.
+
+        EXAMPLES:
+            table_name, sel_groupby, groupby = DataFrameUtils()._process_groupby_clause(table_name,
+                                                                                        groupby_column_list,
+                                                                                        is_time_series_aggregate,
+                                                                                        **kwargs)
+        """
+        sel_groupby = ""
+        grp_by_clause = None
+
+        if is_time_series_aggregate:
+            # For a time series aggregate, timebucket_duration is mandatory, so it will
+            # always be present in kwargs.
+            grp_by_clause = "GROUP BY TIME ({0}".format(kwargs['timebucket_duration'])
+
+            # Add the columns in the value expression to GROUP BY TIME.
+            if 'value_expression' in kwargs and \
+                    kwargs['value_expression'] is not None and \
+                    len(kwargs['value_expression']) > 0:
+                grp_by_clause = "{0} and {1}".format(grp_by_clause, ", ".join(kwargs['value_expression']))
+
+            # Complete the parenthesis for GROUP BY TIME.
+            grp_by_clause = "{0})".format(grp_by_clause)
+
+            # Add timecode column information.
+            if 'timecode_column' in kwargs and \
+                    kwargs['timecode_column'] is not None and \
+                    len(kwargs['timecode_column']) > 0:
+                if 'sequence_column' in kwargs and \
+                        kwargs['sequence_column'] is not None and \
+                        len(kwargs['sequence_column']) > 0:
+                    grp_by_clause = "{0} USING TIMECODE({1}, {2})".format(grp_by_clause, kwargs['timecode_column'],
+                                                                          kwargs['sequence_column'])
+                else:
+                    grp_by_clause = "{0} USING TIMECODE({1})".format(grp_by_clause, kwargs['timecode_column'])
+
+            # Add FILL information.
+            if 'fill' in kwargs and kwargs['fill'] is not None and len(kwargs['fill']) > 0:
+                grp_by_clause = "{0} FILL({1})".format(grp_by_clause, kwargs['fill'])
+
+        else:
+            if groupby_column_list is not None:
+                grp_by_clause = "GROUP BY {0}".format(",".join(groupby_column_list))
+
+        if grp_by_clause is not None:
+            table_name = "{0} \n{1}".format(table_name, grp_by_clause)
+            tdp = preparer(td_dialect)
+            for g in groupby_column_list:
+                if is_time_series_aggregate:
+                    if g == "TIMECODE_RANGE":
+                        g = "$TD_TIMECODE_RANGE"
+
+                    if "GROUP BY TIME" in g:
+                        g = "$TD_GROUP_BY_TIME"
+
+                quoted_name = tdp.quote(g)
+                sel_groupby += "{0}, ".format(quoted_name)
+
+        return table_name, sel_groupby, grp_by_clause
+
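Putting the branches above together for a time series case: with assumed inputs for timebucket_duration, value_expression, timecode_column and fill, the clause is assembled incrementally, mirroring the string building above (a sketch, not a call into teradataml):

    timebucket_duration = "MINUTES(10)"     # assumed inputs
    value_expression = ["buoyid"]
    timecode_column, fill = "TD_TIMECODE", "PREV"

    clause = "GROUP BY TIME ({0}".format(timebucket_duration)
    if value_expression:
        clause = "{0} and {1}".format(clause, ", ".join(value_expression))
    clause = "{0})".format(clause)
    if timecode_column:
        clause = "{0} USING TIMECODE({1})".format(clause, timecode_column)
    if fill:
        clause = "{0} FILL({1})".format(clause, fill)
    print(clause)
    # GROUP BY TIME (MINUTES(10) and buoyid) USING TIMECODE(TD_TIMECODE) FILL(PREV)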
+    @staticmethod
+    def _get_column_names_and_types_from_metaexpr(metaexpr):
+        """
+        Internal function to return column names and their respective types,
+        given a _metaexpr.
+
+        PARAMETERS:
+            metaexpr:
+                Required Argument.
+                The dataframe's metaexpr. It is used to get column names and types.
+                Types: MetaExpression
+
+        RETURNS:
+            Two lists - one for column names and another for column types.
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            df_utils._get_column_names_and_types_from_metaexpr(df._metaexpr)
+        """
+        # Construct new column names and types for the selected columns ONLY, using the parent _metaexpr.
+        col_names = []
+        col_types = []
+        for c in metaexpr.c:
+            col_names.append(c.name)
+            col_types.append(c.type)
+
+        return col_names, col_types
+
+    @staticmethod
+    def _insert_all_from_table(to_table_name, from_table_name, column_list, to_schema_name=None,
+                               from_schema_name=None, temporary=False):
+        """
+        Inserts all records from one table into the second, using columns ordered by the column list.
+
+        PARAMETERS:
+            to_table_name    - String specifying the name of the SQL table to insert into.
+            from_table_name  - String specifying the name of the SQL table to insert from.
+            column_list      - List of strings specifying the column names used in the insertion.
+            to_schema_name   - Name of the database schema to insert table data into.
+            from_schema_name - Name of the database schema to insert table data from.
+            temporary        - Specifies whether to create Vantage tables as permanent or volatile.
+                               Default: False
+                               Note: When True:
+                                   1. volatile tables are created, and
+                                   2. schema_name is ignored.
+                               When False, permanent tables are created.
+
+        RETURNS:
+            None
+
+        RAISES:
+            Database error if an error occurred while executing the insert command.
+
+        EXAMPLES:
+            df_utils._insert_all_from_table('table1_name', 'table2_name', ['col1', 'col2', 'col3'])
+        """
+        tdp = preparer(td_dialect)
+
+        # Construct the INSERT command.
+        column_order_string = ', '.join([tdp.quote("{0}".format(element)) for element in column_list])
+
+        # Generate the full name of the destination table.
+        if to_schema_name:
+            full_to_table_name = tdp.quote(to_schema_name) + "." + tdp.quote(to_table_name)
+        elif temporary:
+            full_to_table_name = tdp.quote(to_table_name)
+        else:
+            full_to_table_name = tdp.quote(_get_current_databasename()) + "." + tdp.quote(to_table_name)
+
+        # Generate the full name of the source table.
+        if from_schema_name:
+            full_from_table_name = tdp.quote(from_schema_name) + "." + tdp.quote(from_table_name)
+        else:
+            full_from_table_name = tdp.quote(_get_current_databasename()) + "." + tdp.quote(from_table_name)
+
+        insert_sql = SQLBundle._build_insert_from_table_query(full_to_table_name,
+                                                              full_from_table_name,
+                                                              column_order_string)
+        # Execute the INSERT command.
+        return UtilFuncs._execute_ddl_statement(insert_sql)
+
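The INSERT built here follows the usual insert-select pattern. A plausible shape of the generated statement, assuming SQLBundle._build_insert_from_table_query emits a standard INSERT ... SELECT (the exact template lives in sqlbundle.py and may differ):

    # Plausible shape only; the exact template lives in SQLBundle.
    to_tab, from_tab = '"mydb"."t1"', '"mydb"."t2"'
    cols = ", ".join(['"col1"', '"col2"', '"col3"'])
    insert_sql = "INSERT INTO {0} ({1}) SELECT {1} FROM {2}".format(to_tab, cols, from_tab)
    print(insert_sql)
    # INSERT INTO "mydb"."t1" ("col1", "col2", "col3") SELECT "col1", "col2", "col3" FROM "mydb"."t2"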
+    @staticmethod
+    def _dataframe_has_column(data, column):
+        """
+        Function to check whether the given column is present in the given dataframe or not.
+        This function is currently used only for Analytics wrappers.
+
+        PARAMETERS:
+            data   - teradataml DataFrame to check against for column existence.
+            column - Column name (a string).
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            DataFrameUtils._dataframe_has_column(data, col)
+        """
+        return column in [c.name for c in data._metaexpr.c]
+
+    @staticmethod
+    def _get_row_count(table_name):
+        """
+        Function to return the row count of a teradataml DataFrame.
+        This function is currently used to determine the shape/size of a dataframe.
+
+        PARAMETERS:
+            table_name - Name of the table to get the row count for.
+
+        RAISES:
+            TeradataMlException (TDMLDF_INFO_ERROR)
+
+        EXAMPLES:
+            DataFrameUtils._get_row_count(table_name)
+        """
+        # Construct the COUNT(*) query.
+        try:
+            row_count_query = SQLBundle._build_nrows_print_query(table_name)
+            res = execute_sql(row_count_query)
+            return res.fetchone()[0]
+
+        except TeradataMlException:
+            raise
+
+        except Exception as err:
+            # TODO: Better handle the level of information being presented to the user, with logging.
+            raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR) + str(err),
+                                      MessageCodes.TDMLDF_INFO_ERROR) from err
+
+    @staticmethod
+    def _get_scalar_value(table_name):
+        """
+        Function to return the only 1x1 (scalar) value from a teradataml DataFrame.
+
+        PARAMETERS:
+            table_name - Name of the table to get the value from.
+
+        RAISES:
+            TeradataMlException (TDMLDF_INFO_ERROR)
+
+        EXAMPLES:
+            DataFrameUtils._get_scalar_value(table_name)
+        """
+        # Construct the base query.
+        try:
+            select_query = SQLBundle._build_base_query(table_name)
+            res = execute_sql(select_query)
+            return res.fetchone()[0]
+
+        except TeradataMlException:
+            raise
+
+        except Exception as err:
+            # TODO: Better handle the level of information being presented to the user, with logging.
+            raise TeradataMlException(Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR) + str(err),
+                                      MessageCodes.TDMLDF_INFO_ERROR) from err
+
+    @staticmethod
+    def _get_sorted_nrow(df, n, sort_col, asc=True):
+        """
+        Internal utility function that returns a teradataml DataFrame containing n rows
+        of the DataFrame, sorted on the column specified in sort_col (typically the index
+        column, or the first column when there is no index column).
+
+        PARAMETERS:
+            df: teradataml DataFrame
+            n: Specifies the number of rows to select.
+               Type: int
+            sort_col: The column to sort on.
+               Type: str
+            asc: (optional) - Specifies the sort order.
+               If True, sort in ascending order.
+               If False, sort in descending order.
+               The default value is True.
+               Type: boolean
+
+        RETURNS:
+            teradataml DataFrame
+
+        EXAMPLES:
+            DataFrameUtils._get_sorted_nrow(df, 10, 'id')
+            DataFrameUtils._get_sorted_nrow(df, 20, 'id', asc=True)
+            DataFrameUtils._get_sorted_nrow(df, 30, 'id', asc=False)
+        """
+        # TODO: implement and use this in teradatasqlalchemy.
+        tdp = preparer(td_dialect)
+        aed_utils = AedUtils()
+
+        sort_order = "asc"
+        if not asc:
+            sort_order = "desc"
+
+        quoted_cols = [tdp.quote(c) for c in df.columns]
+        sel_cols_str = ",".join(quoted_cols)
+        sel_row_num = "row_number() over (order by \"{0}\" {1}) - 1 as tdml_row_num, {2}".format(sort_col,
+                                                                                                 sort_order,
+                                                                                                 sel_cols_str)
+        filter_str = "tdml_row_num < {0}".format(n)
+        sel_nodeid = aed_utils._aed_select(df._nodeid, sel_row_num)
+        fil_nodeid = aed_utils._aed_filter(sel_nodeid, filter_str)
+        sel2_nodeid = aed_utils._aed_select(fil_nodeid, sel_cols_str)
+        col_names, col_types = __class__._get_column_names_and_types_from_metaexpr(df._metaexpr)
+        new_metaexpr = UtilFuncs._get_metaexpr_using_columns(df._nodeid, zip(col_names, col_types))
+        # Call _from_node from the appropriate class, either DataFrame or GeoDataFrame.
+        new_df = df.__class__._from_node(sel2_nodeid, new_metaexpr, df._index_label)
+        new_df._orderby = df._orderby
+        new_df._metaexpr._n_rows = n
+        return new_df
+
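The select/filter/select node chain corresponds roughly to a row_number window query of the following shape (illustrative SQL only; the actual query text is generated by the AED layer, and 'mytab' is a placeholder):

    sort_col, n = "accounts", 10          # assumed inputs
    inner = ('select row_number() over (order by "{0}" asc) - 1 as tdml_row_num, * '
             'from mytab'.format(sort_col))
    query = 'select * from ({0}) d where tdml_row_num < {1}'.format(inner, n)
    print(query)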
+    @staticmethod
+    def _get_database_names(connection, schema_name):
+        """
+        Function to return a list of valid database names for a given sqlalchemy connection.
+        This function is used to determine whether the database used is valid in user APIs
+        such as copy_to_sql.
+
+        PARAMETERS:
+            connection: Required Argument.
+                A SQLAlchemy connection object.
+
+            schema_name: Required Argument.
+                String specifying the requested schema name.
+
+        RAISES:
+            TeradataMlException (TDMLDF_INFO_ERROR)
+
+        EXAMPLES:
+            DataFrameUtils._get_database_names(get_connection(), schema_name)
+        """
+        # TODO: implement and use this in teradatasqlalchemy.
+        table_obj = table('databasesV', column('databasename'), schema='dbc')
+        stmt = select(text(str(func.lower(table_obj.c.databasename)) + ' as databasename')).where(
+            text('databasename (NOT CASESPECIFIC) = {} (NOT CASESPECIFIC)'.format(':schema_name')))
+        stmt = text(str(stmt))
+        stmt = stmt.bindparams(schema_name=schema_name)
+        res = connection.execute(stmt).fetchall()
+        return [name.databasename for name in res]
+
+    @staticmethod
+    def _get_common_parent_df_from_dataframes(dfs):
+        """
+        Internal function to return the common parent dataframe from a given list of dataframes.
+        """
+        from teradataml import DataFrame, in_schema
+        aed_utils = AedUtils()
+        if len(dfs) == 1:
+            operation = aed_utils._aed_get_node_query_type(dfs[0]._nodeid)
+            if operation in ["table", "assign"]:
+                # Assign might have removed some columns; if there is only one dataframe,
+                # return that same dataframe. Also return the same dataframe if it is a
+                # DataFrame object created from a table.
+                return dfs[0]
+
+            # If it is a select node or any other node, get the parent node and execute it.
+            pids = aed_utils._aed_get_parent_nodeids(dfs[0]._nodeid)
+            if not aed_utils._aed_is_node_executed(pids[0]):
+                _ = DataFrameUtils._execute_node_return_db_object_name(pids[0])
+
+            tab_name_first = aed_utils._aed_get_source_tablename(pids[0])
+
+            db_schema = UtilFuncs._extract_db_name(tab_name_first)
+            db_table_name = UtilFuncs._extract_table_name(tab_name_first)
+
+            return DataFrame(in_schema(db_schema, db_table_name))
+
+        pids_first = None
+        parent_df = None
+        for i in range(len(dfs)):
+            pids = aed_utils._aed_get_parent_nodeids(dfs[i]._nodeid)
+
+            if parent_df is None:
+                if not aed_utils._aed_is_node_executed(pids[0]):
+                    _ = DataFrameUtils._execute_node_return_db_object_name(pids[0])
+
+                tab_name_first = aed_utils._aed_get_source_tablename(pids[0])
+
+                db_schema = UtilFuncs._extract_db_name(tab_name_first)
+                db_table_name = UtilFuncs._extract_table_name(tab_name_first)
+
+                parent_df = DataFrame(in_schema(db_schema, db_table_name))
+                pids_first = pids
+            else:
+                if pids_first != pids:
+                    raise TeradataMlException(Messages.get_message(MessageCodes.DFS_NO_COMMON_PARENT),
+                                              MessageCodes.DFS_NO_COMMON_PARENT)
+
+        return parent_df