teradataml 20.0.0.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- teradataml/LICENSE-3RD-PARTY.pdf +0 -0
- teradataml/LICENSE.pdf +0 -0
- teradataml/README.md +2762 -0
- teradataml/__init__.py +78 -0
- teradataml/_version.py +11 -0
- teradataml/analytics/Transformations.py +2996 -0
- teradataml/analytics/__init__.py +82 -0
- teradataml/analytics/analytic_function_executor.py +2416 -0
- teradataml/analytics/analytic_query_generator.py +1050 -0
- teradataml/analytics/byom/H2OPredict.py +514 -0
- teradataml/analytics/byom/PMMLPredict.py +437 -0
- teradataml/analytics/byom/__init__.py +16 -0
- teradataml/analytics/json_parser/__init__.py +133 -0
- teradataml/analytics/json_parser/analytic_functions_argument.py +1805 -0
- teradataml/analytics/json_parser/json_store.py +191 -0
- teradataml/analytics/json_parser/metadata.py +1666 -0
- teradataml/analytics/json_parser/utils.py +805 -0
- teradataml/analytics/meta_class.py +236 -0
- teradataml/analytics/sqle/DecisionTreePredict.py +456 -0
- teradataml/analytics/sqle/NaiveBayesPredict.py +420 -0
- teradataml/analytics/sqle/__init__.py +128 -0
- teradataml/analytics/sqle/json/decisiontreepredict_sqle.json +78 -0
- teradataml/analytics/sqle/json/naivebayespredict_sqle.json +62 -0
- teradataml/analytics/table_operator/__init__.py +11 -0
- teradataml/analytics/uaf/__init__.py +82 -0
- teradataml/analytics/utils.py +828 -0
- teradataml/analytics/valib.py +1617 -0
- teradataml/automl/__init__.py +5835 -0
- teradataml/automl/autodataprep/__init__.py +493 -0
- teradataml/automl/custom_json_utils.py +1625 -0
- teradataml/automl/data_preparation.py +1384 -0
- teradataml/automl/data_transformation.py +1254 -0
- teradataml/automl/feature_engineering.py +2273 -0
- teradataml/automl/feature_exploration.py +1873 -0
- teradataml/automl/model_evaluation.py +488 -0
- teradataml/automl/model_training.py +1407 -0
- teradataml/catalog/__init__.py +2 -0
- teradataml/catalog/byom.py +1759 -0
- teradataml/catalog/function_argument_mapper.py +859 -0
- teradataml/catalog/model_cataloging_utils.py +491 -0
- teradataml/clients/__init__.py +0 -0
- teradataml/clients/auth_client.py +137 -0
- teradataml/clients/keycloak_client.py +165 -0
- teradataml/clients/pkce_client.py +481 -0
- teradataml/common/__init__.py +1 -0
- teradataml/common/aed_utils.py +2078 -0
- teradataml/common/bulk_exposed_utils.py +113 -0
- teradataml/common/constants.py +1669 -0
- teradataml/common/deprecations.py +166 -0
- teradataml/common/exceptions.py +147 -0
- teradataml/common/formula.py +743 -0
- teradataml/common/garbagecollector.py +666 -0
- teradataml/common/logger.py +1261 -0
- teradataml/common/messagecodes.py +518 -0
- teradataml/common/messages.py +262 -0
- teradataml/common/pylogger.py +67 -0
- teradataml/common/sqlbundle.py +764 -0
- teradataml/common/td_coltype_code_to_tdtype.py +48 -0
- teradataml/common/utils.py +3166 -0
- teradataml/common/warnings.py +36 -0
- teradataml/common/wrapper_utils.py +625 -0
- teradataml/config/__init__.py +0 -0
- teradataml/config/dummy_file1.cfg +5 -0
- teradataml/config/dummy_file2.cfg +3 -0
- teradataml/config/sqlengine_alias_definitions_v1.0 +14 -0
- teradataml/config/sqlengine_alias_definitions_v1.1 +20 -0
- teradataml/config/sqlengine_alias_definitions_v1.3 +19 -0
- teradataml/context/__init__.py +0 -0
- teradataml/context/aed_context.py +223 -0
- teradataml/context/context.py +1462 -0
- teradataml/data/A_loan.csv +19 -0
- teradataml/data/BINARY_REALS_LEFT.csv +11 -0
- teradataml/data/BINARY_REALS_RIGHT.csv +11 -0
- teradataml/data/B_loan.csv +49 -0
- teradataml/data/BuoyData2.csv +17 -0
- teradataml/data/CONVOLVE2_COMPLEX_LEFT.csv +5 -0
- teradataml/data/CONVOLVE2_COMPLEX_RIGHT.csv +5 -0
- teradataml/data/Convolve2RealsLeft.csv +5 -0
- teradataml/data/Convolve2RealsRight.csv +5 -0
- teradataml/data/Convolve2ValidLeft.csv +11 -0
- teradataml/data/Convolve2ValidRight.csv +11 -0
- teradataml/data/DFFTConv_Real_8_8.csv +65 -0
- teradataml/data/Employee.csv +5 -0
- teradataml/data/Employee_Address.csv +4 -0
- teradataml/data/Employee_roles.csv +5 -0
- teradataml/data/JulesBelvezeDummyData.csv +100 -0
- teradataml/data/Mall_customer_data.csv +201 -0
- teradataml/data/Orders1_12mf.csv +25 -0
- teradataml/data/Pi_loan.csv +7 -0
- teradataml/data/SMOOTHED_DATA.csv +7 -0
- teradataml/data/TestDFFT8.csv +9 -0
- teradataml/data/TestRiver.csv +109 -0
- teradataml/data/Traindata.csv +28 -0
- teradataml/data/__init__.py +0 -0
- teradataml/data/acf.csv +17 -0
- teradataml/data/adaboost_example.json +34 -0
- teradataml/data/adaboostpredict_example.json +24 -0
- teradataml/data/additional_table.csv +11 -0
- teradataml/data/admissions_test.csv +21 -0
- teradataml/data/admissions_train.csv +41 -0
- teradataml/data/admissions_train_nulls.csv +41 -0
- teradataml/data/advertising.csv +201 -0
- teradataml/data/ageandheight.csv +13 -0
- teradataml/data/ageandpressure.csv +31 -0
- teradataml/data/amazon_reviews_25.csv +26 -0
- teradataml/data/antiselect_example.json +36 -0
- teradataml/data/antiselect_input.csv +8 -0
- teradataml/data/antiselect_input_mixed_case.csv +8 -0
- teradataml/data/applicant_external.csv +7 -0
- teradataml/data/applicant_reference.csv +7 -0
- teradataml/data/apriori_example.json +22 -0
- teradataml/data/arima_example.json +9 -0
- teradataml/data/assortedtext_input.csv +8 -0
- teradataml/data/attribution_example.json +34 -0
- teradataml/data/attribution_sample_table.csv +27 -0
- teradataml/data/attribution_sample_table1.csv +6 -0
- teradataml/data/attribution_sample_table2.csv +11 -0
- teradataml/data/bank_churn.csv +10001 -0
- teradataml/data/bank_marketing.csv +11163 -0
- teradataml/data/bank_web_clicks1.csv +43 -0
- teradataml/data/bank_web_clicks2.csv +91 -0
- teradataml/data/bank_web_url.csv +85 -0
- teradataml/data/barrier.csv +2 -0
- teradataml/data/barrier_new.csv +3 -0
- teradataml/data/betweenness_example.json +14 -0
- teradataml/data/bike_sharing.csv +732 -0
- teradataml/data/bin_breaks.csv +8 -0
- teradataml/data/bin_fit_ip.csv +4 -0
- teradataml/data/binary_complex_left.csv +11 -0
- teradataml/data/binary_complex_right.csv +11 -0
- teradataml/data/binary_matrix_complex_left.csv +21 -0
- teradataml/data/binary_matrix_complex_right.csv +21 -0
- teradataml/data/binary_matrix_real_left.csv +21 -0
- teradataml/data/binary_matrix_real_right.csv +21 -0
- teradataml/data/blood2ageandweight.csv +26 -0
- teradataml/data/bmi.csv +501 -0
- teradataml/data/boston.csv +507 -0
- teradataml/data/boston2cols.csv +721 -0
- teradataml/data/breast_cancer.csv +570 -0
- teradataml/data/buoydata_mix.csv +11 -0
- teradataml/data/burst_data.csv +5 -0
- teradataml/data/burst_example.json +21 -0
- teradataml/data/byom_example.json +34 -0
- teradataml/data/bytes_table.csv +4 -0
- teradataml/data/cal_housing_ex_raw.csv +70 -0
- teradataml/data/callers.csv +7 -0
- teradataml/data/calls.csv +10 -0
- teradataml/data/cars_hist.csv +33 -0
- teradataml/data/cat_table.csv +25 -0
- teradataml/data/ccm_example.json +32 -0
- teradataml/data/ccm_input.csv +91 -0
- teradataml/data/ccm_input2.csv +13 -0
- teradataml/data/ccmexample.csv +101 -0
- teradataml/data/ccmprepare_example.json +9 -0
- teradataml/data/ccmprepare_input.csv +91 -0
- teradataml/data/cfilter_example.json +12 -0
- teradataml/data/changepointdetection_example.json +18 -0
- teradataml/data/changepointdetectionrt_example.json +8 -0
- teradataml/data/chi_sq.csv +3 -0
- teradataml/data/churn_data.csv +14 -0
- teradataml/data/churn_emission.csv +35 -0
- teradataml/data/churn_initial.csv +3 -0
- teradataml/data/churn_state_transition.csv +5 -0
- teradataml/data/citedges_2.csv +745 -0
- teradataml/data/citvertices_2.csv +1210 -0
- teradataml/data/clicks2.csv +16 -0
- teradataml/data/clickstream.csv +13 -0
- teradataml/data/clickstream1.csv +11 -0
- teradataml/data/closeness_example.json +16 -0
- teradataml/data/complaints.csv +21 -0
- teradataml/data/complaints_mini.csv +3 -0
- teradataml/data/complaints_test_tokenized.csv +353 -0
- teradataml/data/complaints_testtoken.csv +224 -0
- teradataml/data/complaints_tokens_model.csv +348 -0
- teradataml/data/complaints_tokens_test.csv +353 -0
- teradataml/data/complaints_traintoken.csv +472 -0
- teradataml/data/computers_category.csv +1001 -0
- teradataml/data/computers_test1.csv +1252 -0
- teradataml/data/computers_train1.csv +5009 -0
- teradataml/data/computers_train1_clustered.csv +5009 -0
- teradataml/data/confusionmatrix_example.json +9 -0
- teradataml/data/conversion_event_table.csv +3 -0
- teradataml/data/corr_input.csv +17 -0
- teradataml/data/correlation_example.json +11 -0
- teradataml/data/covid_confirm_sd.csv +83 -0
- teradataml/data/coxhazardratio_example.json +39 -0
- teradataml/data/coxph_example.json +15 -0
- teradataml/data/coxsurvival_example.json +28 -0
- teradataml/data/cpt.csv +41 -0
- teradataml/data/credit_ex_merged.csv +45 -0
- teradataml/data/creditcard_data.csv +1001 -0
- teradataml/data/customer_loyalty.csv +301 -0
- teradataml/data/customer_loyalty_newseq.csv +31 -0
- teradataml/data/customer_segmentation_test.csv +2628 -0
- teradataml/data/customer_segmentation_train.csv +8069 -0
- teradataml/data/dataframe_example.json +173 -0
- teradataml/data/decisionforest_example.json +37 -0
- teradataml/data/decisionforestpredict_example.json +38 -0
- teradataml/data/decisiontree_example.json +21 -0
- teradataml/data/decisiontreepredict_example.json +45 -0
- teradataml/data/dfft2_size4_real.csv +17 -0
- teradataml/data/dfft2_test_matrix16.csv +17 -0
- teradataml/data/dfft2conv_real_4_4.csv +65 -0
- teradataml/data/diabetes.csv +443 -0
- teradataml/data/diabetes_test.csv +89 -0
- teradataml/data/dict_table.csv +5 -0
- teradataml/data/docperterm_table.csv +4 -0
- teradataml/data/docs/__init__.py +1 -0
- teradataml/data/docs/byom/__init__.py +0 -0
- teradataml/data/docs/byom/docs/DataRobotPredict.py +180 -0
- teradataml/data/docs/byom/docs/DataikuPredict.py +217 -0
- teradataml/data/docs/byom/docs/H2OPredict.py +325 -0
- teradataml/data/docs/byom/docs/ONNXEmbeddings.py +242 -0
- teradataml/data/docs/byom/docs/ONNXPredict.py +283 -0
- teradataml/data/docs/byom/docs/ONNXSeq2Seq.py +255 -0
- teradataml/data/docs/byom/docs/PMMLPredict.py +278 -0
- teradataml/data/docs/byom/docs/__init__.py +0 -0
- teradataml/data/docs/sqle/__init__.py +0 -0
- teradataml/data/docs/sqle/docs_17_10/Antiselect.py +83 -0
- teradataml/data/docs/sqle/docs_17_10/Attribution.py +200 -0
- teradataml/data/docs/sqle/docs_17_10/BincodeFit.py +172 -0
- teradataml/data/docs/sqle/docs_17_10/BincodeTransform.py +131 -0
- teradataml/data/docs/sqle/docs_17_10/CategoricalSummary.py +86 -0
- teradataml/data/docs/sqle/docs_17_10/ChiSq.py +90 -0
- teradataml/data/docs/sqle/docs_17_10/ColumnSummary.py +86 -0
- teradataml/data/docs/sqle/docs_17_10/ConvertTo.py +96 -0
- teradataml/data/docs/sqle/docs_17_10/DecisionForestPredict.py +139 -0
- teradataml/data/docs/sqle/docs_17_10/DecisionTreePredict.py +152 -0
- teradataml/data/docs/sqle/docs_17_10/FTest.py +161 -0
- teradataml/data/docs/sqle/docs_17_10/FillRowId.py +83 -0
- teradataml/data/docs/sqle/docs_17_10/Fit.py +88 -0
- teradataml/data/docs/sqle/docs_17_10/GLMPredict.py +144 -0
- teradataml/data/docs/sqle/docs_17_10/GetRowsWithMissingValues.py +85 -0
- teradataml/data/docs/sqle/docs_17_10/GetRowsWithoutMissingValues.py +82 -0
- teradataml/data/docs/sqle/docs_17_10/Histogram.py +165 -0
- teradataml/data/docs/sqle/docs_17_10/MovingAverage.py +134 -0
- teradataml/data/docs/sqle/docs_17_10/NGramSplitter.py +209 -0
- teradataml/data/docs/sqle/docs_17_10/NPath.py +266 -0
- teradataml/data/docs/sqle/docs_17_10/NaiveBayesPredict.py +116 -0
- teradataml/data/docs/sqle/docs_17_10/NaiveBayesTextClassifierPredict.py +176 -0
- teradataml/data/docs/sqle/docs_17_10/NumApply.py +147 -0
- teradataml/data/docs/sqle/docs_17_10/OneHotEncodingFit.py +135 -0
- teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +109 -0
- teradataml/data/docs/sqle/docs_17_10/OutlierFilterFit.py +166 -0
- teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +105 -0
- teradataml/data/docs/sqle/docs_17_10/Pack.py +128 -0
- teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesFit.py +112 -0
- teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesTransform.py +102 -0
- teradataml/data/docs/sqle/docs_17_10/QQNorm.py +105 -0
- teradataml/data/docs/sqle/docs_17_10/RoundColumns.py +110 -0
- teradataml/data/docs/sqle/docs_17_10/RowNormalizeFit.py +118 -0
- teradataml/data/docs/sqle/docs_17_10/RowNormalizeTransform.py +99 -0
- teradataml/data/docs/sqle/docs_17_10/SVMSparsePredict.py +153 -0
- teradataml/data/docs/sqle/docs_17_10/ScaleFit.py +197 -0
- teradataml/data/docs/sqle/docs_17_10/ScaleTransform.py +99 -0
- teradataml/data/docs/sqle/docs_17_10/Sessionize.py +114 -0
- teradataml/data/docs/sqle/docs_17_10/SimpleImputeFit.py +116 -0
- teradataml/data/docs/sqle/docs_17_10/SimpleImputeTransform.py +98 -0
- teradataml/data/docs/sqle/docs_17_10/StrApply.py +187 -0
- teradataml/data/docs/sqle/docs_17_10/StringSimilarity.py +146 -0
- teradataml/data/docs/sqle/docs_17_10/Transform.py +105 -0
- teradataml/data/docs/sqle/docs_17_10/UnivariateStatistics.py +142 -0
- teradataml/data/docs/sqle/docs_17_10/Unpack.py +214 -0
- teradataml/data/docs/sqle/docs_17_10/WhichMax.py +83 -0
- teradataml/data/docs/sqle/docs_17_10/WhichMin.py +83 -0
- teradataml/data/docs/sqle/docs_17_10/ZTest.py +155 -0
- teradataml/data/docs/sqle/docs_17_10/__init__.py +0 -0
- teradataml/data/docs/sqle/docs_17_20/ANOVA.py +186 -0
- teradataml/data/docs/sqle/docs_17_20/Antiselect.py +83 -0
- teradataml/data/docs/sqle/docs_17_20/Apriori.py +138 -0
- teradataml/data/docs/sqle/docs_17_20/Attribution.py +201 -0
- teradataml/data/docs/sqle/docs_17_20/BincodeFit.py +172 -0
- teradataml/data/docs/sqle/docs_17_20/BincodeTransform.py +139 -0
- teradataml/data/docs/sqle/docs_17_20/CFilter.py +132 -0
- teradataml/data/docs/sqle/docs_17_20/CategoricalSummary.py +86 -0
- teradataml/data/docs/sqle/docs_17_20/ChiSq.py +90 -0
- teradataml/data/docs/sqle/docs_17_20/ClassificationEvaluator.py +166 -0
- teradataml/data/docs/sqle/docs_17_20/ColumnSummary.py +86 -0
- teradataml/data/docs/sqle/docs_17_20/ColumnTransformer.py +246 -0
- teradataml/data/docs/sqle/docs_17_20/ConvertTo.py +113 -0
- teradataml/data/docs/sqle/docs_17_20/DecisionForest.py +280 -0
- teradataml/data/docs/sqle/docs_17_20/DecisionForestPredict.py +144 -0
- teradataml/data/docs/sqle/docs_17_20/DecisionTreePredict.py +136 -0
- teradataml/data/docs/sqle/docs_17_20/FTest.py +240 -0
- teradataml/data/docs/sqle/docs_17_20/FillRowId.py +83 -0
- teradataml/data/docs/sqle/docs_17_20/Fit.py +88 -0
- teradataml/data/docs/sqle/docs_17_20/GLM.py +541 -0
- teradataml/data/docs/sqle/docs_17_20/GLMPerSegment.py +415 -0
- teradataml/data/docs/sqle/docs_17_20/GLMPredict.py +144 -0
- teradataml/data/docs/sqle/docs_17_20/GLMPredictPerSegment.py +233 -0
- teradataml/data/docs/sqle/docs_17_20/GetFutileColumns.py +125 -0
- teradataml/data/docs/sqle/docs_17_20/GetRowsWithMissingValues.py +109 -0
- teradataml/data/docs/sqle/docs_17_20/GetRowsWithoutMissingValues.py +106 -0
- teradataml/data/docs/sqle/docs_17_20/Histogram.py +224 -0
- teradataml/data/docs/sqle/docs_17_20/KMeans.py +251 -0
- teradataml/data/docs/sqle/docs_17_20/KMeansPredict.py +144 -0
- teradataml/data/docs/sqle/docs_17_20/KNN.py +215 -0
- teradataml/data/docs/sqle/docs_17_20/MovingAverage.py +134 -0
- teradataml/data/docs/sqle/docs_17_20/NERExtractor.py +121 -0
- teradataml/data/docs/sqle/docs_17_20/NGramSplitter.py +209 -0
- teradataml/data/docs/sqle/docs_17_20/NPath.py +266 -0
- teradataml/data/docs/sqle/docs_17_20/NaiveBayes.py +162 -0
- teradataml/data/docs/sqle/docs_17_20/NaiveBayesPredict.py +116 -0
- teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierPredict.py +177 -0
- teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierTrainer.py +127 -0
- teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +119 -0
- teradataml/data/docs/sqle/docs_17_20/NonLinearCombineTransform.py +112 -0
- teradataml/data/docs/sqle/docs_17_20/NumApply.py +147 -0
- teradataml/data/docs/sqle/docs_17_20/OneClassSVM.py +307 -0
- teradataml/data/docs/sqle/docs_17_20/OneClassSVMPredict.py +185 -0
- teradataml/data/docs/sqle/docs_17_20/OneHotEncodingFit.py +231 -0
- teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +121 -0
- teradataml/data/docs/sqle/docs_17_20/OrdinalEncodingFit.py +220 -0
- teradataml/data/docs/sqle/docs_17_20/OrdinalEncodingTransform.py +127 -0
- teradataml/data/docs/sqle/docs_17_20/OutlierFilterFit.py +191 -0
- teradataml/data/docs/sqle/docs_17_20/OutlierFilterTransform.py +117 -0
- teradataml/data/docs/sqle/docs_17_20/Pack.py +128 -0
- teradataml/data/docs/sqle/docs_17_20/Pivoting.py +279 -0
- teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesFit.py +112 -0
- teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesTransform.py +112 -0
- teradataml/data/docs/sqle/docs_17_20/QQNorm.py +105 -0
- teradataml/data/docs/sqle/docs_17_20/ROC.py +164 -0
- teradataml/data/docs/sqle/docs_17_20/RandomProjectionFit.py +155 -0
- teradataml/data/docs/sqle/docs_17_20/RandomProjectionMinComponents.py +106 -0
- teradataml/data/docs/sqle/docs_17_20/RandomProjectionTransform.py +120 -0
- teradataml/data/docs/sqle/docs_17_20/RegressionEvaluator.py +211 -0
- teradataml/data/docs/sqle/docs_17_20/RoundColumns.py +109 -0
- teradataml/data/docs/sqle/docs_17_20/RowNormalizeFit.py +118 -0
- teradataml/data/docs/sqle/docs_17_20/RowNormalizeTransform.py +111 -0
- teradataml/data/docs/sqle/docs_17_20/SMOTE.py +212 -0
- teradataml/data/docs/sqle/docs_17_20/SVM.py +414 -0
- teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +213 -0
- teradataml/data/docs/sqle/docs_17_20/SVMSparsePredict.py +153 -0
- teradataml/data/docs/sqle/docs_17_20/ScaleFit.py +315 -0
- teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +202 -0
- teradataml/data/docs/sqle/docs_17_20/SentimentExtractor.py +206 -0
- teradataml/data/docs/sqle/docs_17_20/Sessionize.py +114 -0
- teradataml/data/docs/sqle/docs_17_20/Shap.py +225 -0
- teradataml/data/docs/sqle/docs_17_20/Silhouette.py +153 -0
- teradataml/data/docs/sqle/docs_17_20/SimpleImputeFit.py +116 -0
- teradataml/data/docs/sqle/docs_17_20/SimpleImputeTransform.py +109 -0
- teradataml/data/docs/sqle/docs_17_20/StrApply.py +187 -0
- teradataml/data/docs/sqle/docs_17_20/StringSimilarity.py +146 -0
- teradataml/data/docs/sqle/docs_17_20/TDDecisionForestPredict.py +207 -0
- teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +333 -0
- teradataml/data/docs/sqle/docs_17_20/TDNaiveBayesPredict.py +189 -0
- teradataml/data/docs/sqle/docs_17_20/TFIDF.py +142 -0
- teradataml/data/docs/sqle/docs_17_20/TargetEncodingFit.py +267 -0
- teradataml/data/docs/sqle/docs_17_20/TargetEncodingTransform.py +141 -0
- teradataml/data/docs/sqle/docs_17_20/TextMorph.py +119 -0
- teradataml/data/docs/sqle/docs_17_20/TextParser.py +224 -0
- teradataml/data/docs/sqle/docs_17_20/TrainTestSplit.py +160 -0
- teradataml/data/docs/sqle/docs_17_20/Transform.py +123 -0
- teradataml/data/docs/sqle/docs_17_20/UnivariateStatistics.py +142 -0
- teradataml/data/docs/sqle/docs_17_20/Unpack.py +214 -0
- teradataml/data/docs/sqle/docs_17_20/Unpivoting.py +216 -0
- teradataml/data/docs/sqle/docs_17_20/VectorDistance.py +169 -0
- teradataml/data/docs/sqle/docs_17_20/WhichMax.py +83 -0
- teradataml/data/docs/sqle/docs_17_20/WhichMin.py +83 -0
- teradataml/data/docs/sqle/docs_17_20/WordEmbeddings.py +237 -0
- teradataml/data/docs/sqle/docs_17_20/XGBoost.py +362 -0
- teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +281 -0
- teradataml/data/docs/sqle/docs_17_20/ZTest.py +220 -0
- teradataml/data/docs/sqle/docs_17_20/__init__.py +0 -0
- teradataml/data/docs/tableoperator/__init__.py +0 -0
- teradataml/data/docs/tableoperator/docs_17_00/ReadNOS.py +430 -0
- teradataml/data/docs/tableoperator/docs_17_00/__init__.py +0 -0
- teradataml/data/docs/tableoperator/docs_17_05/ReadNOS.py +430 -0
- teradataml/data/docs/tableoperator/docs_17_05/WriteNOS.py +348 -0
- teradataml/data/docs/tableoperator/docs_17_05/__init__.py +0 -0
- teradataml/data/docs/tableoperator/docs_17_10/ReadNOS.py +429 -0
- teradataml/data/docs/tableoperator/docs_17_10/WriteNOS.py +348 -0
- teradataml/data/docs/tableoperator/docs_17_10/__init__.py +0 -0
- teradataml/data/docs/tableoperator/docs_17_20/Image2Matrix.py +118 -0
- teradataml/data/docs/tableoperator/docs_17_20/ReadNOS.py +440 -0
- teradataml/data/docs/tableoperator/docs_17_20/WriteNOS.py +387 -0
- teradataml/data/docs/tableoperator/docs_17_20/__init__.py +0 -0
- teradataml/data/docs/uaf/__init__.py +0 -0
- teradataml/data/docs/uaf/docs_17_20/ACF.py +186 -0
- teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +370 -0
- teradataml/data/docs/uaf/docs_17_20/ArimaForecast.py +172 -0
- teradataml/data/docs/uaf/docs_17_20/ArimaValidate.py +161 -0
- teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +293 -0
- teradataml/data/docs/uaf/docs_17_20/AutoArima.py +354 -0
- teradataml/data/docs/uaf/docs_17_20/BinaryMatrixOp.py +248 -0
- teradataml/data/docs/uaf/docs_17_20/BinarySeriesOp.py +252 -0
- teradataml/data/docs/uaf/docs_17_20/BreuschGodfrey.py +178 -0
- teradataml/data/docs/uaf/docs_17_20/BreuschPaganGodfrey.py +175 -0
- teradataml/data/docs/uaf/docs_17_20/Convolve.py +230 -0
- teradataml/data/docs/uaf/docs_17_20/Convolve2.py +218 -0
- teradataml/data/docs/uaf/docs_17_20/CopyArt.py +145 -0
- teradataml/data/docs/uaf/docs_17_20/CumulPeriodogram.py +185 -0
- teradataml/data/docs/uaf/docs_17_20/DFFT.py +204 -0
- teradataml/data/docs/uaf/docs_17_20/DFFT2.py +216 -0
- teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +216 -0
- teradataml/data/docs/uaf/docs_17_20/DFFTConv.py +192 -0
- teradataml/data/docs/uaf/docs_17_20/DIFF.py +175 -0
- teradataml/data/docs/uaf/docs_17_20/DTW.py +180 -0
- teradataml/data/docs/uaf/docs_17_20/DWT.py +235 -0
- teradataml/data/docs/uaf/docs_17_20/DWT2D.py +217 -0
- teradataml/data/docs/uaf/docs_17_20/DickeyFuller.py +142 -0
- teradataml/data/docs/uaf/docs_17_20/DurbinWatson.py +184 -0
- teradataml/data/docs/uaf/docs_17_20/ExtractResults.py +185 -0
- teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +160 -0
- teradataml/data/docs/uaf/docs_17_20/FitMetrics.py +172 -0
- teradataml/data/docs/uaf/docs_17_20/GenseriesFormula.py +206 -0
- teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +143 -0
- teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +198 -0
- teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +260 -0
- teradataml/data/docs/uaf/docs_17_20/IDFFT.py +165 -0
- teradataml/data/docs/uaf/docs_17_20/IDFFT2.py +191 -0
- teradataml/data/docs/uaf/docs_17_20/IDWT.py +236 -0
- teradataml/data/docs/uaf/docs_17_20/IDWT2D.py +226 -0
- teradataml/data/docs/uaf/docs_17_20/IQR.py +134 -0
- teradataml/data/docs/uaf/docs_17_20/InputValidator.py +121 -0
- teradataml/data/docs/uaf/docs_17_20/LineSpec.py +156 -0
- teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +215 -0
- teradataml/data/docs/uaf/docs_17_20/MAMean.py +174 -0
- teradataml/data/docs/uaf/docs_17_20/MInfo.py +134 -0
- teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +297 -0
- teradataml/data/docs/uaf/docs_17_20/MatrixMultiply.py +145 -0
- teradataml/data/docs/uaf/docs_17_20/MultivarRegr.py +191 -0
- teradataml/data/docs/uaf/docs_17_20/PACF.py +157 -0
- teradataml/data/docs/uaf/docs_17_20/Portman.py +217 -0
- teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +203 -0
- teradataml/data/docs/uaf/docs_17_20/PowerTransform.py +155 -0
- teradataml/data/docs/uaf/docs_17_20/Resample.py +237 -0
- teradataml/data/docs/uaf/docs_17_20/SAX.py +246 -0
- teradataml/data/docs/uaf/docs_17_20/SInfo.py +123 -0
- teradataml/data/docs/uaf/docs_17_20/SeasonalNormalize.py +173 -0
- teradataml/data/docs/uaf/docs_17_20/SelectionCriteria.py +174 -0
- teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +171 -0
- teradataml/data/docs/uaf/docs_17_20/SignifResidmean.py +164 -0
- teradataml/data/docs/uaf/docs_17_20/SimpleExp.py +180 -0
- teradataml/data/docs/uaf/docs_17_20/Smoothma.py +208 -0
- teradataml/data/docs/uaf/docs_17_20/TrackingOp.py +151 -0
- teradataml/data/docs/uaf/docs_17_20/UNDIFF.py +171 -0
- teradataml/data/docs/uaf/docs_17_20/Unnormalize.py +202 -0
- teradataml/data/docs/uaf/docs_17_20/WhitesGeneral.py +171 -0
- teradataml/data/docs/uaf/docs_17_20/WindowDFFT.py +368 -0
- teradataml/data/docs/uaf/docs_17_20/__init__.py +0 -0
- teradataml/data/dtw_example.json +18 -0
- teradataml/data/dtw_t1.csv +11 -0
- teradataml/data/dtw_t2.csv +4 -0
- teradataml/data/dwt2d_dataTable.csv +65 -0
- teradataml/data/dwt2d_example.json +16 -0
- teradataml/data/dwt_dataTable.csv +8 -0
- teradataml/data/dwt_example.json +15 -0
- teradataml/data/dwt_filterTable.csv +3 -0
- teradataml/data/dwt_filter_dim.csv +5 -0
- teradataml/data/emission.csv +9 -0
- teradataml/data/emp_table_by_dept.csv +19 -0
- teradataml/data/employee_info.csv +4 -0
- teradataml/data/employee_table.csv +6 -0
- teradataml/data/excluding_event_table.csv +2 -0
- teradataml/data/finance_data.csv +6 -0
- teradataml/data/finance_data2.csv +61 -0
- teradataml/data/finance_data3.csv +93 -0
- teradataml/data/finance_data4.csv +13 -0
- teradataml/data/fish.csv +160 -0
- teradataml/data/fm_blood2ageandweight.csv +26 -0
- teradataml/data/fmeasure_example.json +12 -0
- teradataml/data/followers_leaders.csv +10 -0
- teradataml/data/fpgrowth_example.json +12 -0
- teradataml/data/frequentpaths_example.json +29 -0
- teradataml/data/friends.csv +9 -0
- teradataml/data/fs_input.csv +33 -0
- teradataml/data/fs_input1.csv +33 -0
- teradataml/data/genData.csv +513 -0
- teradataml/data/geodataframe_example.json +40 -0
- teradataml/data/glass_types.csv +215 -0
- teradataml/data/glm_admissions_model.csv +12 -0
- teradataml/data/glm_example.json +56 -0
- teradataml/data/glml1l2_example.json +28 -0
- teradataml/data/glml1l2predict_example.json +54 -0
- teradataml/data/glmpredict_example.json +54 -0
- teradataml/data/gq_t1.csv +21 -0
- teradataml/data/grocery_transaction.csv +19 -0
- teradataml/data/hconvolve_complex_right.csv +5 -0
- teradataml/data/hconvolve_complex_rightmulti.csv +5 -0
- teradataml/data/histogram_example.json +12 -0
- teradataml/data/hmmdecoder_example.json +79 -0
- teradataml/data/hmmevaluator_example.json +25 -0
- teradataml/data/hmmsupervised_example.json +10 -0
- teradataml/data/hmmunsupervised_example.json +8 -0
- teradataml/data/hnsw_alter_data.csv +5 -0
- teradataml/data/hnsw_data.csv +10 -0
- teradataml/data/house_values.csv +12 -0
- teradataml/data/house_values2.csv +13 -0
- teradataml/data/housing_cat.csv +7 -0
- teradataml/data/housing_data.csv +9 -0
- teradataml/data/housing_test.csv +47 -0
- teradataml/data/housing_test_binary.csv +47 -0
- teradataml/data/housing_train.csv +493 -0
- teradataml/data/housing_train_attribute.csv +5 -0
- teradataml/data/housing_train_binary.csv +437 -0
- teradataml/data/housing_train_parameter.csv +2 -0
- teradataml/data/housing_train_response.csv +493 -0
- teradataml/data/housing_train_segment.csv +201 -0
- teradataml/data/ibm_stock.csv +370 -0
- teradataml/data/ibm_stock1.csv +370 -0
- teradataml/data/identitymatch_example.json +22 -0
- teradataml/data/idf_table.csv +4 -0
- teradataml/data/idwt2d_dataTable.csv +5 -0
- teradataml/data/idwt_dataTable.csv +8 -0
- teradataml/data/idwt_filterTable.csv +3 -0
- teradataml/data/impressions.csv +101 -0
- teradataml/data/inflation.csv +21 -0
- teradataml/data/initial.csv +3 -0
- teradataml/data/insect2Cols.csv +61 -0
- teradataml/data/insect_sprays.csv +13 -0
- teradataml/data/insurance.csv +1339 -0
- teradataml/data/interpolator_example.json +13 -0
- teradataml/data/interval_data.csv +5 -0
- teradataml/data/iris_altinput.csv +481 -0
- teradataml/data/iris_attribute_output.csv +8 -0
- teradataml/data/iris_attribute_test.csv +121 -0
- teradataml/data/iris_attribute_train.csv +481 -0
- teradataml/data/iris_category_expect_predict.csv +31 -0
- teradataml/data/iris_data.csv +151 -0
- teradataml/data/iris_input.csv +151 -0
- teradataml/data/iris_response_train.csv +121 -0
- teradataml/data/iris_test.csv +31 -0
- teradataml/data/iris_train.csv +121 -0
- teradataml/data/join_table1.csv +4 -0
- teradataml/data/join_table2.csv +4 -0
- teradataml/data/jsons/anly_function_name.json +7 -0
- teradataml/data/jsons/byom/ONNXSeq2Seq.json +287 -0
- teradataml/data/jsons/byom/dataikupredict.json +148 -0
- teradataml/data/jsons/byom/datarobotpredict.json +147 -0
- teradataml/data/jsons/byom/h2opredict.json +195 -0
- teradataml/data/jsons/byom/onnxembeddings.json +267 -0
- teradataml/data/jsons/byom/onnxpredict.json +187 -0
- teradataml/data/jsons/byom/pmmlpredict.json +147 -0
- teradataml/data/jsons/paired_functions.json +450 -0
- teradataml/data/jsons/sqle/16.20/Antiselect.json +56 -0
- teradataml/data/jsons/sqle/16.20/Attribution.json +249 -0
- teradataml/data/jsons/sqle/16.20/DecisionForestPredict.json +156 -0
- teradataml/data/jsons/sqle/16.20/DecisionTreePredict.json +170 -0
- teradataml/data/jsons/sqle/16.20/GLMPredict.json +122 -0
- teradataml/data/jsons/sqle/16.20/MovingAverage.json +367 -0
- teradataml/data/jsons/sqle/16.20/NGramSplitter.json +239 -0
- teradataml/data/jsons/sqle/16.20/NaiveBayesPredict.json +136 -0
- teradataml/data/jsons/sqle/16.20/NaiveBayesTextClassifierPredict.json +235 -0
- teradataml/data/jsons/sqle/16.20/Pack.json +98 -0
- teradataml/data/jsons/sqle/16.20/SVMSparsePredict.json +162 -0
- teradataml/data/jsons/sqle/16.20/Sessionize.json +105 -0
- teradataml/data/jsons/sqle/16.20/StringSimilarity.json +86 -0
- teradataml/data/jsons/sqle/16.20/Unpack.json +166 -0
- teradataml/data/jsons/sqle/16.20/nPath.json +269 -0
- teradataml/data/jsons/sqle/17.00/Antiselect.json +56 -0
- teradataml/data/jsons/sqle/17.00/Attribution.json +249 -0
- teradataml/data/jsons/sqle/17.00/DecisionForestPredict.json +156 -0
- teradataml/data/jsons/sqle/17.00/DecisionTreePredict.json +170 -0
- teradataml/data/jsons/sqle/17.00/GLMPredict.json +122 -0
- teradataml/data/jsons/sqle/17.00/MovingAverage.json +367 -0
- teradataml/data/jsons/sqle/17.00/NGramSplitter.json +239 -0
- teradataml/data/jsons/sqle/17.00/NaiveBayesPredict.json +136 -0
- teradataml/data/jsons/sqle/17.00/NaiveBayesTextClassifierPredict.json +235 -0
- teradataml/data/jsons/sqle/17.00/Pack.json +98 -0
- teradataml/data/jsons/sqle/17.00/SVMSparsePredict.json +162 -0
- teradataml/data/jsons/sqle/17.00/Sessionize.json +105 -0
- teradataml/data/jsons/sqle/17.00/StringSimilarity.json +86 -0
- teradataml/data/jsons/sqle/17.00/Unpack.json +166 -0
- teradataml/data/jsons/sqle/17.00/nPath.json +269 -0
- teradataml/data/jsons/sqle/17.05/Antiselect.json +56 -0
- teradataml/data/jsons/sqle/17.05/Attribution.json +249 -0
- teradataml/data/jsons/sqle/17.05/DecisionForestPredict.json +156 -0
- teradataml/data/jsons/sqle/17.05/DecisionTreePredict.json +170 -0
- teradataml/data/jsons/sqle/17.05/GLMPredict.json +122 -0
- teradataml/data/jsons/sqle/17.05/MovingAverage.json +367 -0
- teradataml/data/jsons/sqle/17.05/NGramSplitter.json +239 -0
- teradataml/data/jsons/sqle/17.05/NaiveBayesPredict.json +136 -0
- teradataml/data/jsons/sqle/17.05/NaiveBayesTextClassifierPredict.json +235 -0
- teradataml/data/jsons/sqle/17.05/Pack.json +98 -0
- teradataml/data/jsons/sqle/17.05/SVMSparsePredict.json +162 -0
- teradataml/data/jsons/sqle/17.05/Sessionize.json +105 -0
- teradataml/data/jsons/sqle/17.05/StringSimilarity.json +86 -0
- teradataml/data/jsons/sqle/17.05/Unpack.json +166 -0
- teradataml/data/jsons/sqle/17.05/nPath.json +269 -0
- teradataml/data/jsons/sqle/17.10/Antiselect.json +56 -0
- teradataml/data/jsons/sqle/17.10/Attribution.json +249 -0
- teradataml/data/jsons/sqle/17.10/DecisionForestPredict.json +185 -0
- teradataml/data/jsons/sqle/17.10/DecisionTreePredict.json +172 -0
- teradataml/data/jsons/sqle/17.10/GLMPredict.json +151 -0
- teradataml/data/jsons/sqle/17.10/MovingAverage.json +368 -0
- teradataml/data/jsons/sqle/17.10/NGramSplitter.json +239 -0
- teradataml/data/jsons/sqle/17.10/NaiveBayesPredict.json +149 -0
- teradataml/data/jsons/sqle/17.10/NaiveBayesTextClassifierPredict.json +288 -0
- teradataml/data/jsons/sqle/17.10/Pack.json +133 -0
- teradataml/data/jsons/sqle/17.10/SVMSparsePredict.json +193 -0
- teradataml/data/jsons/sqle/17.10/Sessionize.json +105 -0
- teradataml/data/jsons/sqle/17.10/StringSimilarity.json +86 -0
- teradataml/data/jsons/sqle/17.10/TD_BinCodeFit.json +239 -0
- teradataml/data/jsons/sqle/17.10/TD_BinCodeTransform.json +70 -0
- teradataml/data/jsons/sqle/17.10/TD_CategoricalSummary.json +54 -0
- teradataml/data/jsons/sqle/17.10/TD_Chisq.json +68 -0
- teradataml/data/jsons/sqle/17.10/TD_ColumnSummary.json +54 -0
- teradataml/data/jsons/sqle/17.10/TD_ConvertTo.json +69 -0
- teradataml/data/jsons/sqle/17.10/TD_FTest.json +187 -0
- teradataml/data/jsons/sqle/17.10/TD_FillRowID.json +52 -0
- teradataml/data/jsons/sqle/17.10/TD_FunctionFit.json +46 -0
- teradataml/data/jsons/sqle/17.10/TD_FunctionTransform.json +72 -0
- teradataml/data/jsons/sqle/17.10/TD_GetRowsWithMissingValues.json +53 -0
- teradataml/data/jsons/sqle/17.10/TD_GetRowsWithoutMissingValues.json +53 -0
- teradataml/data/jsons/sqle/17.10/TD_Histogram.json +133 -0
- teradataml/data/jsons/sqle/17.10/TD_NumApply.json +147 -0
- teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingFit.json +183 -0
- teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingTransform.json +66 -0
- teradataml/data/jsons/sqle/17.10/TD_OutlierFilterFit.json +197 -0
- teradataml/data/jsons/sqle/17.10/TD_OutlierFilterTransform.json +48 -0
- teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesFit.json +114 -0
- teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesTransform.json +72 -0
- teradataml/data/jsons/sqle/17.10/TD_QQNorm.json +112 -0
- teradataml/data/jsons/sqle/17.10/TD_RoundColumns.json +93 -0
- teradataml/data/jsons/sqle/17.10/TD_RowNormalizeFit.json +128 -0
- teradataml/data/jsons/sqle/17.10/TD_RowNormalizeTransform.json +71 -0
- teradataml/data/jsons/sqle/17.10/TD_ScaleFit.json +157 -0
- teradataml/data/jsons/sqle/17.10/TD_ScaleTransform.json +71 -0
- teradataml/data/jsons/sqle/17.10/TD_SimpleImputeFit.json +148 -0
- teradataml/data/jsons/sqle/17.10/TD_SimpleImputeTransform.json +48 -0
- teradataml/data/jsons/sqle/17.10/TD_StrApply.json +240 -0
- teradataml/data/jsons/sqle/17.10/TD_UnivariateStatistics.json +119 -0
- teradataml/data/jsons/sqle/17.10/TD_WhichMax.json +53 -0
- teradataml/data/jsons/sqle/17.10/TD_WhichMin.json +53 -0
- teradataml/data/jsons/sqle/17.10/TD_ZTest.json +171 -0
- teradataml/data/jsons/sqle/17.10/Unpack.json +188 -0
- teradataml/data/jsons/sqle/17.10/nPath.json +269 -0
- teradataml/data/jsons/sqle/17.20/Antiselect.json +56 -0
- teradataml/data/jsons/sqle/17.20/Attribution.json +249 -0
- teradataml/data/jsons/sqle/17.20/DecisionForestPredict.json +185 -0
- teradataml/data/jsons/sqle/17.20/DecisionTreePredict.json +172 -0
- teradataml/data/jsons/sqle/17.20/GLMPredict.json +151 -0
- teradataml/data/jsons/sqle/17.20/MovingAverage.json +367 -0
- teradataml/data/jsons/sqle/17.20/NGramSplitter.json +239 -0
- teradataml/data/jsons/sqle/17.20/NaiveBayesPredict.json +149 -0
- teradataml/data/jsons/sqle/17.20/NaiveBayesTextClassifierPredict.json +287 -0
- teradataml/data/jsons/sqle/17.20/Pack.json +133 -0
- teradataml/data/jsons/sqle/17.20/SVMSparsePredict.json +192 -0
- teradataml/data/jsons/sqle/17.20/Sessionize.json +105 -0
- teradataml/data/jsons/sqle/17.20/StringSimilarity.json +86 -0
- teradataml/data/jsons/sqle/17.20/TD_ANOVA.json +149 -0
- teradataml/data/jsons/sqle/17.20/TD_Apriori.json +181 -0
- teradataml/data/jsons/sqle/17.20/TD_BinCodeFit.json +239 -0
- teradataml/data/jsons/sqle/17.20/TD_BinCodeTransform.json +71 -0
- teradataml/data/jsons/sqle/17.20/TD_CFilter.json +118 -0
- teradataml/data/jsons/sqle/17.20/TD_CategoricalSummary.json +53 -0
- teradataml/data/jsons/sqle/17.20/TD_Chisq.json +68 -0
- teradataml/data/jsons/sqle/17.20/TD_ClassificationEvaluator.json +146 -0
- teradataml/data/jsons/sqle/17.20/TD_ColumnSummary.json +53 -0
- teradataml/data/jsons/sqle/17.20/TD_ColumnTransformer.json +218 -0
- teradataml/data/jsons/sqle/17.20/TD_ConvertTo.json +92 -0
- teradataml/data/jsons/sqle/17.20/TD_DecisionForest.json +260 -0
- teradataml/data/jsons/sqle/17.20/TD_DecisionForestPredict.json +139 -0
- teradataml/data/jsons/sqle/17.20/TD_FTest.json +269 -0
- teradataml/data/jsons/sqle/17.20/TD_FillRowID.json +52 -0
- teradataml/data/jsons/sqle/17.20/TD_FunctionFit.json +46 -0
- teradataml/data/jsons/sqle/17.20/TD_FunctionTransform.json +72 -0
- teradataml/data/jsons/sqle/17.20/TD_GLM.json +507 -0
- teradataml/data/jsons/sqle/17.20/TD_GLMPREDICT.json +168 -0
- teradataml/data/jsons/sqle/17.20/TD_GLMPerSegment.json +411 -0
- teradataml/data/jsons/sqle/17.20/TD_GLMPredictPerSegment.json +146 -0
- teradataml/data/jsons/sqle/17.20/TD_GetFutileColumns.json +93 -0
- teradataml/data/jsons/sqle/17.20/TD_GetRowsWithMissingValues.json +76 -0
- teradataml/data/jsons/sqle/17.20/TD_GetRowsWithoutMissingValues.json +76 -0
- teradataml/data/jsons/sqle/17.20/TD_Histogram.json +152 -0
- teradataml/data/jsons/sqle/17.20/TD_KMeans.json +232 -0
- teradataml/data/jsons/sqle/17.20/TD_KMeansPredict.json +87 -0
- teradataml/data/jsons/sqle/17.20/TD_KNN.json +262 -0
- teradataml/data/jsons/sqle/17.20/TD_NERExtractor.json +145 -0
- teradataml/data/jsons/sqle/17.20/TD_NaiveBayes.json +193 -0
- teradataml/data/jsons/sqle/17.20/TD_NaiveBayesPredict.json +212 -0
- teradataml/data/jsons/sqle/17.20/TD_NaiveBayesTextClassifierTrainer.json +137 -0
- teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineFit.json +102 -0
- teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineTransform.json +71 -0
- teradataml/data/jsons/sqle/17.20/TD_NumApply.json +147 -0
- teradataml/data/jsons/sqle/17.20/TD_OneClassSVM.json +316 -0
- teradataml/data/jsons/sqle/17.20/TD_OneClassSVMPredict.json +124 -0
- teradataml/data/jsons/sqle/17.20/TD_OneHotEncodingFit.json +271 -0
- teradataml/data/jsons/sqle/17.20/TD_OneHotEncodingTransform.json +65 -0
- teradataml/data/jsons/sqle/17.20/TD_OrdinalEncodingFit.json +229 -0
- teradataml/data/jsons/sqle/17.20/TD_OrdinalEncodingTransform.json +75 -0
- teradataml/data/jsons/sqle/17.20/TD_OutlierFilterFit.json +217 -0
- teradataml/data/jsons/sqle/17.20/TD_OutlierFilterTransform.json +48 -0
- teradataml/data/jsons/sqle/17.20/TD_Pivoting.json +280 -0
- teradataml/data/jsons/sqle/17.20/TD_PolynomialFeaturesFit.json +114 -0
- teradataml/data/jsons/sqle/17.20/TD_PolynomialFeaturesTransform.json +72 -0
- teradataml/data/jsons/sqle/17.20/TD_QQNorm.json +111 -0
- teradataml/data/jsons/sqle/17.20/TD_ROC.json +179 -0
- teradataml/data/jsons/sqle/17.20/TD_RandomProjectionFit.json +179 -0
- teradataml/data/jsons/sqle/17.20/TD_RandomProjectionMinComponents.json +74 -0
- teradataml/data/jsons/sqle/17.20/TD_RandomProjectionTransform.json +74 -0
- teradataml/data/jsons/sqle/17.20/TD_RegressionEvaluator.json +138 -0
- teradataml/data/jsons/sqle/17.20/TD_RoundColumns.json +93 -0
- teradataml/data/jsons/sqle/17.20/TD_RowNormalizeFit.json +128 -0
- teradataml/data/jsons/sqle/17.20/TD_RowNormalizeTransform.json +71 -0
- teradataml/data/jsons/sqle/17.20/TD_SMOTE.json +267 -0
- teradataml/data/jsons/sqle/17.20/TD_SVM.json +389 -0
- teradataml/data/jsons/sqle/17.20/TD_SVMPredict.json +142 -0
- teradataml/data/jsons/sqle/17.20/TD_ScaleFit.json +310 -0
- teradataml/data/jsons/sqle/17.20/TD_ScaleTransform.json +120 -0
- teradataml/data/jsons/sqle/17.20/TD_SentimentExtractor.json +194 -0
- teradataml/data/jsons/sqle/17.20/TD_Shap.json +221 -0
- teradataml/data/jsons/sqle/17.20/TD_Silhouette.json +143 -0
- teradataml/data/jsons/sqle/17.20/TD_SimpleImputeFit.json +147 -0
- teradataml/data/jsons/sqle/17.20/TD_SimpleImputeTransform.json +48 -0
- teradataml/data/jsons/sqle/17.20/TD_StrApply.json +240 -0
- teradataml/data/jsons/sqle/17.20/TD_TFIDF.json +162 -0
- teradataml/data/jsons/sqle/17.20/TD_TargetEncodingFit.json +248 -0
- teradataml/data/jsons/sqle/17.20/TD_TargetEncodingTransform.json +75 -0
- teradataml/data/jsons/sqle/17.20/TD_TextMorph.json +134 -0
- teradataml/data/jsons/sqle/17.20/TD_TextParser.json +297 -0
- teradataml/data/jsons/sqle/17.20/TD_TrainTestSplit.json +142 -0
- teradataml/data/jsons/sqle/17.20/TD_UnivariateStatistics.json +117 -0
- teradataml/data/jsons/sqle/17.20/TD_Unpivoting.json +235 -0
- teradataml/data/jsons/sqle/17.20/TD_VectorDistance.json +183 -0
- teradataml/data/jsons/sqle/17.20/TD_WhichMax.json +53 -0
- teradataml/data/jsons/sqle/17.20/TD_WhichMin.json +53 -0
- teradataml/data/jsons/sqle/17.20/TD_WordEmbeddings.json +241 -0
- teradataml/data/jsons/sqle/17.20/TD_XGBoost.json +330 -0
- teradataml/data/jsons/sqle/17.20/TD_XGBoostPredict.json +195 -0
- teradataml/data/jsons/sqle/17.20/TD_ZTest.json +247 -0
- teradataml/data/jsons/sqle/17.20/Unpack.json +188 -0
- teradataml/data/jsons/sqle/17.20/nPath.json +269 -0
- teradataml/data/jsons/sqle/20.00/AI_AnalyzeSentiment.json +370 -0
- teradataml/data/jsons/sqle/20.00/AI_AskLLM.json +460 -0
- teradataml/data/jsons/sqle/20.00/AI_DetectLanguage.json +385 -0
- teradataml/data/jsons/sqle/20.00/AI_ExtractKeyPhrases.json +369 -0
- teradataml/data/jsons/sqle/20.00/AI_MaskPII.json +369 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizeEntities.json +369 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizePIIEntities.json +369 -0
- teradataml/data/jsons/sqle/20.00/AI_TextClassifier.json +400 -0
- teradataml/data/jsons/sqle/20.00/AI_TextEmbeddings.json +401 -0
- teradataml/data/jsons/sqle/20.00/AI_TextSummarize.json +384 -0
- teradataml/data/jsons/sqle/20.00/AI_TextTranslate.json +384 -0
- teradataml/data/jsons/sqle/20.00/TD_API_AzureML.json +151 -0
- teradataml/data/jsons/sqle/20.00/TD_API_Sagemaker.json +182 -0
- teradataml/data/jsons/sqle/20.00/TD_API_VertexAI.json +183 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSW.json +296 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWPredict.json +206 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWSummary.json +32 -0
- teradataml/data/jsons/sqle/20.00/TD_KMeans.json +250 -0
- teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +266 -0
- teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +278 -0
- teradataml/data/jsons/storedprocedure/17.20/TD_COPYART.json +71 -0
- teradataml/data/jsons/storedprocedure/17.20/TD_FILTERFACTORY1D.json +150 -0
- teradataml/data/jsons/tableoperator/17.00/read_nos.json +198 -0
- teradataml/data/jsons/tableoperator/17.05/read_nos.json +198 -0
- teradataml/data/jsons/tableoperator/17.05/write_nos.json +195 -0
- teradataml/data/jsons/tableoperator/17.10/read_nos.json +184 -0
- teradataml/data/jsons/tableoperator/17.10/write_nos.json +195 -0
- teradataml/data/jsons/tableoperator/17.20/IMAGE2MATRIX.json +53 -0
- teradataml/data/jsons/tableoperator/17.20/read_nos.json +183 -0
- teradataml/data/jsons/tableoperator/17.20/write_nos.json +224 -0
- teradataml/data/jsons/uaf/17.20/TD_ACF.json +132 -0
- teradataml/data/jsons/uaf/17.20/TD_ARIMAESTIMATE.json +396 -0
- teradataml/data/jsons/uaf/17.20/TD_ARIMAFORECAST.json +77 -0
- teradataml/data/jsons/uaf/17.20/TD_ARIMAVALIDATE.json +153 -0
- teradataml/data/jsons/uaf/17.20/TD_ARIMAXESTIMATE.json +362 -0
- teradataml/data/jsons/uaf/17.20/TD_AUTOARIMA.json +469 -0
- teradataml/data/jsons/uaf/17.20/TD_BINARYMATRIXOP.json +107 -0
- teradataml/data/jsons/uaf/17.20/TD_BINARYSERIESOP.json +106 -0
- teradataml/data/jsons/uaf/17.20/TD_BREUSCH_GODFREY.json +89 -0
- teradataml/data/jsons/uaf/17.20/TD_BREUSCH_PAGAN_GODFREY.json +104 -0
- teradataml/data/jsons/uaf/17.20/TD_CONVOLVE.json +78 -0
- teradataml/data/jsons/uaf/17.20/TD_CONVOLVE2.json +66 -0
- teradataml/data/jsons/uaf/17.20/TD_CUMUL_PERIODOGRAM.json +87 -0
- teradataml/data/jsons/uaf/17.20/TD_DFFT.json +134 -0
- teradataml/data/jsons/uaf/17.20/TD_DFFT2.json +144 -0
- teradataml/data/jsons/uaf/17.20/TD_DFFT2CONV.json +108 -0
- teradataml/data/jsons/uaf/17.20/TD_DFFTCONV.json +108 -0
- teradataml/data/jsons/uaf/17.20/TD_DICKEY_FULLER.json +78 -0
- teradataml/data/jsons/uaf/17.20/TD_DIFF.json +92 -0
- teradataml/data/jsons/uaf/17.20/TD_DTW.json +114 -0
- teradataml/data/jsons/uaf/17.20/TD_DURBIN_WATSON.json +101 -0
- teradataml/data/jsons/uaf/17.20/TD_DWT.json +173 -0
- teradataml/data/jsons/uaf/17.20/TD_DWT2D.json +160 -0
- teradataml/data/jsons/uaf/17.20/TD_EXTRACT_RESULTS.json +39 -0
- teradataml/data/jsons/uaf/17.20/TD_FITMETRICS.json +101 -0
- teradataml/data/jsons/uaf/17.20/TD_GENSERIES4FORMULA.json +85 -0
- teradataml/data/jsons/uaf/17.20/TD_GENSERIES4SINUSOIDS.json +71 -0
- teradataml/data/jsons/uaf/17.20/TD_GOLDFELD_QUANDT.json +139 -0
- teradataml/data/jsons/uaf/17.20/TD_HOLT_WINTERS_FORECASTER.json +313 -0
- teradataml/data/jsons/uaf/17.20/TD_IDFFT.json +58 -0
- teradataml/data/jsons/uaf/17.20/TD_IDFFT2.json +81 -0
- teradataml/data/jsons/uaf/17.20/TD_IDWT.json +162 -0
- teradataml/data/jsons/uaf/17.20/TD_IDWT2D.json +149 -0
- teradataml/data/jsons/uaf/17.20/TD_INPUTVALIDATOR.json +64 -0
- teradataml/data/jsons/uaf/17.20/TD_IQR.json +117 -0
- teradataml/data/jsons/uaf/17.20/TD_LINEAR_REGR.json +182 -0
- teradataml/data/jsons/uaf/17.20/TD_LINESPEC.json +103 -0
- teradataml/data/jsons/uaf/17.20/TD_MAMEAN.json +181 -0
- teradataml/data/jsons/uaf/17.20/TD_MATRIX2IMAGE.json +209 -0
- teradataml/data/jsons/uaf/17.20/TD_MATRIXMULTIPLY.json +68 -0
- teradataml/data/jsons/uaf/17.20/TD_MINFO.json +67 -0
- teradataml/data/jsons/uaf/17.20/TD_MULTIVAR_REGR.json +179 -0
- teradataml/data/jsons/uaf/17.20/TD_PACF.json +114 -0
- teradataml/data/jsons/uaf/17.20/TD_PORTMAN.json +119 -0
- teradataml/data/jsons/uaf/17.20/TD_POWERSPEC.json +175 -0
- teradataml/data/jsons/uaf/17.20/TD_POWERTRANSFORM.json +98 -0
- teradataml/data/jsons/uaf/17.20/TD_RESAMPLE.json +194 -0
- teradataml/data/jsons/uaf/17.20/TD_SAX.json +210 -0
- teradataml/data/jsons/uaf/17.20/TD_SEASONALNORMALIZE.json +143 -0
- teradataml/data/jsons/uaf/17.20/TD_SELECTION_CRITERIA.json +90 -0
- teradataml/data/jsons/uaf/17.20/TD_SIGNIF_PERIODICITIES.json +80 -0
- teradataml/data/jsons/uaf/17.20/TD_SIGNIF_RESIDMEAN.json +68 -0
- teradataml/data/jsons/uaf/17.20/TD_SIMPLEEXP.json +184 -0
- teradataml/data/jsons/uaf/17.20/TD_SINFO.json +58 -0
- teradataml/data/jsons/uaf/17.20/TD_SMOOTHMA.json +163 -0
- teradataml/data/jsons/uaf/17.20/TD_TRACKINGOP.json +101 -0
- teradataml/data/jsons/uaf/17.20/TD_UNDIFF.json +112 -0
- teradataml/data/jsons/uaf/17.20/TD_UNNORMALIZE.json +95 -0
- teradataml/data/jsons/uaf/17.20/TD_WHITES_GENERAL.json +78 -0
- teradataml/data/jsons/uaf/17.20/TD_WINDOWDFFT.json +410 -0
- teradataml/data/kmeans_example.json +23 -0
- teradataml/data/kmeans_table.csv +10 -0
- teradataml/data/kmeans_us_arrests_data.csv +51 -0
- teradataml/data/knn_example.json +19 -0
- teradataml/data/knnrecommender_example.json +7 -0
- teradataml/data/knnrecommenderpredict_example.json +12 -0
- teradataml/data/lar_example.json +17 -0
- teradataml/data/larpredict_example.json +30 -0
- teradataml/data/lc_new_predictors.csv +5 -0
- teradataml/data/lc_new_reference.csv +9 -0
- teradataml/data/lda_example.json +9 -0
- teradataml/data/ldainference_example.json +15 -0
- teradataml/data/ldatopicsummary_example.json +9 -0
- teradataml/data/levendist_input.csv +13 -0
- teradataml/data/levenshteindistance_example.json +10 -0
- teradataml/data/linreg_example.json +10 -0
- teradataml/data/load_example_data.py +350 -0
- teradataml/data/loan_prediction.csv +295 -0
- teradataml/data/lungcancer.csv +138 -0
- teradataml/data/mappingdata.csv +12 -0
- teradataml/data/medical_readings.csv +101 -0
- teradataml/data/milk_timeseries.csv +157 -0
- teradataml/data/min_max_titanic.csv +4 -0
- teradataml/data/minhash_example.json +6 -0
- teradataml/data/ml_ratings.csv +7547 -0
- teradataml/data/ml_ratings_10.csv +2445 -0
- teradataml/data/mobile_data.csv +13 -0
- teradataml/data/model1_table.csv +5 -0
- teradataml/data/model2_table.csv +5 -0
- teradataml/data/models/License_file.txt +1 -0
- teradataml/data/models/License_file_empty.txt +0 -0
- teradataml/data/models/dataiku_iris_data_ann_thin +0 -0
- teradataml/data/models/dr_iris_rf +0 -0
- teradataml/data/models/iris_db_dt_model_sklearn.onnx +0 -0
- teradataml/data/models/iris_db_dt_model_sklearn_floattensor.onnx +0 -0
- teradataml/data/models/iris_db_glm_model.pmml +57 -0
- teradataml/data/models/iris_db_xgb_model.pmml +4471 -0
- teradataml/data/models/iris_kmeans_model +0 -0
- teradataml/data/models/iris_mojo_glm_h2o_model +0 -0
- teradataml/data/models/iris_mojo_xgb_h2o_model +0 -0
- teradataml/data/modularity_example.json +12 -0
- teradataml/data/movavg_example.json +8 -0
- teradataml/data/mtx1.csv +7 -0
- teradataml/data/mtx2.csv +13 -0
- teradataml/data/multi_model_classification.csv +401 -0
- teradataml/data/multi_model_regression.csv +401 -0
- teradataml/data/mvdfft8.csv +9 -0
- teradataml/data/naivebayes_example.json +10 -0
- teradataml/data/naivebayespredict_example.json +19 -0
- teradataml/data/naivebayestextclassifier2_example.json +7 -0
- teradataml/data/naivebayestextclassifier_example.json +8 -0
- teradataml/data/naivebayestextclassifierpredict_example.json +32 -0
- teradataml/data/name_Find_configure.csv +10 -0
- teradataml/data/namedentityfinder_example.json +14 -0
- teradataml/data/namedentityfinderevaluator_example.json +10 -0
- teradataml/data/namedentityfindertrainer_example.json +6 -0
- teradataml/data/nb_iris_input_test.csv +31 -0
- teradataml/data/nb_iris_input_train.csv +121 -0
- teradataml/data/nbp_iris_model.csv +13 -0
- teradataml/data/ner_dict.csv +8 -0
- teradataml/data/ner_extractor_text.csv +2 -0
- teradataml/data/ner_input_eng.csv +7 -0
- teradataml/data/ner_rule.csv +5 -0
- teradataml/data/ner_sports_test2.csv +29 -0
- teradataml/data/ner_sports_train.csv +501 -0
- teradataml/data/nerevaluator_example.json +6 -0
- teradataml/data/nerextractor_example.json +18 -0
- teradataml/data/nermem_sports_test.csv +18 -0
- teradataml/data/nermem_sports_train.csv +51 -0
- teradataml/data/nertrainer_example.json +7 -0
- teradataml/data/ngrams_example.json +7 -0
- teradataml/data/notebooks/__init__.py +0 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Aggregate Functions using SQLAlchemy.ipynb +1455 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Arithmetic Functions Using SQLAlchemy.ipynb +1993 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Bit-Byte Manipulation Functions using SQLAlchemy.ipynb +1492 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Built-in functions using SQLAlchemy.ipynb +536 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Regular Expressions Using SQLAlchemy.ipynb +570 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage String Functions Using SQLAlchemy.ipynb +2559 -0
- teradataml/data/notebooks/sqlalchemy/Teradata Vantage Window Aggregate Functions using SQLAlchemy.ipynb +2911 -0
- teradataml/data/notebooks/sqlalchemy/Using Generic SQLAlchemy ClauseElements teradataml DataFrame assign method.ipynb +698 -0
- teradataml/data/notebooks/sqlalchemy/__init__.py +0 -0
- teradataml/data/notebooks/sqlalchemy/teradataml filtering using SQLAlchemy ClauseElements.ipynb +784 -0
- teradataml/data/npath_example.json +23 -0
- teradataml/data/ntree_example.json +14 -0
- teradataml/data/numeric_strings.csv +5 -0
- teradataml/data/numerics.csv +4 -0
- teradataml/data/ocean_buoy.csv +17 -0
- teradataml/data/ocean_buoy2.csv +17 -0
- teradataml/data/ocean_buoys.csv +28 -0
- teradataml/data/ocean_buoys2.csv +10 -0
- teradataml/data/ocean_buoys_nonpti.csv +28 -0
- teradataml/data/ocean_buoys_seq.csv +29 -0
- teradataml/data/onehot_encoder_train.csv +4 -0
- teradataml/data/openml_example.json +92 -0
- teradataml/data/optional_event_table.csv +4 -0
- teradataml/data/orders1.csv +11 -0
- teradataml/data/orders1_12.csv +13 -0
- teradataml/data/orders_ex.csv +4 -0
- teradataml/data/pack_example.json +9 -0
- teradataml/data/package_tracking.csv +19 -0
- teradataml/data/package_tracking_pti.csv +19 -0
- teradataml/data/pagerank_example.json +13 -0
- teradataml/data/paragraphs_input.csv +6 -0
- teradataml/data/pathanalyzer_example.json +8 -0
- teradataml/data/pathgenerator_example.json +8 -0
- teradataml/data/patient_profile.csv +101 -0
- teradataml/data/pattern_matching_data.csv +11 -0
- teradataml/data/payment_fraud_dataset.csv +10001 -0
- teradataml/data/peppers.png +0 -0
- teradataml/data/phrases.csv +7 -0
- teradataml/data/pivot_example.json +9 -0
- teradataml/data/pivot_input.csv +22 -0
- teradataml/data/playerRating.csv +31 -0
- teradataml/data/pos_input.csv +40 -0
- teradataml/data/postagger_example.json +7 -0
- teradataml/data/posttagger_output.csv +44 -0
- teradataml/data/production_data.csv +17 -0
- teradataml/data/production_data2.csv +7 -0
- teradataml/data/randomsample_example.json +32 -0
- teradataml/data/randomwalksample_example.json +9 -0
- teradataml/data/rank_table.csv +6 -0
- teradataml/data/real_values.csv +14 -0
- teradataml/data/ref_mobile_data.csv +4 -0
- teradataml/data/ref_mobile_data_dense.csv +2 -0
- teradataml/data/ref_url.csv +17 -0
- teradataml/data/restaurant_reviews.csv +7 -0
- teradataml/data/retail_churn_table.csv +27772 -0
- teradataml/data/river_data.csv +145 -0
- teradataml/data/roc_example.json +8 -0
- teradataml/data/roc_input.csv +101 -0
- teradataml/data/rule_inputs.csv +6 -0
- teradataml/data/rule_table.csv +2 -0
- teradataml/data/sales.csv +7 -0
- teradataml/data/sales_transaction.csv +501 -0
- teradataml/data/salesdata.csv +342 -0
- teradataml/data/sample_cities.csv +3 -0
- teradataml/data/sample_shapes.csv +11 -0
- teradataml/data/sample_streets.csv +3 -0
- teradataml/data/sampling_example.json +16 -0
- teradataml/data/sax_example.json +17 -0
- teradataml/data/scale_attributes.csv +3 -0
- teradataml/data/scale_example.json +74 -0
- teradataml/data/scale_housing.csv +11 -0
- teradataml/data/scale_housing_test.csv +6 -0
- teradataml/data/scale_input_part_sparse.csv +31 -0
- teradataml/data/scale_input_partitioned.csv +16 -0
- teradataml/data/scale_input_sparse.csv +11 -0
- teradataml/data/scale_parameters.csv +3 -0
- teradataml/data/scale_stat.csv +11 -0
- teradataml/data/scalebypartition_example.json +13 -0
- teradataml/data/scalemap_example.json +13 -0
- teradataml/data/scalesummary_example.json +12 -0
- teradataml/data/score_category.csv +101 -0
- teradataml/data/score_summary.csv +4 -0
- teradataml/data/script_example.json +10 -0
- teradataml/data/scripts/deploy_script.py +84 -0
- teradataml/data/scripts/lightgbm/dataset.template +175 -0
- teradataml/data/scripts/lightgbm/lightgbm_class_functions.template +264 -0
- teradataml/data/scripts/lightgbm/lightgbm_function.template +234 -0
- teradataml/data/scripts/lightgbm/lightgbm_sklearn.template +177 -0
- teradataml/data/scripts/mapper.R +20 -0
- teradataml/data/scripts/mapper.py +16 -0
- teradataml/data/scripts/mapper_replace.py +16 -0
- teradataml/data/scripts/sklearn/__init__.py +0 -0
- teradataml/data/scripts/sklearn/sklearn_fit.py +205 -0
- teradataml/data/scripts/sklearn/sklearn_fit_predict.py +148 -0
- teradataml/data/scripts/sklearn/sklearn_function.template +144 -0
- teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +166 -0
- teradataml/data/scripts/sklearn/sklearn_neighbors.py +161 -0
- teradataml/data/scripts/sklearn/sklearn_score.py +145 -0
- teradataml/data/scripts/sklearn/sklearn_transform.py +327 -0
- teradataml/data/sdk/modelops/modelops_spec.json +101737 -0
- teradataml/data/seeds.csv +10 -0
- teradataml/data/sentenceextractor_example.json +7 -0
- teradataml/data/sentiment_extract_input.csv +11 -0
- teradataml/data/sentiment_train.csv +16 -0
- teradataml/data/sentiment_word.csv +20 -0
- teradataml/data/sentiment_word_input.csv +20 -0
- teradataml/data/sentimentextractor_example.json +24 -0
- teradataml/data/sentimenttrainer_example.json +8 -0
- teradataml/data/sequence_table.csv +10 -0
- teradataml/data/seriessplitter_example.json +8 -0
- teradataml/data/sessionize_example.json +17 -0
- teradataml/data/sessionize_table.csv +116 -0
- teradataml/data/setop_test1.csv +24 -0
- teradataml/data/setop_test2.csv +22 -0
- teradataml/data/soc_nw_edges.csv +11 -0
- teradataml/data/soc_nw_vertices.csv +8 -0
- teradataml/data/souvenir_timeseries.csv +168 -0
- teradataml/data/sparse_iris_attribute.csv +5 -0
- teradataml/data/sparse_iris_test.csv +121 -0
- teradataml/data/sparse_iris_train.csv +601 -0
- teradataml/data/star1.csv +6 -0
- teradataml/data/star_pivot.csv +8 -0
- teradataml/data/state_transition.csv +5 -0
- teradataml/data/stock_data.csv +53 -0
- teradataml/data/stock_movement.csv +11 -0
- teradataml/data/stock_vol.csv +76 -0
- teradataml/data/stop_words.csv +8 -0
- teradataml/data/store_sales.csv +37 -0
- teradataml/data/stringsimilarity_example.json +8 -0
- teradataml/data/strsimilarity_input.csv +13 -0
- teradataml/data/students.csv +101 -0
- teradataml/data/svm_iris_input_test.csv +121 -0
- teradataml/data/svm_iris_input_train.csv +481 -0
- teradataml/data/svm_iris_model.csv +7 -0
- teradataml/data/svmdense_example.json +10 -0
- teradataml/data/svmdensepredict_example.json +19 -0
- teradataml/data/svmsparse_example.json +8 -0
- teradataml/data/svmsparsepredict_example.json +14 -0
- teradataml/data/svmsparsesummary_example.json +8 -0
- teradataml/data/target_mobile_data.csv +13 -0
- teradataml/data/target_mobile_data_dense.csv +5 -0
- teradataml/data/target_udt_data.csv +8 -0
- teradataml/data/tdnerextractor_example.json +14 -0
- teradataml/data/templatedata.csv +1201 -0
- teradataml/data/templates/open_source_ml.json +11 -0
- teradataml/data/teradata_icon.ico +0 -0
- teradataml/data/teradataml_example.json +1473 -0
- teradataml/data/test_classification.csv +101 -0
- teradataml/data/test_loan_prediction.csv +53 -0
- teradataml/data/test_pacf_12.csv +37 -0
- teradataml/data/test_prediction.csv +101 -0
- teradataml/data/test_regression.csv +101 -0
- teradataml/data/test_river2.csv +109 -0
- teradataml/data/text_inputs.csv +6 -0
- teradataml/data/textchunker_example.json +8 -0
- teradataml/data/textclassifier_example.json +7 -0
- teradataml/data/textclassifier_input.csv +7 -0
- teradataml/data/textclassifiertrainer_example.json +7 -0
- teradataml/data/textmorph_example.json +11 -0
- teradataml/data/textparser_example.json +15 -0
- teradataml/data/texttagger_example.json +12 -0
- teradataml/data/texttokenizer_example.json +7 -0
- teradataml/data/texttrainer_input.csv +11 -0
- teradataml/data/tf_example.json +7 -0
- teradataml/data/tfidf_example.json +14 -0
- teradataml/data/tfidf_input1.csv +201 -0
- teradataml/data/tfidf_train.csv +6 -0
- teradataml/data/time_table1.csv +535 -0
- teradataml/data/time_table2.csv +14 -0
- teradataml/data/timeseriesdata.csv +1601 -0
- teradataml/data/timeseriesdatasetsd4.csv +105 -0
- teradataml/data/timestamp_data.csv +4 -0
- teradataml/data/titanic.csv +892 -0
- teradataml/data/titanic_dataset_unpivoted.csv +19 -0
- teradataml/data/to_num_data.csv +4 -0
- teradataml/data/tochar_data.csv +5 -0
- teradataml/data/token_table.csv +696 -0
- teradataml/data/train_multiclass.csv +101 -0
- teradataml/data/train_regression.csv +101 -0
- teradataml/data/train_regression_multiple_labels.csv +101 -0
- teradataml/data/train_tracking.csv +28 -0
- teradataml/data/trans_dense.csv +16 -0
- teradataml/data/trans_sparse.csv +55 -0
- teradataml/data/transformation_table.csv +6 -0
- teradataml/data/transformation_table_new.csv +2 -0
- teradataml/data/tv_spots.csv +16 -0
- teradataml/data/twod_climate_data.csv +117 -0
- teradataml/data/uaf_example.json +529 -0
- teradataml/data/univariatestatistics_example.json +9 -0
- teradataml/data/unpack_example.json +10 -0
- teradataml/data/unpivot_example.json +25 -0
- teradataml/data/unpivot_input.csv +8 -0
- teradataml/data/url_data.csv +10 -0
- teradataml/data/us_air_pass.csv +37 -0
- teradataml/data/us_population.csv +624 -0
- teradataml/data/us_states_shapes.csv +52 -0
- teradataml/data/varmax_example.json +18 -0
- teradataml/data/vectordistance_example.json +30 -0
- teradataml/data/ville_climatedata.csv +121 -0
- teradataml/data/ville_tempdata.csv +12 -0
- teradataml/data/ville_tempdata1.csv +12 -0
- teradataml/data/ville_temperature.csv +11 -0
- teradataml/data/waveletTable.csv +1605 -0
- teradataml/data/waveletTable2.csv +1605 -0
- teradataml/data/weightedmovavg_example.json +9 -0
- teradataml/data/wft_testing.csv +5 -0
- teradataml/data/windowdfft.csv +16 -0
- teradataml/data/wine_data.csv +1600 -0
- teradataml/data/word_embed_input_table1.csv +6 -0
- teradataml/data/word_embed_input_table2.csv +5 -0
- teradataml/data/word_embed_model.csv +23 -0
- teradataml/data/words_input.csv +13 -0
- teradataml/data/xconvolve_complex_left.csv +6 -0
- teradataml/data/xconvolve_complex_leftmulti.csv +6 -0
- teradataml/data/xgboost_example.json +36 -0
- teradataml/data/xgboostpredict_example.json +32 -0
- teradataml/data/ztest_example.json +16 -0
- teradataml/dataframe/__init__.py +0 -0
- teradataml/dataframe/copy_to.py +2446 -0
- teradataml/dataframe/data_transfer.py +2840 -0
- teradataml/dataframe/dataframe.py +20908 -0
- teradataml/dataframe/dataframe_utils.py +2114 -0
- teradataml/dataframe/fastload.py +794 -0
- teradataml/dataframe/functions.py +2110 -0
- teradataml/dataframe/indexer.py +424 -0
- teradataml/dataframe/row.py +160 -0
- teradataml/dataframe/setop.py +1171 -0
- teradataml/dataframe/sql.py +10904 -0
- teradataml/dataframe/sql_function_parameters.py +440 -0
- teradataml/dataframe/sql_functions.py +652 -0
- teradataml/dataframe/sql_interfaces.py +220 -0
- teradataml/dataframe/vantage_function_types.py +675 -0
- teradataml/dataframe/window.py +694 -0
- teradataml/dbutils/__init__.py +3 -0
- teradataml/dbutils/dbutils.py +2871 -0
- teradataml/dbutils/filemgr.py +318 -0
- teradataml/gen_ai/__init__.py +2 -0
- teradataml/gen_ai/convAI.py +473 -0
- teradataml/geospatial/__init__.py +4 -0
- teradataml/geospatial/geodataframe.py +1105 -0
- teradataml/geospatial/geodataframecolumn.py +392 -0
- teradataml/geospatial/geometry_types.py +926 -0
- teradataml/hyperparameter_tuner/__init__.py +1 -0
- teradataml/hyperparameter_tuner/optimizer.py +4115 -0
- teradataml/hyperparameter_tuner/utils.py +303 -0
- teradataml/lib/__init__.py +0 -0
- teradataml/lib/aed_0_1.dll +0 -0
- teradataml/lib/libaed_0_1.dylib +0 -0
- teradataml/lib/libaed_0_1.so +0 -0
- teradataml/lib/libaed_0_1_aarch64.so +0 -0
- teradataml/lib/libaed_0_1_ppc64le.so +0 -0
- teradataml/opensource/__init__.py +1 -0
- teradataml/opensource/_base.py +1321 -0
- teradataml/opensource/_class.py +464 -0
- teradataml/opensource/_constants.py +61 -0
- teradataml/opensource/_lightgbm.py +949 -0
- teradataml/opensource/_sklearn.py +1008 -0
- teradataml/opensource/_wrapper_utils.py +267 -0
- teradataml/options/__init__.py +148 -0
- teradataml/options/configure.py +489 -0
- teradataml/options/display.py +187 -0
- teradataml/plot/__init__.py +3 -0
- teradataml/plot/axis.py +1427 -0
- teradataml/plot/constants.py +15 -0
- teradataml/plot/figure.py +431 -0
- teradataml/plot/plot.py +810 -0
- teradataml/plot/query_generator.py +83 -0
- teradataml/plot/subplot.py +216 -0
- teradataml/scriptmgmt/UserEnv.py +4273 -0
- teradataml/scriptmgmt/__init__.py +3 -0
- teradataml/scriptmgmt/lls_utils.py +2157 -0
- teradataml/sdk/README.md +79 -0
- teradataml/sdk/__init__.py +4 -0
- teradataml/sdk/_auth_modes.py +422 -0
- teradataml/sdk/_func_params.py +487 -0
- teradataml/sdk/_json_parser.py +453 -0
- teradataml/sdk/_openapi_spec_constants.py +249 -0
- teradataml/sdk/_utils.py +236 -0
- teradataml/sdk/api_client.py +900 -0
- teradataml/sdk/constants.py +62 -0
- teradataml/sdk/modelops/__init__.py +98 -0
- teradataml/sdk/modelops/_client.py +409 -0
- teradataml/sdk/modelops/_constants.py +304 -0
- teradataml/sdk/modelops/models.py +2308 -0
- teradataml/sdk/spinner.py +107 -0
- teradataml/series/__init__.py +0 -0
- teradataml/series/series.py +537 -0
- teradataml/series/series_utils.py +71 -0
- teradataml/store/__init__.py +12 -0
- teradataml/store/feature_store/__init__.py +0 -0
- teradataml/store/feature_store/constants.py +658 -0
- teradataml/store/feature_store/feature_store.py +4814 -0
- teradataml/store/feature_store/mind_map.py +639 -0
- teradataml/store/feature_store/models.py +7330 -0
- teradataml/store/feature_store/utils.py +390 -0
- teradataml/table_operators/Apply.py +979 -0
- teradataml/table_operators/Script.py +1739 -0
- teradataml/table_operators/TableOperator.py +1343 -0
- teradataml/table_operators/__init__.py +2 -0
- teradataml/table_operators/apply_query_generator.py +262 -0
- teradataml/table_operators/query_generator.py +493 -0
- teradataml/table_operators/table_operator_query_generator.py +462 -0
- teradataml/table_operators/table_operator_util.py +726 -0
- teradataml/table_operators/templates/dataframe_apply.template +184 -0
- teradataml/table_operators/templates/dataframe_map.template +176 -0
- teradataml/table_operators/templates/dataframe_register.template +73 -0
- teradataml/table_operators/templates/dataframe_udf.template +67 -0
- teradataml/table_operators/templates/script_executor.template +170 -0
- teradataml/telemetry_utils/__init__.py +0 -0
- teradataml/telemetry_utils/queryband.py +53 -0
- teradataml/utils/__init__.py +0 -0
- teradataml/utils/docstring.py +527 -0
- teradataml/utils/dtypes.py +943 -0
- teradataml/utils/internal_buffer.py +122 -0
- teradataml/utils/print_versions.py +206 -0
- teradataml/utils/utils.py +451 -0
- teradataml/utils/validators.py +3305 -0
- teradataml-20.0.0.8.dist-info/METADATA +2804 -0
- teradataml-20.0.0.8.dist-info/RECORD +1208 -0
- teradataml-20.0.0.8.dist-info/WHEEL +5 -0
- teradataml-20.0.0.8.dist-info/top_level.txt +1 -0
- teradataml-20.0.0.8.dist-info/zip-safe +1 -0
|
@@ -0,0 +1,2804 @@
|
|
|
1
|
+
Metadata-Version: 2.1
|
|
2
|
+
Name: teradataml
|
|
3
|
+
Version: 20.0.0.8
|
|
4
|
+
Summary: Teradata Vantage Python package for Advanced Analytics
|
|
5
|
+
Home-page: http://www.teradata.com/
|
|
6
|
+
Author: Teradata Corporation
|
|
7
|
+
License: Teradata License Agreement
|
|
8
|
+
Keywords: Teradata
|
|
9
|
+
Platform: MacOS X, Windows, Linux
|
|
10
|
+
Classifier: Programming Language :: Python :: 3 :: Only
|
|
11
|
+
Classifier: Programming Language :: Python :: 3.8
|
|
12
|
+
Classifier: Programming Language :: Python :: 3.9
|
|
13
|
+
Classifier: Operating System :: Microsoft :: Windows
|
|
14
|
+
Classifier: Operating System :: MacOS :: MacOS X
|
|
15
|
+
Classifier: Operating System :: POSIX :: Linux
|
|
16
|
+
Classifier: Topic :: Database :: Front-Ends
|
|
17
|
+
Classifier: License :: Other/Proprietary License
|
|
18
|
+
Requires-Python: >=3.8
|
|
19
|
+
Description-Content-Type: text/markdown
|
|
20
|
+
Requires-Dist: teradatasql (>=20.0.0.26)
|
|
21
|
+
Requires-Dist: teradatasqlalchemy (>=20.0.0.8)
|
|
22
|
+
Requires-Dist: pandas (>=0.22)
|
|
23
|
+
Requires-Dist: psutil
|
|
24
|
+
Requires-Dist: requests (>=2.25.1)
|
|
25
|
+
Requires-Dist: scikit-learn (>=0.24.2)
|
|
26
|
+
Requires-Dist: IPython
|
|
27
|
+
Requires-Dist: imbalanced-learn (>=0.8.0)
|
|
28
|
+
Requires-Dist: matplotlib (>=3.7.5)
|
|
29
|
+
Requires-Dist: seaborn (>=0.13.0)
|
|
30
|
+
Requires-Dist: pyjwt (>=2.8.0)
|
|
31
|
+
Requires-Dist: cryptography (>=42.0.5)
|
|
32
|
+
Requires-Dist: sqlalchemy (>=2.0)
|
|
33
|
+
Requires-Dist: lightgbm (>=3.3.3)
|
|
34
|
+
Requires-Dist: python-dotenv
|
|
35
|
+
Requires-Dist: teradatamlwidgets (>=20.0.0.5)
|
|
36
|
+
Requires-Dist: oauthlib (>=3.2.2)
|
|
37
|
+
Requires-Dist: requests-oauthlib (>=2.0.0)
|
|
38
|
+
Requires-Dist: pydantic (>=2.10.6)
|
|
39
|
+
Requires-Dist: PyYAML (>=6.0.2)
|
|
40
|
+
|
|
41
|
+
## Teradata Python package for Advanced Analytics.
|
|
42
|
+
|
|
43
|
+
teradataml makes available to Python users a collection of analytic functions that reside on Teradata Vantage. This allows users to perform analytics on Teradata Vantage with no SQL coding. In addition, the teradataml library provides functions for scaling data manipulation and transformation, data filtering and sub-setting, and can be used in conjunction with other open-source python libraries.
|
|
44
|
+
|
|
45
|
+
For community support, please visit the [Teradata Community](https://support.teradata.com/community?id=community_forum&sys_id=14fe131e1bf7f304682ca8233a4bcb1d).
|
|
46
|
+
|
|
47
|
+
For Teradata customer support, please visit [Teradata Support](https://support.teradata.com/csm).
|
|
48
|
+
|
|
49
|
+
Copyright 2025, Teradata. All Rights Reserved.
|
|
50
|
+
|
|
51
|
+
### Table of Contents
|
|
52
|
+
* [Release Notes](#release-notes)
|
|
53
|
+
* [Installation and Requirements](#installation-and-requirements)
|
|
54
|
+
* [Using the Teradata Python Package](#using-the-teradata-python-package)
|
|
55
|
+
* [Documentation](#documentation)
|
|
56
|
+
* [License](#license)
|
|
57
|
+
|
|
58
|
+
## Release Notes:
|
|
59
|
+
#### teradataml 20.00.00.08
|
|
60
|
+
* ##### New Features/Functionality
|
|
61
|
+
* Extending compatibility for IBM PowerPC with Python >=3.9. Refer to the Teradata Python Package User Guide for more details related to installation on IBM PowerPC.
|
|
62
|
+
|
|
63
|
+
* ###### teradataml: AutoML
|
|
64
|
+
* New methods added for `AutoML()`, `AutoRegressor()`, `AutoClassifier()`, `AutoFraud()`, `AutoChurn()` and `AutoCluster()`.
|
|
65
|
+
* `get_transformed_data()` - Returns the transformed data obtained from all feature selection methods for given input data.
|
|
66
|
+
* `get_raw_data_with_id()` - Returns the raw input data along with the ID column mapping.
|
|
67
|
+
* `get_error_logs()` - Returns the error logs for failed models generated during execution of AutoML.
|
|
68
|
+
|
|
69
|
+
* ##### Updates
|
|
70
|
+
* ###### teradataml: AutoML
|
|
71
|
+
* New argument added for `AutoML()`, `AutoRegressor()`, `AutoClassifier()`, `AutoFraud()`, `AutoChurn()` and `AutoDataPrep()`.
|
|
72
|
+
* Added `enable_lasso` to use lasso based feature selection during data preparation. By default, only 'RFE' and 'PCA' are enabled for feature selection.
|
|
73
|
+
* New arguments added for `AutoML()`, `AutoRegressor()`, `AutoClassifier()`, `AutoFraud()`, `AutoChurn()` and `AutoCluster()`.
|
|
74
|
+
* Added `id_column` to specify the ID column present in input data. By default, an AutoML-generated ID column `automl_id` is enabled for processing if user does not provide one.
|
|
75
|
+
* Added `raise_errors` to control whether non-blocking issues raise errors or only warnings. By default, it does not raise errors and continues processing with a user warning.
|
|
76
|
+
* Added `preserve_columns` to `predict()` to preserve columns from the transformed data in prediction DataFrame.
|
|
77
|
+
|
|
78
|
+
* ##### Bug Fixes
|
|
79
|
+
* CS3096238 - Teradata BYOM will now work with Secure Zone--CHBIT08
|
|
80
|
+
|
|
81
|
+
#### teradataml 20.00.00.07
|
|
82
|
+
* ##### New Features/Functionality
|
|
83
|
+
* Extending compatibility for Linux with ARM processors.
|
|
84
|
+
|
|
85
|
+
* ###### teradataml: DataFrame
|
|
86
|
+
* `DataFrame.df_type` - Added new property `df_type` to know the type of the DataFrame.
|
|
87
|
+
* `DataFrame.as_of()` - Added new function which supports temporal time qualifiers on teradataml DataFrame.
|
|
88
|
+
* `DataFrame.closed_rows()` - Added a new function to retrieve closed rows from a DataFrame created on a transaction-time or bi-temporal table/view.
|
|
89
|
+
* `DataFrame.open_rows()` - Added a new function to retrieve open rows from a DataFrame created on a transaction-time or bi-temporal table/view.
|
|
90
|
+
* `DataFrame.historic_rows()` - Added a new function to retrieve historical rows from a DataFrame created on a valid-time or bi-temporal table/view.
|
|
91
|
+
* `DataFrame.future_rows()` - Added a new function to retrieve future rows from a DataFrame created on a valid-time or bi-temporal table/view.
|
|
92
|
+
* `DataFrame.create_view()` - Creates a view from the DataFrame object. This function helps the user to persist the DataFrame as a view, which can be used across sessions.
|
|
93
|
+
* Added argument `persist` to `DataFrame.from_dict()`, `DataFrame.from_pandas()`, and `DataFrame.from_records()` to persist the created DataFrame.
|
|
94
|
+
|
|
95
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
96
|
+
* `DataFrameColumn.begin()` - Function to get beginning date or timestamp from a PERIOD column.
|
|
97
|
+
* `DataFrameColumn.end()` - Function to get ending date or timestamp from a PERIOD column.
|
|
98
|
+
* `DataFrameColumn.between()` - Function to check if the column value is between the lower and upper bounds.
|
|
99
|
+
|
|
100
|
+
* ###### teradataml: Functions
|
|
101
|
+
* `current_date()` - Gets the current date based on the specified time zone.
|
|
102
|
+
* `current_timestamp()` - Gets the current timestamp based on the specified time zone.
|
|
103
|
+
|
|
104
|
+
* ###### teradataml: General Functions
|
|
105
|
+
* Data Transfer Utility
|
|
106
|
+
* `copy_to_sql()`
|
|
107
|
+
* A new argument `partition_by` partitions the index while writing to Teradata Vantage.
|
|
108
|
+
* A new argument `partition_by_case` handles different cases for partitioning the index while writing to Teradata Vantage.
|
|
109
|
+
* A new argument `partition_by_range` partitions the data based on a range while writing to Teradata Vantage.
|
|
110
|
+
* A new argument `sub_partition` subpartitions the main partition according to the provided value.
|
|
111
|
+
* New keyword arguments `valid_time_columns` and `derived_column` help to copy the data into temporal tables.
|
|
112
|
+
|
|
113
|
+
* ###### Enterprise Feature Store
|
|
114
|
+
* `FeatureStore` - Main class for managing Feature Store operations with comprehensive methods and properties.
|
|
115
|
+
* Methods:
|
|
116
|
+
* `apply()` - Adds Feature, Entity, DataSource, FeatureGroup to FeatureStore.
|
|
117
|
+
* `archive_data_source()` - Archives a specified DataSource.
|
|
118
|
+
* `archive_entity()` - Archives a specified Entity.
|
|
119
|
+
* `archive_feature()` - Archives a specified Feature.
|
|
120
|
+
* `archive_feature_group()` - Archives a specified FeatureGroup.
|
|
121
|
+
* `archive_feature_process()` - Archives a specified FeatureProcess.
|
|
122
|
+
* `delete()` - Deletes the FeatureStore and all its components.
|
|
123
|
+
* `delete_data_source()` - Deletes an archived DataSource.
|
|
124
|
+
* `delete_entity()` - Deletes an archived Entity.
|
|
125
|
+
* `delete_feature()` - Deletes an archived Feature.
|
|
126
|
+
* `delete_feature_group()` - Deletes an archived FeatureGroup.
|
|
127
|
+
* `delete_feature_process()` - Deletes an archived FeatureProcess.
|
|
128
|
+
* `get_data()` - Gets data based on features, entities, and processes.
|
|
129
|
+
* `get_data_domain()` - Retrieves DataDomain object.
|
|
130
|
+
* `get_data_source()` - Gets DataSources associated with FeatureStore.
|
|
131
|
+
* `get_dataset_catalog()` - Retrieves the DatasetCatalog object.
|
|
132
|
+
* `get_entity()` - Gets Entity associated with FeatureStore.
|
|
133
|
+
* `get_feature()` - Gets Feature associated with FeatureStore.
|
|
134
|
+
* `get_feature_group()` - Gets FeatureGroup associated with FeatureStore.
|
|
135
|
+
* `get_feature_process()` - Retrieves FeatureProcess based on arguments.
|
|
136
|
+
* `get_feature_catalog()` - Retrieves FeatureCatalog object.
|
|
137
|
+
* `get_group_features()` - Gets features from a specific feature group.
|
|
138
|
+
* `list_data_sources()` - Lists DataSources in the FeatureStore.
|
|
139
|
+
* `list_entities()` - Lists Entities in the FeatureStore.
|
|
140
|
+
* `list_feature_groups()` - Lists FeatureGroups in the FeatureStore.
|
|
141
|
+
* `list_features()` - Lists Features in the FeatureStore.
|
|
142
|
+
* `list_feature_processes()` - Lists all feature processes in the repo.
|
|
143
|
+
* `list_feature_runs()` - Lists feature process runs and execution status.
|
|
144
|
+
* `list_feature_catalogs()` - Lists all feature catalogs in the repo.
|
|
145
|
+
* `list_data_domains()` - Lists all data domains in the repo.
|
|
146
|
+
* `list_dataset_catalogs()` - Lists all dataset catalogs in the repo.
|
|
147
|
+
* `list_repos()` - Lists available repos configured for FeatureStore.
|
|
148
|
+
* `mind_map()` - Generates a mind map visualization of the feature store structure.
|
|
149
|
+
* `remove_data_domain()` - Removes the data domain from the feature store.
|
|
150
|
+
* `repair()` - Repairs the underlying FeatureStore schema on database.
|
|
151
|
+
* `set_features_active()` - Marks Features as active.
|
|
152
|
+
* `set_features_inactive()` - Marks Features as inactive.
|
|
153
|
+
* `setup()` - Sets up the FeatureStore for a repository.
|
|
154
|
+
* Properties:
|
|
155
|
+
* `data_domain` - Gets or sets the data domain of feature store.
|
|
156
|
+
* `grant` - Grants access to the FeatureStore.
|
|
157
|
+
* `repo` - Gets or sets the repository name.
|
|
158
|
+
* `revoke` - Revokes access from the FeatureStore.
|
|
159
|
+
* `version` - Gets the version of the FeatureStore.
|
|
160
|
+
* `FeatureGroup` - Represents a group of features with methods and properties.
|
|
161
|
+
* Methods:
|
|
162
|
+
* `apply()` - Applies the feature group to objects.
|
|
163
|
+
* `from_DataFrame()` - Creates a FeatureGroup from a DataFrame.
|
|
164
|
+
* `from_query()` - Creates a FeatureGroup from a query.
|
|
165
|
+
* `ingest_features()` - Ingests features from the FeatureGroup into the FeatureStore.
|
|
166
|
+
* `remove_feature()` - Removes a feature from the FeatureGroup.
|
|
167
|
+
* `reset_labels()` - Resets the labels of the FeatureGroup.
|
|
168
|
+
* `set_labels()` - Sets the labels of the FeatureGroup.
|
|
169
|
+
* Properties:
|
|
170
|
+
* `features` - Gets the features in the FeatureGroup.
|
|
171
|
+
* `labels` - Gets or sets the labels of the FeatureGroup.
|
|
172
|
+
* `DataDomain` - Represents a data domain within the FeatureStore with properties.
|
|
173
|
+
* Properties:
|
|
174
|
+
* `entities` - Gets the entities in the data domain.
|
|
175
|
+
* `features` - Gets the features in the data domain.
|
|
176
|
+
* `processes` - Gets the feature processes in the data domain.
|
|
177
|
+
* `datasets` - Gets the datasets in the data domain.
|
|
178
|
+
* `FeatureCatalog` - Manages features within a specific data domain.
|
|
179
|
+
* Methods:
|
|
180
|
+
* `upload_features()` - Uploads features to the catalog.
|
|
181
|
+
* `list_features()` - Lists features in the catalog.
|
|
182
|
+
* `list_feature_versions()` - Lists feature versions in the catalog.
|
|
183
|
+
* `archive_features()` - Archives features in the catalog.
|
|
184
|
+
* `delete_features()` - Deletes features from the catalog.
|
|
185
|
+
* Properties:
|
|
186
|
+
* `data_domain` - Gets the data domain of the catalog.
|
|
187
|
+
* `features` - Gets the features in the catalog.
|
|
188
|
+
* `entities` - Gets the entities in the catalog.
|
|
189
|
+
* `DatasetCatalog` - Manages datasets within a specific data domain.
|
|
190
|
+
* Methods:
|
|
191
|
+
* `build_dataset()` - Builds a dataset from features and entities.
|
|
192
|
+
* `build_time_series()` - Builds a time series dataset.
|
|
193
|
+
* `list_datasets()` - Lists datasets in the catalog.
|
|
194
|
+
* `list_entities()` - Lists entities available for dataset building.
|
|
195
|
+
* `list_features()` - Lists features available for dataset building.
|
|
196
|
+
* `get_dataset()` - Gets a specific dataset by ID.
|
|
197
|
+
* `archive_datasets()` - Archives datasets in the catalog.
|
|
198
|
+
* `delete_datasets()` - Deletes datasets from the catalog.
|
|
199
|
+
* Properties:
|
|
200
|
+
* `data_domain` - Gets the data domain of the catalog.
|
|
201
|
+
* `Dataset` - Represents a specific dataset in the catalog.
|
|
202
|
+
* Properties:
|
|
203
|
+
* `features` - Gets the features in the dataset.
|
|
204
|
+
* `entity` - Gets the entity of the dataset.
|
|
205
|
+
* `view_name` - Gets the view name of the dataset.
|
|
206
|
+
* `id` - Gets the ID of the dataset.
|
|
207
|
+
* `FeatureProcess` - Represents a feature processing workflow.
|
|
208
|
+
* Methods:
|
|
209
|
+
* `run()` - Executes the feature process with optional filters and as_of parameters.
|
|
210
|
+
* Properties:
|
|
211
|
+
* `process_id` - Gets the process ID.
|
|
212
|
+
* `df` - Gets the DataFrame associated with the process.
|
|
213
|
+
* `features` - Gets the features in the process.
|
|
214
|
+
* `entity` - Gets the entity in the process.
|
|
215
|
+
* `data_domain` - Gets the data domain of the process.
|
|
216
|
+
* `filters` - Gets the filters applied to the process.
|
|
217
|
+
* `as_of` - Gets the as_of parameter of the process.
|
|
218
|
+
* `description` - Gets the description of the process.
|
|
219
|
+
* `start_time` - Gets the start time of the process.
|
|
220
|
+
* `end_time` - Gets the end time of the process.
|
|
221
|
+
* `status` - Gets the status of the process.
|
|
222
|
+
|
|
223
|
+
* ###### OpensourceML
|
|
224
|
+
* `td_sklearn` - Now supports input from OTF tables.
|
|
225
|
+
|
|
226
|
+
* ###### BYOM Function
|
|
227
|
+
* `ONNXSeq2Seq()` - Applies sequence-to-sequence model in Vantage that has been created outside Vantage and stored in ONNX format.
|
|
228
|
+
|
|
229
|
+
* ###### teradataml: AutoFraud (Automated Machine Learning - Fraud Detection)
|
|
230
|
+
`AutoFraud` is a special purpose AutoML pipeline designed for fraud detection tasks. It automates the end-to-end process of data preprocessing, feature engineering, model training, evaluation, and deployment to efficiently identify fraudulent activities.
|
|
231
|
+
* Methods:
|
|
232
|
+
* `__init__()` - Instantiates an object of AutoFraud.
|
|
233
|
+
* `fit()` - Performs fit on specified data and target column.
|
|
234
|
+
* `leaderboard()` - Gets the leaderboard for the AutoFraud pipeline, with diverse models, feature selection methods, and performance metrics.
|
|
235
|
+
* `leader()` - Shows best performing model and its details such as feature selection method and performance metrics.
|
|
236
|
+
* `predict()` - Performs prediction on the data using the best model or the model of user's choice from the leaderboard.
|
|
237
|
+
* `evaluate()` - Performs evaluation on the data using the best model or the model of user's choice from the leaderboard.
|
|
238
|
+
* `load()` - Loads the saved model from database.
|
|
239
|
+
* `deploy()` - Saves the trained model inside database.
|
|
240
|
+
* `remove_saved_model()` - Removes the saved model in database.
|
|
241
|
+
* `model_hyperparameters()` - Returns the hyperparameters of fitted or loaded models.
|
|
242
|
+
* `get_persisted_tables()` - Lists the persisted tables created during AutoFraud execution.
|
|
243
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
244
|
+
* `generate_custom_config()` - Generates custom config JSON file required for customized run of AutoFraud.
|
|
245
|
+
|
|
246
|
+
* ###### teradataml: AutoChurn (Automated Machine Learning - Churn Prediction)
|
|
247
|
+
`AutoChurn` is a special purpose AutoML pipeline for customer churn prediction. It automates the end-to-end process of data preprocessing, feature engineering, model training, evaluation, and deployment to efficiently identify customers likely to churn.
|
|
248
|
+
* Methods:
|
|
249
|
+
* `__init__()` - Instantiates an object of AutoChurn.
|
|
250
|
+
* `fit()` - Performs fit on specified data and target column.
|
|
251
|
+
* `leaderboard()` - Gets the leaderboard for the AutoChurn pipeline, with diverse models, feature selection methods, and performance metrics.
|
|
252
|
+
* `leader()` - Shows best performing model and its details such as feature selection method and performance metrics.
|
|
253
|
+
* `predict()` - Performs prediction on the data using the best model or the model of user's choice from the leaderboard.
|
|
254
|
+
* `evaluate()` - Performs evaluation on the data using the best model or the model of user's choice from the leaderboard.
|
|
255
|
+
* `load()` - Loads the saved model from database.
|
|
256
|
+
* `deploy()` - Saves the trained model inside database.
|
|
257
|
+
* `remove_saved_model()` - Removes the saved model in database.
|
|
258
|
+
* `model_hyperparameters()` - Returns the hyperparameters of fitted or loaded models.
|
|
259
|
+
* `get_persisted_tables()` - Lists the persisted tables created during AutoChurn execution.
|
|
260
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
261
|
+
* `generate_custom_config()` - Generates custom config JSON file required for customized run of AutoChurn.
|
|
262
|
+
|
|
263
|
+
* ###### teradataml: AutoCluster (Automated Machine Learning - Clustering)
|
|
264
|
+
`AutoCluster` is a special purpose AutoML pipeline for clustering analysis. It automates the end-to-end process of data preprocessing, feature engineering, model training, and prediction to efficiently group data into clusters and extract insights from unlabeled datasets.
|
|
265
|
+
* Methods:
|
|
266
|
+
* `__init__()` - Instantiates an object of AutoCluster.
|
|
267
|
+
* `fit()` - Performs fit on specified data.
|
|
268
|
+
* `leaderboard()` - Gets the leaderboard for the AutoCluster pipeline, with diverse models, feature selection methods, and performance metrics.
|
|
269
|
+
* `leader()` - Shows best performing model and its details such as feature selection method and performance metrics.
|
|
270
|
+
* `predict()` - Performs prediction (cluster assignment) on the data using the best model or the model of user's choice from the leaderboard.
|
|
271
|
+
* `model_hyperparameters()` - Returns the hyperparameters of fitted or loaded models.
|
|
272
|
+
* `get_persisted_tables()` - Lists the persisted tables created during AutoCluster execution.
|
|
273
|
+
* `generate_custom_config()` - Generates custom config JSON file required for customized run of AutoCluster.
|
|
274
|
+
|
|
275
|
+
* ##### Updates
|
|
276
|
+
* ###### teradataml: Functions
|
|
277
|
+
* `udf()` - Added support for `td_buffer` to cache the data in the user defined function.
|
|
278
|
+
|
|
279
|
+
* ###### Open Analytics Framework (OpenAF)
|
|
280
|
+
* UserEnv Class.
|
|
281
|
+
* Properties:
|
|
282
|
+
* `models` - Supports listing of models installed from external model registry like HuggingFace as well.
|
|
283
|
+
* Methods:
|
|
284
|
+
* `install_model()` - Added new arguments `model_name`, `model_type` and `api_key` to support installation of models from external model registry like HuggingFace.
|
|
285
|
+
* `uninstall_model()` - Supports uninstallation of a model from user environment which is installed from external model registry like HuggingFace.
|
|
286
|
+
|
|
287
|
+
* ##### Bug Fixes
|
|
288
|
+
* `set_auth_token()` generates JWT token using default value for iat claim when authentication is being done using PEM file and PAT.
|
|
289
|
+
* `create_env()` - When an unavailable R base environment is provided in `create_env()`, requested R user environment is created using latest R base environment version
|
|
290
|
+
out of available base environments. Earlier, `create_env()` would create user environment with latest Python base environment version even though the request is for R user environment.
|
|
291
|
+
* Fixed `UserWarning` in `db_list_tables()`.
|
|
292
|
+
|
|
293
|
+
#### teradataml 20.00.00.06
|
|
294
|
+
* ##### New Features/Functionality
|
|
295
|
+
* ###### teradataml: SDK
|
|
296
|
+
* Added new client `teradataml.sdk.Client` which can be used by user to make REST calls through SDK.
|
|
297
|
+
* New exception `TeradatamlRestException` added in `teradataml`, specifically for REST APIs, that has attribute `json_response` providing proper printable JSON.
|
|
298
|
+
* Exposed three different ways of authentication through `Client`.
|
|
299
|
+
* Client credentials Authentication through `ClientCredentialsAuth` class.
|
|
300
|
+
* Device code Authentication through `DeviceCodeAuth` class.
|
|
301
|
+
* Bearer Authentication through `BearerAuth` class.
|
|
302
|
+
|
|
303
|
+
* ###### teradataml: ModelOps SDK
|
|
304
|
+
* `teradataml` exposes Python interfaces for all the REST APIs provided by Teradata Vantage ModelOps.
|
|
305
|
+
* Added support for `blueprint()` method which prints available classes in `modelops` module.
|
|
306
|
+
* Added new client `ModelOpsClient` with some additional functions compared to `teradataml.sdk.Client`.
|
|
307
|
+
* teradataml classes are added for the schema in ModelOps OpenAPI specification.
|
|
308
|
+
```python
|
|
309
|
+
>>> from teradataml.sdk.modelops import ModelOpsClient, Projects
|
|
310
|
+
>>> from teradataml.common.exceptions import TeradatamlRestException
|
|
311
|
+
>>> from teradataml.sdk import DeviceCodeAuth, BearerAuth, ClientCredentialsAuth # Authentication related classes.
|
|
312
|
+
>>> from teradataml.sdk.modelops import models # All classes related to OpenAPI schema are present in this module.
|
|
313
|
+
|
|
314
|
+
# Print available classes in modelops module.
|
|
315
|
+
>>> from teradataml.sdk.modelops import blueprint
|
|
316
|
+
>>> blueprint()
|
|
317
|
+
|
|
318
|
+
# Create ClientCredentialsAuth object and create ModelOpsClient object.
|
|
319
|
+
>>> cc_obj = ClientCredentialsAuth(auth_client_id="<client_id>",
|
|
320
|
+
auth_client_secret="<client_secret>",
|
|
321
|
+
auth_token_url="https://<example.com>/token")
|
|
322
|
+
>>> client = ModelOpsClient(base_url="<base_url>", auth=cc_obj, ssl_verify=False)
|
|
323
|
+
|
|
324
|
+
# Create Projects object.
|
|
325
|
+
>>> p = Projects(client=client)
|
|
326
|
+
|
|
327
|
+
# Create project using `body` argument taking object of ProjectRequestBody.
|
|
328
|
+
>>> project_payload = {
|
|
329
|
+
"name": "dummy_project",
|
|
330
|
+
"description": "dummy_project created for testing",
|
|
331
|
+
"groupId": "<group_ID>",
|
|
332
|
+
"gitRepositoryUrl": "/app/built-in/empty",
|
|
333
|
+
"branch": "<branch>"
|
|
334
|
+
}
|
|
335
|
+
>>> p.create_project(body=models.ProjectRequestBody(**project_payload))
|
|
336
|
+
```
|
|
337
|
+
|
|
338
|
+
* ###### teradataml: Functions
|
|
339
|
+
* `get_formatters()` - Get the formatters for NUMERIC, DATE and CHAR types.
|
|
340
|
+
|
|
341
|
+
* ###### teradataml: DataFrame Methods
|
|
342
|
+
* `get_snapshot()` - Gets the snapshot data of a teradataml DataFrame created on OTF table for a given snapshot id or timestamp.
|
|
343
|
+
* `from_pandas()`: Creates a teradataml DataFrame from a pandas DataFrame.
|
|
344
|
+
* `from_records()`: Creates a teradataml DataFrame from a list.
|
|
345
|
+
* `from_dict()`: Creates a teradataml DataFrame from a dictionary.
|
|
346
|
+
|
|
347
|
+
* ###### teradataml: DataFrame Property
|
|
348
|
+
* `history` - Returns snapshot history for a DataFrame created on OTF table.
|
|
349
|
+
* `manifests` - Returns manifest information for a DataFrame created on OTF table.
|
|
350
|
+
* `partitions` - Returns partition information for a DataFrame created on OTF table.
|
|
351
|
+
* `snapshots` - Returns snapshot information for a DataFrame created on OTF table.
|
|
352
|
+
|
|
353
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
354
|
+
* `DataFrameColumn.rlike()` - Function to match a string against a regular expression pattern.
|
|
355
|
+
* `DataFrameColumn.substring_index()` - Function to return the substring from a column before a specified
|
|
356
|
+
delimiter, up to a given occurrence count.
|
|
357
|
+
* `DataFrameColumn.count_delimiters()` - Function to count the total number of occurrences of a specified delimiter.
|
|
358
|
+
|
|
359
|
+
* ##### Updates
|
|
360
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
361
|
+
* `DataFrameColumn.like()`
|
|
362
|
+
* Added argument `escape_char` to specify the escape character for the LIKE pattern.
|
|
363
|
+
* Argument `pattern` now accepts DataFrameColumn as input.
|
|
364
|
+
* `DataFrameColumn.ilike()`
|
|
365
|
+
* Added argument `escape_char` to specify the escape character for the ILIKE pattern.
|
|
366
|
+
* Argument `pattern` now accepts DataFrameColumn as input.
|
|
367
|
+
* `DataFrameColumn.parse_url()` - Added argument `key` to extract a specific query parameter when `url_part` is set to "QUERY".
|
|
368
|
+
|
|
369
|
+
* ###### teradataml: DataFrame function
|
|
370
|
+
* `groupby()`, `cube()` and `rollup()`
|
|
371
|
+
* Added argument `include_grouping_columns` to include aggregations on the grouping column(s).
|
|
372
|
+
* `DataFrame()`: New argument `data`, that accepts input data to create a teradataml DataFrame, is added.
|
|
373
|
+
|
|
374
|
+
* ###### General functions
|
|
375
|
+
* `set_auth_token()`
|
|
376
|
+
* New keyword argument `auth_url` accepts the endpoint URL for a keycloak server.
|
|
377
|
+
* New keyword argument `rest_client` accepts name of the service for which keycloak token is to be generated.
|
|
378
|
+
* New keyword argument `validate_jwt` accepts the boolean flag to decide whether to validate generated JWT token or not.
|
|
379
|
+
* New keyword argument `valid_from` accepts the epoch seconds representing time from which JWT token will be valid.
|
|
380
|
+
|
|
381
|
+
* ###### teradataml Options
|
|
382
|
+
* Configuration Options
|
|
383
|
+
* `configure.use_short_object_name`
|
|
384
|
+
Specifies whether to use a shorter name for temporary database objects which are created by teradataml internally.
|
|
385
|
+
|
|
386
|
+
* ###### BYOM Function
|
|
387
|
+
* Supports special characters.
|
|
388
|
+
|
|
389
|
+
#### teradataml 20.00.00.05
|
|
390
|
+
* ##### New Features/Functionality
|
|
391
|
+
* ##### teradataml: AutoML
|
|
392
|
+
* New methods added for `AutoML()`, `AutoRegressor()` and `AutoClassifier()`:
|
|
393
|
+
* `get_persisted_tables()` - List the persisted tables created during AutoML execution.
|
|
394
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
395
|
+
|
|
396
|
+
* ##### AutoDataPrep - Automated Data Preparation
|
|
397
|
+
AutoDataPrep simplifies the data preparation process by automating the different aspects of
|
|
398
|
+
data cleaning and transformation, enabling seamless exploration, transformation, and optimization of datasets.
|
|
399
|
+
* `AutoDataPrep`
|
|
400
|
+
* Methods of AutoDataPrep
|
|
401
|
+
* `__init__()` - Instantiate an object of AutoDataPrep with given parameters.
|
|
402
|
+
* `fit()` - Perform fit on specified data and target column.
|
|
403
|
+
* `get_data()` - Retrieve the data after AutoDataPrep.
|
|
404
|
+
* `load()` - Load the saved datasets from Teradata Vantage.
|
|
405
|
+
* `deploy()` - Persist the datasets generated by AutoDataPrep in Teradata Vantage.
|
|
406
|
+
* `delete_data()` - Deletes the deployed dataset from the Teradata Vantage.
|
|
407
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
408
|
+
|
|
409
|
+
* ##### teradataml: SQLE Engine Analytic Functions
|
|
410
|
+
* New Analytics Database Analytic Functions:
|
|
411
|
+
* `Apriori()`
|
|
412
|
+
* `NERExtractor()`
|
|
413
|
+
* `TextMorph()`
|
|
414
|
+
|
|
415
|
+
* ##### teradataml: Functions
|
|
416
|
+
* `td_range()` - Creates a DataFrame with a specified range of numbers.
|
|
417
|
+
|
|
418
|
+
* ##### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
419
|
+
* `DataFrameColumn.to_number()` - Function converts a string-like representation of a number to NUMBER type.
|
|
420
|
+
|
|
421
|
+
* ##### Updates
|
|
422
|
+
* ###### teradataml: DataFrame function
|
|
423
|
+
* `DataFrame.agg()`: User can request for different percentiles while running agg function.
|
|
424
|
+
* New argument `debug` is added to `DataFrame.map_row()`, `DataFrame.map_partition()`, `DataFrame.apply()` and `udf()`. During the execution of these functions, teradataml internally generates scripts, which are garbage collected implicitly. To debug the failures, this argument allows user to control the garbage collection of the script. When set to False (default), script generated is garbage collected, otherwise script is not garbage collected and displays the path to the script, and user is responsible to remove the script if required.
|
|
425
|
+
* `map_row()`, `map_partition()` and `apply()`
|
|
426
|
+
* Raises a TeradataMlException, if the Python interpreter major version is different between the Vantage Python environment and the local user environment.
|
|
427
|
+
* Displays a warning, if `dill` package version is different between the Vantage Python environment and the local user environment.
|
|
428
|
+
* `DataFrame.describe()`: Argument `include` is no longer supported.
|
|
429
|
+
* `assign()` - Optimized SQL query to enhance the performance for consecutive assign calls.
|
|
430
|
+
|
|
431
|
+
* ###### teradataml: Context Creation
|
|
432
|
+
* `create_context()`
|
|
433
|
+
* Enables user to set the authentication token while creating the connection. This authentication token is required to access services running on Teradata Vantage.
|
|
434
|
+
* New argument `sql_timeout` is added to specify timeout for SQL statement execution triggered from the current session.
|
|
435
|
+
|
|
436
|
+
* ###### teradataml: UAF Functions
|
|
437
|
+
* Integer type value is now accepted as a valid value for function arguments accepting float type.
|
|
438
|
+
|
|
439
|
+
* ###### General functions
|
|
440
|
+
* `set_auth_token()`
|
|
441
|
+
* Added argument `kid` to accept the name of the key used while generating `pem_file`.
|
|
442
|
+
* New keyword argument `auth_mech` accepts the authentication mechanism to be used for generating authentication token.
|
|
443
|
+
* Basic authentication is now supported as well. New keyword argument `password` accepts password for database user in such case.
|
|
444
|
+
* `copy_to_sql()` and `read_csv()` support the VECTOR data type.
|
|
445
|
+
|
|
446
|
+
* ###### Open Analytics Framework (OpenAF) APIs:
|
|
447
|
+
* `create_env()`:
|
|
448
|
+
* Supports creation of conda R environment.
|
|
449
|
+
|
|
450
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
451
|
+
* _String Functions_
|
|
452
|
+
* `DataFrameColumn.substr()` - Arguments `start_pos` and `length` now accept DataFrameColumn as input.
|
|
453
|
+
* `DataFrameColumn.to_char()` - Argument `formatter` now accepts DataFrameColumn as input.
|
|
454
|
+
|
|
455
|
+
* ###### teradataml: SQLE Engine Analytic Functions
|
|
456
|
+
* Updated Analytics Database Analytic Functions:
|
|
457
|
+
* `SMOTE()` is now supported on 17.20.00.00 as well.
|
|
458
|
+
* `TextParser()`
|
|
459
|
+
* New arguments added: `enforce_token_limit`, `delimiter_regex`, `doc_id_column`,
|
|
460
|
+
`list_positions`, `token_frequency`, `output_by_word`
|
|
461
|
+
|
|
462
|
+
#### teradataml 20.00.00.04
|
|
463
|
+
* ##### New Features/Functionality
|
|
464
|
+
* ###### teradataml OTF Support:
|
|
465
|
+
* This release has enabled the support for accessing OTF data from teradataml.
|
|
466
|
+
* User can now create a teradataml DataFrame on OTF table, allowing user to use teradataml functions.
|
|
467
|
+
* Example usage below:
|
|
468
|
+
* Creation of view on OTF/datalake table is not supported. Hence, user has to set `configure.temp_object_type` to `VT` using below-mentioned statement.
|
|
469
|
+
```configure.temp_object_type = "VT"```
|
|
470
|
+
* User needs to provide additional information about datalake while creating the DataFrame. There are two approaches to provide datalake information
|
|
471
|
+
* Approach 1: Using `in_schema()`
|
|
472
|
+
```
|
|
473
|
+
>>> from teradataml.dataframe.dataframe import in_schema
|
|
474
|
+
# Create an in_schema object to provide additional information about datalake.
|
|
475
|
+
>>> in_schema_tbl = in_schema(schema_name="datalake_db",
|
|
476
|
+
... table_name="datalake_table_name",
|
|
477
|
+
... datalake_name="datalake")
|
|
478
|
+
>>> otf_df = DataFrame(in_schema_tbl)
|
|
479
|
+
```
|
|
480
|
+
* Approach 2: Using `DataFrame.from_table()`
|
|
481
|
+
```
|
|
482
|
+
>>> otf_df = DataFrame.from_table(table_name = "datalake_table_name",
|
|
483
|
+
... schema_name="datalake_db",
|
|
484
|
+
... datalake_name="datalake")
|
|
485
|
+
```
|
|
486
|
+
* Once this DataFrame is created, users can use any DataFrame method or analytics features/functionality from teradataml with it. Visit Limitations and considerations section in _Teradata Python Package User Guide_ to check the supportability.
|
|
487
|
+
* Note: All further operations create volatile tables in local database.
|
|
488
|
+
```
|
|
489
|
+
>>> new_df = otf_df.assign(new_col=otf_df.existing_col*2)
|
|
490
|
+
```
|
|
491
|
+
* ###### teradataml: DataFrame
|
|
492
|
+
* Introduced a new feature 'Exploratory Data Analysis UI' (EDA-UI), which enhances
|
|
493
|
+
the user experience of teradataml with Jupyter notebook. EDA-UI is displayed by default
|
|
494
|
+
when a teradataml DataFrame is printed in the Jupyter notebook.
|
|
495
|
+
* User can control the EDA-UI using a new configuration option `display.enable_ui`.
|
|
496
|
+
It can be disabled by setting `display.enable_ui` to False.
|
|
497
|
+
* New Function
|
|
498
|
+
* `get_output()` is added to get the result of Analytic function when executed from EDA UI.
|
|
499
|
+
|
|
500
|
+
* ###### OpensourceML
|
|
501
|
+
* `td_lightgbm` - A teradataml OpenSourceML module
|
|
502
|
+
* `deploy()` - User can now deploy the models created by lightgbm `Booster` and `sklearn` modules. Deploying the model stores the model in Vantage for future use with `td_lightgbm`.
|
|
503
|
+
* `td_lightgbm.deploy()` - Deploy the lightgbm `Booster` or any `scikit-learn` model trained outside Vantage.
|
|
504
|
+
* `td_lightgbm.train().deploy()` - Deploys the lightgbm `Booster` object trained within Vantage.
|
|
505
|
+
* `td_lightgbm.<sklearn_class>().deploy()` - Deploys lightgbm's sklearn class object created/trained within Vantage.
|
|
506
|
+
* `load()` - User can load the deployed models back in the current session. This allows user to use the lightgbm functions with the `td_lightgbm` module.
|
|
507
|
+
* `td_lightgbm.load()` - Load the deployed model in the current session.
|
|
508
|
+
|
|
509
|
+
* ###### FeatureStore
|
|
510
|
+
* New function `FeatureStore.delete()` is added to drop the Feature Store and corresponding repo from Vantage.
|
|
511
|
+
|
|
512
|
+
* ###### Database Utility
|
|
513
|
+
* `db_python_version_diff()` - Identifies the Python interpreter major version difference between the interpreter installed on Vantage vs interpreter on the local user environment.
|
|
514
|
+
* `db_python_package_version_diff()` - Identifies the Python package version difference between the packages installed on Vantage vs the local user environment.
|
|
515
|
+
|
|
516
|
+
* ###### BYOM Function
|
|
517
|
+
* `ONNXEmbeddings()` - Calculate embeddings values in Vantage using an embeddings model that has been created outside Vantage and stored in ONNX format.
|
|
518
|
+
|
|
519
|
+
* ###### teradataml Options
|
|
520
|
+
* Configuration Options
|
|
521
|
+
* `configure.temp_object_type` - Allows user to choose between creating volatile tables or views for teradataml internal use. By default, teradataml internally creates the views for some of the operations. Now, with new configuration option, user can opt to create Volatile tables instead of views. This provides greater flexibility for users who lack the necessary permissions to create view or need to create views on tables without WITH GRANT permissions.
|
|
522
|
+
* Display Options
|
|
523
|
+
* `display.enable_ui` - Specifies whether to display exploratory data analysis UI when DataFrame is printed. By default, this option is enabled (True), allowing exploratory data analysis UI to be displayed. When set to False, exploratory data analysis UI is hidden.
|
|
524
|
+
|
|
525
|
+
* ##### Updates
|
|
526
|
+
* ###### teradataml: DataFrame function
|
|
527
|
+
* `describe()`
|
|
528
|
+
* New argument added: `pivot`.
|
|
529
|
+
* When argument `pivot` is set to False, Non-numeric columns are no longer supported for generating statistics.
|
|
530
|
+
Use `CategoricalSummary` and `ColumnSummary`.
|
|
531
|
+
* `fillna()` - Accepts new argument `partition_column` to partition the data and impute null values accordingly.
|
|
532
|
+
* Optimised performance for `DataFrame.plot()`.
|
|
533
|
+
* `DataFrame.plot()` will not regenerate the image when run more than once with same arguments.
|
|
534
|
+
* `DataFrame.from_table()`: New argument `datalake_name` added to accept datalake name while creating DataFrame on datalake table.
|
|
535
|
+
|
|
536
|
+
* ###### teradataml: DataFrame Utilities
|
|
537
|
+
* `in_schema()`: New argument `datalake_name` added to accept datalake name.
|
|
538
|
+
|
|
539
|
+
* ###### Table Operator
|
|
540
|
+
* `Apply()` no longer looks at authentication token by default. Authentication token is now required only if user wants to consume Open Analytics Framework REST APIs.
|
|
541
|
+
|
|
542
|
+
* ###### Hyper Parameter Tuner
|
|
543
|
+
* `GridSearch()` and `RandomSearch()` now display a message to refer to `get_error_log()` API when model training fails in HPT.
|
|
544
|
+
|
|
545
|
+
* ###### teradataml Options
|
|
546
|
+
* Configuration Options
|
|
547
|
+
* `configure.indb_install_location`
|
|
548
|
+
Determines the installation location of the In-DB Python package based on the installed RPM version.
|
|
549
|
+
|
|
550
|
+
* ###### teradataml Context Creation
|
|
551
|
+
* `create_context()` - Enables user to create connection using either parameters set in environment or config file, in addition to previous method. Newly added options help users to hide the sensitive data from the script.
|
|
552
|
+
|
|
553
|
+
* ###### Open Analytics Framework
|
|
554
|
+
* Enhanced the `create_env()` to display a message when an invalid base_env is passed, informing users that the default base_env is being used.
|
|
555
|
+
|
|
556
|
+
* ###### OpensourceML
|
|
557
|
+
* Raises a TeradataMlException, if the Python interpreter major version is different between the Vantage Python environment and the local user environment.
|
|
558
|
+
* Displays a warning, if specific Python package versions are different between the Vantage Python environment and the local user environment.
|
|
559
|
+
|
|
560
|
+
* ###### Database Utility
|
|
561
|
+
* `db_list_tables()`: New argument `datalake_name` added to accept datalake name to list tables from.
|
|
562
|
+
* `db_drop_table()`:
|
|
563
|
+
* New argument `datalake_name` added to accept datalake name to drop tables from.
|
|
564
|
+
* New argument `purge` added to specify whether to use `PURGE ALL` or `NO PURGE` clause while dropping table.
|
|
565
|
+
|
|
566
|
+
* ##### Bug Fixes
|
|
567
|
+
* `td_lightgbm` OpensourceML module: In multi model case, `td_lightgbm.Dataset().add_features_from()` function should add features of one partition in first Dataset to features of the same partition in second Dataset. Previously, this was not the case and the function failed. This is now fixed.
|
|
568
|
+
* Fixed a minor bug in the `Shap()` and converted argument `training_method` to required argument.
|
|
569
|
+
* Fixed PCA-related warnings in `AutoML`.
|
|
570
|
+
* `AutoML` no longer fails when data with all categorical columns are provided.
|
|
571
|
+
* Fixed `AutoML` issue with upsampling method.
|
|
572
|
+
* Excluded the identifier column from outlier processing in `AutoML`.
|
|
573
|
+
* `DataFrame.set_index()` no longer modifies the original DataFrame's index when argument `append` is used.
|
|
574
|
+
* `concat()` function now supports DataFrames with column names that start with a digit, contain special characters, or contain reserved keywords.
|
|
575
|
+
* `create_env()` proceeds to install other files even if current file installation fails.
|
|
576
|
+
* Corrected the error message being raised in `create_env()` when authentication token is not set.
|
|
577
|
+
* Added missing argument `charset` for Vantage Analytic Library functions.
|
|
578
|
+
* New argument `seed` is added to `AutoML`, `AutoRegressor` and `AutoClassifier` to ensure consistency on result.
|
|
579
|
+
* Analytic functions now work even if name of columns for underlying tables has non-ascii characters.
|
|
580
|
+
|
|
581
|
+
#### teradataml 20.00.00.03
|
|
582
|
+
|
|
583
|
+
* teradataml no longer supports setting the `auth_token` using `set_config_params()`. Users should use `set_auth_token()` to set the token.
|
|
584
|
+
|
|
585
|
+
* ##### New Features/Functionality
|
|
586
|
+
* ###### teradataml: DataFrame
|
|
587
|
+
* New Function
|
|
588
|
+
* `alias()` - Creates a DataFrame with alias name.
|
|
589
|
+
* New Properties
|
|
590
|
+
* `db_object_name` - Get the underlying database object name, on which DataFrame is created.
|
|
591
|
+
|
|
592
|
+
* ###### teradataml: GeoDataFrame
|
|
593
|
+
* New Function
|
|
594
|
+
* `alias()` - Creates a GeoDataFrame with alias name.
|
|
595
|
+
|
|
596
|
+
* ###### teradataml: DataFrameColumn a.k.a. ColumnExpression
|
|
597
|
+
* _Arithmetic Functions_
|
|
598
|
+
* `DataFrameColumn.isnan()` - Function evaluates expression to determine if the floating-point
|
|
599
|
+
argument is a NaN (Not-a-Number) value.
|
|
600
|
+
* `DataFrameColumn.isinf()` - Function evaluates expression to determine if the floating-point
|
|
601
|
+
argument is an infinite number.
|
|
602
|
+
* `DataFrameColumn.isfinite()` - Function evaluates expression to determine if it is a finite
|
|
603
|
+
floating value.
|
|
604
|
+
|
|
605
|
+
* ###### FeatureStore - handles feature management within the Vantage environment
|
|
606
|
+
* FeatureStore Components
|
|
607
|
+
* Feature - Represents a feature which is used in ML Modeling.
|
|
608
|
+
* Entity - Represents the columns which serve as uniqueness for the data used in ML Modeling.
|
|
609
|
+
* DataSource - Represents the source of Data.
|
|
610
|
+
* FeatureGroup - Collection of Feature, Entity and DataSource.
|
|
611
|
+
* Methods
|
|
612
|
+
* `apply()` - Adds Feature, Entity, DataSource to a FeatureGroup.
|
|
613
|
+
* `from_DataFrame()` - Creates a FeatureGroup from teradataml DataFrame.
|
|
614
|
+
* `from_query()` - Creates a FeatureGroup using a SQL query.
|
|
615
|
+
* `remove()` - Removes Feature, Entity, or DataSource from a FeatureGroup.
|
|
616
|
+
* `reset_labels()` - Removes the labels assigned to the FeatureGroup, that are set using `set_labels()`.
|
|
617
|
+
* `set_labels()` - Sets the Features as labels for a FeatureGroup.
|
|
618
|
+
* Properties
|
|
619
|
+
* `features` - Get the features of a FeatureGroup.
|
|
620
|
+
* `labels` - Get the labels of FeatureGroup.
|
|
621
|
+
* FeatureStore
|
|
622
|
+
* Methods
|
|
623
|
+
* `apply()` - Adds Feature, Entity, DataSource, FeatureGroup to FeatureStore.
|
|
624
|
+
* `archive_data_source()` - Archives a specified DataSource from a FeatureStore.
|
|
625
|
+
* `archive_entity()` - Archives a specified Entity from a FeatureStore.
|
|
626
|
+
* `archive_feature()` - Archives a specified Feature from a FeatureStore.
|
|
627
|
+
* `archive_feature_group()` - Archives a specified FeatureGroup from a FeatureStore. Method archives underlying Feature, Entity, DataSource also.
|
|
628
|
+
* `delete_data_source()` - Deletes an archived DataSource.
|
|
629
|
+
* `delete_entity()` - Deletes an archived Entity.
|
|
630
|
+
* `delete_feature()` - Deletes an archived Feature.
|
|
631
|
+
* `delete_feature_group()` - Deletes an archived FeatureGroup.
|
|
632
|
+
* `get_data_source()` - Get the DataSources associated with FeatureStore.
|
|
633
|
+
* `get_dataset()` - Get the teradataml DataFrame based on Features, Entities and DataSource from FeatureGroup.
|
|
634
|
+
* `get_entity()` - Get the Entity associated with FeatureStore.
|
|
635
|
+
* `get_feature()` - Get the Feature associated with FeatureStore.
|
|
636
|
+
* `get_feature_group()` - Get the FeatureGroup associated with FeatureStore.
|
|
637
|
+
* `list_data_sources()` - List DataSources.
|
|
638
|
+
* `list_entities()` - List Entities.
|
|
639
|
+
* `list_feature_groups()` - List FeatureGroups.
|
|
640
|
+
* `list_features()` - List Features.
|
|
641
|
+
* `list_repos()` - List available repos which are configured for FeatureStore.
|
|
642
|
+
* `repair()` - Repairs the underlying FeatureStore schema on database.
|
|
643
|
+
* `set_features_active()` - Marks the Features as active.
|
|
644
|
+
* `set_features_inactive()` - Marks the Features as inactive.
|
|
645
|
+
* `setup()` - Setup the FeatureStore for a repo.
|
|
646
|
+
* Property
|
|
647
|
+
* `repo` - Property for FeatureStore repo.
|
|
648
|
+
* `grant` - Property to Grant access on FeatureStore to user.
|
|
649
|
+
* `revoke` - Property to Revoke access on FeatureStore from user.
|
|
650
|
+
|
|
651
|
+
* ###### teradataml: Table Operator Functions
|
|
652
|
+
* `Image2Matrix()` - Converts an image into a matrix.
|
|
653
|
+
|
|
654
|
+
* ###### teradataml: SQLE Engine Analytic Functions
|
|
655
|
+
* New Analytics Database Analytic Functions:
|
|
656
|
+
* `CFilter()`
|
|
657
|
+
* `NaiveBayes()`
|
|
658
|
+
* `TDNaiveBayesPredict()`
|
|
659
|
+
* `Shap()`
|
|
660
|
+
* `SMOTE()`
|
|
661
|
+
|
|
662
|
+
* ###### teradataml: Unbounded Array Framework (UAF) Functions
|
|
663
|
+
* New Unbounded Array Framework(UAF) Functions:
|
|
664
|
+
* `CopyArt()`
|
|
665
|
+
|
|
666
|
+
* ###### General functions
|
|
667
|
+
* Vantage File Management Functions
|
|
668
|
+
* `list_files()` - List the installed files in Database.
|
|
669
|
+
|
|
670
|
+
* ###### OpensourceML: LightGBM
|
|
671
|
+
* teradataml adds support for lightGBM package through `OpensourceML` (`OpenML`) feature.
|
|
672
|
+
The following functionality is added in the current release:
|
|
673
|
+
* `td_lightgbm` - Interface object to run lightgbm functions and classes through Teradata Vantage.
|
|
674
|
+
Example usage below:
|
|
675
|
+
```
|
|
676
|
+
from teradataml import td_lightgbm, DataFrame
|
|
677
|
+
|
|
678
|
+
df_train = DataFrame("multi_model_classification")
|
|
679
|
+
|
|
680
|
+
feature_columns = ["col1", "col2", "col3", "col4"]
|
|
681
|
+
label_columns = ["label"]
|
|
682
|
+
part_columns = ["partition_column_1", "partition_column_2"]
|
|
683
|
+
|
|
684
|
+
df_x = df_train.select(feature_columns)
|
|
685
|
+
df_y = df_train.select(label_columns)
|
|
686
|
+
|
|
687
|
+
# Dataset creation.
|
|
688
|
+
# Single model case.
|
|
689
|
+
obj_s = td_lightgbm.Dataset(df_x, df_y, silent=True, free_raw_data=False)
|
|
690
|
+
|
|
691
|
+
# Multi model case.
|
|
692
|
+
obj_m = td_lightgbm.Dataset(df_x, df_y, free_raw_data=False, partition_columns=part_columns)
|
|
693
|
+
obj_m_v = td_lightgbm.Dataset(df_x, df_y, free_raw_data=False, partition_columns=part_columns)
|
|
694
|
+
|
|
695
|
+
## Model training.
|
|
696
|
+
# Single model case.
|
|
697
|
+
opt = td_lightgbm.train(params={}, train_set = obj_s, num_boost_round=30)
|
|
698
|
+
|
|
699
|
+
opt.predict(data=df_x, num_iteration=20, pred_contrib=True)
|
|
700
|
+
|
|
701
|
+
# Multi model case.
|
|
702
|
+
opt = td_lightgbm.train(params={}, train_set = obj_m, num_boost_round=30,
|
|
703
|
+
callbacks=[td_lightgbm.record_evaluation(rec)],
|
|
704
|
+
valid_sets=[obj_m_v, obj_m_v])
|
|
705
|
+
|
|
706
|
+
# Passing `label` argument to get it returned in output DataFrame.
|
|
707
|
+
opt.predict(data=df_x, label=df_y, num_iteration=20)
|
|
708
|
+
|
|
709
|
+
```
|
|
710
|
+
* Added support for accessing scikit-learn APIs using exposed interface object `td_lightgbm`.
|
|
711
|
+
|
|
712
|
+
Refer to the Teradata Python Package User Guide for more details of this feature, arguments, usage, examples and supportability in Vantage.
|
|
713
|
+
|
|
714
|
+
* ###### teradataml: Functions
|
|
715
|
+
* `register()` - Registers a user defined function (UDF).
|
|
716
|
+
* `call_udf()` - Calls a registered user defined function (UDF) and returns ColumnExpression.
|
|
717
|
+
* `list_udfs()` - List all the UDFs registered using 'register()' function.
|
|
718
|
+
* `deregister()` - Deregisters a user defined function (UDF).
|
|
719
|
+
|
|
720
|
+
* ###### teradataml: Options
|
|
721
|
+
* Configuration Options
|
|
722
|
+
* `table_operator` - Specifies the name of table operator.
|
|
723
|
+
|
|
724
|
+
* ##### Updates
|
|
725
|
+
* ###### General functions
|
|
726
|
+
* `set_auth_token()` - Added `base_url` parameter which accepts the CCP url.
|
|
727
|
+
'ues_url' will be deprecated in future and users
|
|
728
|
+
will need to specify 'base_url' instead.
|
|
729
|
+
|
|
730
|
+
* ###### teradataml: DataFrame function
|
|
731
|
+
* `join()`
|
|
732
|
+
* Now supports compound ColumnExpression having more than one binary operator in `on` argument.
|
|
733
|
+
* Now supports ColumnExpression containing FunctionExpression(s) in `on` argument.
|
|
734
|
+
* self-join now expects aliased DataFrame in `other` argument.
|
|
735
|
+
|
|
736
|
+
* ###### teradataml: GeoDataFrame function
|
|
737
|
+
* `join()`
|
|
738
|
+
* Now supports compound ColumnExpression having more than one binary operator in `on` argument.
|
|
739
|
+
* Now supports ColumnExpression containing FunctionExpression(s) in `on` argument.
|
|
740
|
+
* self-join now expects aliased DataFrame in `other` argument.
|
|
741
|
+
|
|
742
|
+
* ###### teradataml: Unbounded Array Framework (UAF) Functions
|
|
743
|
+
* `SAX()` - Default value added for `window_size` and `output_frequency`.
|
|
744
|
+
* `DickeyFuller()`
|
|
745
|
+
* Supports TDAnalyticResult as input.
|
|
746
|
+
* Default value added for `max_lags`.
|
|
747
|
+
* Removed parameter `drift_trend_formula`.
|
|
748
|
+
* Updated permitted values for `algorithm`.
|
|
749
|
+
|
|
750
|
+
* ##### teradataml: AutoML
|
|
751
|
+
* `AutoML`, `AutoRegressor` and `AutoClassifier`
|
|
752
|
+
* Now supports DECIMAL datatype as input.
|
|
753
|
+
|
|
754
|
+
* ##### teradataml: SQLE Engine Analytic Functions
|
|
755
|
+
* `TextParser()`
|
|
756
|
+
* Argument name `covert_to_lowercase` changed to `convert_to_lowercase`.
|
|
757
|
+
|
|
758
|
+
* ##### Bug Fixes
|
|
759
|
+
* `db_list_tables()` now returns correct results when '%' is used.
|
|
760
|
+
|
|
761
|
+
#### teradataml 20.00.00.02
|
|
762
|
+
|
|
763
|
+
* teradataml will no longer be supported with SQLAlchemy < 2.0.
|
|
764
|
+
* teradataml no longer shows the warnings from Vantage by default.
|
|
765
|
+
* Users should set `display.suppress_vantage_runtime_warnings` to `False` to display warnings.
|
|
766
|
+
|
|
767
|
+
* ##### New Features/Functionality
|
|
768
|
+
* ##### teradataml: SQLE Engine Analytic Functions
|
|
769
|
+
* New Analytics Database Analytic Functions:
|
|
770
|
+
* `TFIDF()`
|
|
771
|
+
* `Pivoting()`
|
|
772
|
+
* `UnPivoting()`
|
|
773
|
+
* New Unbounded Array Framework(UAF) Functions:
|
|
774
|
+
* `AutoArima()`
|
|
775
|
+
* `DWT()`
|
|
776
|
+
* `DWT2D()`
|
|
777
|
+
* `FilterFactory1d()`
|
|
778
|
+
* `IDWT()`
|
|
779
|
+
* `IDWT2D()`
|
|
780
|
+
* `IQR()`
|
|
781
|
+
* `Matrix2Image()`
|
|
782
|
+
* `SAX()`
|
|
783
|
+
* `WindowDFFT()`
|
|
784
|
+
* ###### teradataml: Functions
|
|
785
|
+
* `udf()` - Creates a user defined function (UDF) and returns ColumnExpression.
|
|
786
|
+
* `set_session_param()` is added to set the database session parameters.
|
|
787
|
+
* `unset_session_param()` is added to unset database session parameters.
|
|
788
|
+
|
|
789
|
+
* ###### teradataml: DataFrame
|
|
790
|
+
* `materialize()` - Persists DataFrame into database for current session.
|
|
791
|
+
* `create_temp_view()` - Creates a temporary view for session on the DataFrame.
|
|
792
|
+
|
|
793
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
794
|
+
* _Date Time Functions_
|
|
795
|
+
* `DataFrameColumn.to_timestamp()` - Converts string or integer value to a TIMESTAMP data type or TIMESTAMP WITH TIME ZONE data type.
|
|
796
|
+
* `DataFrameColumn.extract()` - Extracts date component to a numeric value.
|
|
797
|
+
* `DataFrameColumn.to_interval()` - Converts a numeric value or string value into an INTERVAL_DAY_TO_SECOND or INTERVAL_YEAR_TO_MONTH value.
|
|
798
|
+
* _String Functions_
|
|
799
|
+
* `DataFrameColumn.parse_url()` - Extracts a part from a URL.
|
|
800
|
+
* _Arithmetic Functions_
|
|
801
|
+
* `DataFrameColumn.log` - Returns the logarithm value of the column with respect to 'base'.
|
|
802
|
+
|
|
803
|
+
* ##### teradataml: AutoML
|
|
804
|
+
* New methods added for `AutoML()`, `AutoRegressor()` and `AutoClassifier()`:
|
|
805
|
+
* `evaluate()` - Performs evaluation on the data using the best model or the model of user's choice
|
|
806
|
+
from the leaderboard.
|
|
807
|
+
* `load()`: Loads the saved model from database.
|
|
808
|
+
* `deploy()`: Saves the trained model inside database.
|
|
809
|
+
* `remove_saved_model()`: Removes the saved model in database.
|
|
810
|
+
* `model_hyperparameters()`: Returns the hyperparameter of fitted or loaded models.
|
|
811
|
+
|
|
812
|
+
* ##### Updates
|
|
813
|
+
* ##### teradataml: AutoML
|
|
814
|
+
* `AutoML()`, `AutoRegressor()`
|
|
815
|
+
* New performance metrics added for task type regression i.e., "MAPE", "MPE", "ME", "EV", "MPD" and "MGD".
|
|
816
|
+
* `AutoML()`, `AutoRegressor()` and `AutoClassifier`
|
|
817
|
+
* New arguments added: `volatile`, `persist`.
|
|
818
|
+
* `predict()` - Data input is now mandatory for generating predictions. Default model
|
|
819
|
+
evaluation is now removed.
|
|
820
|
+
* `DataFrameColumn.cast()`: Accepts 2 new arguments `format` and `timezone`.
|
|
821
|
+
* `DataFrame.assign()`: Accepts ColumnExpressions returned by `udf()`.
|
|
822
|
+
|
|
823
|
+
* ##### teradataml: Options
|
|
824
|
+
* `set_config_params()`
|
|
825
|
+
* Following arguments will be deprecated in the future:
|
|
826
|
+
* `ues_url`
|
|
827
|
+
* `auth_token`
|
|
828
|
+
|
|
829
|
+
* #### teradata DataFrame
|
|
830
|
+
* `to_pandas()` - Function returns the pandas dataframe with Decimal columns types as float instead of object.
|
|
831
|
+
If the user wants the datatype to be object, set argument `coerce_float` to False.
|
|
832
|
+
|
|
833
|
+
* ###### Database Utility
|
|
834
|
+
* `list_td_reserved_keywords()` - Accepts a list of strings as argument.
|
|
835
|
+
|
|
836
|
+
* ##### Updates to existing UAF Functions:
|
|
837
|
+
* `ACF()` - `round_results` parameter removed as it was used for internal testing.
|
|
838
|
+
* `BreuschGodfrey()` - Added default_value 0.05 for parameter `significance_level`.
|
|
839
|
+
* `GoldfeldQuandt()` -
|
|
840
|
+
* Removed parameters `weights` and `formula`.
|
|
841
|
+
Replaced parameter `orig_regr_paramcnt` with `const_term`.
|
|
842
|
+
Changed description for parameter `algorithm`. Please refer document for more details.
|
|
843
|
+
* Note: This will break backward compatibility.
|
|
844
|
+
* `HoltWintersForecaster()` - Default value of parameter `seasonal_periods` removed.
|
|
845
|
+
* `IDFFT2()` - Removed parameter `output_fmt_row_major` as it is used for internal testing.
|
|
846
|
+
* `Resample()` - Added parameter `output_fmt_index_style`.
|
|
847
|
+
|
|
848
|
+
* ##### Bug Fixes
|
|
849
|
+
* KNN `predict()` function can now predict on test data which does not contain target column.
|
|
850
|
+
* Metrics functions are supported on the Lake system.
|
|
851
|
+
* The following OpensourceML functions from different sklearn modules in single model case are fixed.
|
|
852
|
+
* `sklearn.ensemble`:
|
|
853
|
+
* ExtraTreesClassifier - `apply()`
|
|
854
|
+
* ExtraTreesRegressor - `apply()`
|
|
855
|
+
* RandomForestClassifier - `apply()`
|
|
856
|
+
* RandomForestRegressor - `apply()`
|
|
857
|
+
* `sklearn.impute`:
|
|
858
|
+
* SimpleImputer - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
859
|
+
* MissingIndicator - `transform()`, `fit_transform()`
|
|
860
|
+
* `sklearn.kernel_approximations`:
|
|
861
|
+
* Nystroem - `transform()`, `fit_transform()`
|
|
862
|
+
* PolynomialCountSketch - `transform()`, `fit_transform()`
|
|
863
|
+
* RBFSampler - `transform()`, `fit_transform()`
|
|
864
|
+
* `sklearn.neighbors`:
|
|
865
|
+
* KNeighborsTransformer - `transform()`, `fit_transform()`
|
|
866
|
+
* RadiusNeighborsTransformer - `transform()`, `fit_transform()`
|
|
867
|
+
* `sklearn.preprocessing`:
|
|
868
|
+
* KernelCenterer - `transform()`
|
|
869
|
+
* OneHotEncoder - `transform()`, `inverse_transform()`
|
|
870
|
+
* The following OpensourceML functions from different sklearn modules in multi model case are fixed.
|
|
871
|
+
* `sklearn.feature_selection`:
|
|
872
|
+
* SelectFpr - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
873
|
+
* SelectFdr - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
874
|
+
* SelectFromModel - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
875
|
+
* SelectFwe - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
876
|
+
* RFECV - `transform()`, `fit_transform()`, `inverse_transform()`
|
|
877
|
+
* `sklearn.clustering`:
|
|
878
|
+
* Birch - `transform()`, `fit_transform()`
|
|
879
|
+
* OpensourceML returns teradataml objects for model attributes and functions instead of sklearn
|
|
880
|
+
objects so that the user can perform further operations like `score()`, `predict()` etc on top
|
|
881
|
+
of the returned objects.
|
|
882
|
+
* AutoML `predict()` function now generates correct ROC-AUC value for positive class.
|
|
883
|
+
* `deploy()` method of `Script` and `Apply` classes retries model deployment if there are any
|
|
884
|
+
intermittent network issues.
|
|
885
|
+
|
|
886
|
+
#### teradataml 20.00.00.01
|
|
887
|
+
* teradataml no longer supports Python versions less than 3.8.
|
|
888
|
+
|
|
889
|
+
* ##### New Features/Functionality
|
|
890
|
+
* ##### Personal Access Token (PAT) support in teradataml
|
|
891
|
+
* `set_auth_token()` - teradataml now supports authentication via PAT in addition to
|
|
892
|
+
OAuth 2.0 Device Authorization Grant (formerly known as the Device Flow).
|
|
893
|
+
* It accepts UES URL, Personal Access Token (PAT) and Private Key file generated from VantageCloud Lake Console
|
|
894
|
+
and optional argument `username` and `expiration_time` in seconds.
|
|
895
|
+
|
|
896
|
+
* ##### Updates
|
|
897
|
+
* ##### teradataml: SQLE Engine Analytic Functions
|
|
898
|
+
* `ANOVA()`
|
|
899
|
+
* New arguments added: `group_name_column`, `group_value_name`, `group_names`, `num_groups` for data containing group values and group names.
|
|
900
|
+
* `FTest()`
|
|
901
|
+
* New arguments added: `sample_name_column`, `sample_name_value`, `first_sample_name`, `second_sample_name`.
|
|
902
|
+
* `GLM()`
|
|
903
|
+
* Supports stepwise regression and accepts new arguments `stepwise_direction`, `max_steps_num` and `initial_stepwise_columns`.
|
|
904
|
+
* New arguments added: `attribute_data`, `parameter_data`, `iteration_mode` and `partition_column`.
|
|
905
|
+
* `GetFutileColumns()`
|
|
906
|
+
* Arguments `category_summary_column` and `threshold_value` are now optional.
|
|
907
|
+
* `KMeans()`
|
|
908
|
+
* New argument added: `initialcentroids_method`.
|
|
909
|
+
* `NonLinearCombineFit()`
|
|
910
|
+
* Argument `result_column` is now optional.
|
|
911
|
+
* `ROC()`
|
|
912
|
+
* Argument `positive_class` is now optional.
|
|
913
|
+
* `SVMPredict()`
|
|
914
|
+
* New argument added: `model_type`.
|
|
915
|
+
* `ScaleFit()`
|
|
916
|
+
* New arguments added: `ignoreinvalid_locationscale`, `unused_attributes`, `attribute_name_column`, `attribute_value_column`.
|
|
917
|
+
* Arguments `attribute_name_column`, `attribute_value_column` and `target_attributes` are supported for sparse input.
|
|
918
|
+
* Arguments `attribute_data`, `parameter_data` and `partition_column` are supported for partitioning.
|
|
919
|
+
* `ScaleTransform()`
|
|
920
|
+
* New arguments added: `attribute_name_column` and `attribute_value_column` support for sparse input.
|
|
921
|
+
* `TDGLMPredict()`
|
|
922
|
+
* New arguments added: `family` and `partition_column`.
|
|
923
|
+
* `XGBoost()`
|
|
924
|
+
* New argument `base_score` is added for initial prediction value for all data points.
|
|
925
|
+
* `XGBoostPredict()`
|
|
926
|
+
* New argument `detailed` is added for detailed information of each prediction.
|
|
927
|
+
* `ZTest()`
|
|
928
|
+
* New arguments added: `sample_name_column`, `sample_value_column`, `first_sample_name` and `second_sample_name`.
|
|
929
|
+
* ##### teradataml: AutoML
|
|
930
|
+
* `AutoML()`, `AutoRegressor()` and `AutoClassifier()`
|
|
931
|
+
* New argument `max_models` is added as an early stopping criterion to limit the maximum number of models to be trained.
|
|
932
|
+
* ##### teradataml: DataFrame functions
|
|
933
|
+
* `DataFrame.agg()`
|
|
934
|
+
* Accepts ColumnExpressions and list of ColumnExpressions as arguments.
|
|
935
|
+
* ##### teradataml: General Functions
|
|
936
|
+
* Data Transfer Utility
|
|
937
|
+
* `fastload()` - Improved error and warning table handling with below-mentioned new arguments.
|
|
938
|
+
* `err_staging_db`
|
|
939
|
+
* `err_tbl_name`
|
|
940
|
+
* `warn_tbl_name`
|
|
941
|
+
* `err_tbl_1_suffix`
|
|
942
|
+
* `err_tbl_2_suffix`
|
|
943
|
+
* `fastload()` - Change in behaviour of `save_errors` argument.
|
|
944
|
+
When `save_errors` is set to `True`, error information will be available in two persistent tables `ERR_1` and `ERR_2`.
|
|
945
|
+
When `save_errors` is set to `False`, error information will be available in single pandas dataframe.
|
|
946
|
+
* Garbage collector location is now configurable.
|
|
947
|
+
User can set configure.local_storage to a desired location.
|
|
948
|
+
|
|
949
|
+
* ##### Bug Fixes
|
|
950
|
+
* UAF functions now work if the database name has special characters.
|
|
951
|
+
* OpensourceML can now read and process NULL/nan values.
|
|
952
|
+
* Boolean values output will now be returned as VARBYTE column with 0 or 1 values in OpensourceML.
|
|
953
|
+
* Fixed bug for `Apply`'s `deploy()`.
|
|
954
|
+
* Issue with volatile table creation is fixed where it is created in the right database, i.e., user's spool space, regardless of the temp database specified.
|
|
955
|
+
* `ColumnTransformer` function now processes its arguments in the order they are passed.
|
|
956
|
+
|
|
957
|
+
#### teradataml 20.00.00.00
|
|
958
|
+
* ##### New Features/Functionality
|
|
959
|
+
* ###### teradataml OpenML: Run Opensource packages through Teradata Vantage
|
|
960
|
+
`OpenML` dynamically exposes opensource packages through Teradata Vantage. `OpenML` provides an
|
|
961
|
+
interface object through which exposed classes and functions of opensource packages can be accessed
|
|
962
|
+
with the same syntax and arguments.
|
|
963
|
+
The following functionality is added in the current release:
|
|
964
|
+
* `td_sklearn` - Interface object to run scikit-learn functions and classes through Teradata Vantage.
|
|
965
|
+
Example usage below:
|
|
966
|
+
```
|
|
967
|
+
from teradataml import td_sklearn, DataFrame
|
|
968
|
+
|
|
969
|
+
df_train = DataFrame("multi_model_classification")
|
|
970
|
+
|
|
971
|
+
feature_columns = ["col1", "col2", "col3", "col4"]
|
|
972
|
+
label_columns = ["label"]
|
|
973
|
+
part_columns = ["partition_column_1", "partition_column_2"]
|
|
974
|
+
|
|
975
|
+
linear_svc = td_sklearn.LinearSVC()
|
|
976
|
+
```
|
|
977
|
+
* `OpenML` is supported in both Teradata Vantage Enterprise and Teradata Vantage Lake.
|
|
978
|
+
* Argument Support:
|
|
979
|
+
* `Use of X and y arguments` - Scikit-learn users are familiar with using `X` and `y` as argument names
|
|
980
|
+
which take data as pandas DataFrames, numpy arrays or lists etc. However, in OpenML, we pass
|
|
981
|
+
teradataml DataFrames for arguments `X` and `y`.
|
|
982
|
+
```
|
|
983
|
+
df_x = df_train.select(feature_columns)
|
|
984
|
+
df_y = df_train.select(label_columns)
|
|
985
|
+
|
|
986
|
+
linear_svc = linear_svc.fit(X=df_x, y=df_y)
|
|
987
|
+
```
|
|
988
|
+
* `Additional support for data, feature_columns, label_columns and group_columns arguments` -
|
|
989
|
+
Apart from traditional arguments, OpenML supports additional arguments - `data`,
|
|
990
|
+
`feature_columns`, `label_columns` and `group_columns`. These are used as alternatives to `X`, `y`
|
|
991
|
+
and `groups`.
|
|
992
|
+
```
|
|
993
|
+
linear_svc = linear_svc.fit(data=df_train, feature_columns=feature_columns, label_columns=label_columns)
|
|
994
|
+
```
|
|
995
|
+
* `Support for classification and regression metrics` - Metrics functions for classification and
|
|
996
|
+
regression in `sklearn.metrics` module are supported. Other metrics functions' support will be added
|
|
997
|
+
in future releases.
|
|
998
|
+
* `Distributed Modeling and partition_columns argument support` - Existing scikit-learn supports
|
|
999
|
+
only single model generation. However, OpenML supports both single model use case and distributed
|
|
1000
|
+
(multi) model use case. For this, user has to additionally pass `partition_columns` argument to
|
|
1001
|
+
existing `fit()`, `predict()` or any other function to be run. This will generate multiple models
|
|
1002
|
+
for multiple partitions, using the data in corresponding partition.
|
|
1003
|
+
```
|
|
1004
|
+
df_x_1 = df_train.select(feature_columns + part_columns)
|
|
1005
|
+
linear_svc = linear_svc.fit(X=df_x_1, y=df_y, partition_columns=part_columns)
|
|
1006
|
+
```
|
|
1007
|
+
* `Support for load and deploy models` - OpenML provides additional support for saving (deploying) the
|
|
1008
|
+
trained models. These models can be loaded later to perform operations like prediction, score etc. The
|
|
1009
|
+
following functions are provided by OpenML:
|
|
1010
|
+
* `<obj>.deploy()` - Used to deploy/save the model created and/or trained by OpenML.
|
|
1011
|
+
* `td_sklearn.deploy()` - Used to deploy/save the model created and/or trained outside teradataml.
|
|
1012
|
+
* `td_sklearn.load()` - Used to load the saved models.
|
|
1013
|
+
|
|
1014
|
+
<br>Refer to the Teradata Python Package User Guide for more details of this feature, arguments, usage, examples and supportability in both VantageCloud Enterprise and VantageCloud Lake.
|
|
1015
|
+
|
|
1016
|
+
* ###### teradataml: AutoML - Automated end to end Machine Learning flow.
|
|
1017
|
+
AutoML is an approach to automate the process of building, training, and validating machine learning models.
|
|
1018
|
+
It involves automation of various aspects of the machine learning workflow, such as feature exploration,
|
|
1019
|
+
feature engineering, data preparation, model training and evaluation for given dataset.
|
|
1020
|
+
teradataml AutoML feature offers best model identification, model leaderboard generation, parallel execution,
|
|
1021
|
+
early stopping feature, model evaluation, model prediction, live logging, customization on default process.
|
|
1022
|
+
* `AutoML`
|
|
1023
|
+
AutoML is a generic algorithm that supports all three tasks, i.e. 'Regression',
|
|
1024
|
+
'Binary Classification' and 'Multiclass Classification'.
|
|
1025
|
+
* Methods of AutoML
|
|
1026
|
+
* `__init__()` - Instantiate an object of AutoML with given parameters.
|
|
1027
|
+
* `fit()` - Perform fit on specified data and target column.
|
|
1028
|
+
* `leaderboard()` - Get the leaderboard for the AutoML. Presents diverse models, feature
|
|
1029
|
+
selection method, and performance metrics.
|
|
1030
|
+
* `leader()` - Show best performing model and its details such as feature
|
|
1031
|
+
selection method, and performance metrics.
|
|
1032
|
+
* `predict()` - Perform prediction on the data using the best model or the model of user's
|
|
1033
|
+
choice from the leaderboard.
|
|
1034
|
+
* `generate_custom_config()` - Generate custom config JSON file required for customized
|
|
1035
|
+
run of AutoML.
|
|
1036
|
+
* `AutoRegressor`
|
|
1037
|
+
AutoRegressor is a special purpose AutoML feature to run regression specific tasks.
|
|
1038
|
+
* Methods of AutoRegressor
|
|
1039
|
+
* `__init__()` - Instantiate an object of AutoRegressor with given parameters.
|
|
1040
|
+
* `fit()` - Perform fit on specified data and target column.
|
|
1041
|
+
* `leaderboard()` - Get the leaderboard for the AutoRegressor. Presents diverse models, feature
|
|
1042
|
+
selection method, and performance metrics.
|
|
1043
|
+
* `leader()` - Show best performing model and its details such as feature
|
|
1044
|
+
selection method, and performance metrics.
|
|
1045
|
+
* `predict()` - Perform prediction on the data using the best model or the model of user's
|
|
1046
|
+
choice from the leaderboard.
|
|
1047
|
+
* `generate_custom_config()` - Generate custom config JSON file required for customized
|
|
1048
|
+
run of AutoRegressor.
|
|
1049
|
+
* `AutoClassifier`
|
|
1050
|
+
AutoClassifier is a special purpose AutoML feature to run classification specific tasks.
|
|
1051
|
+
* Methods of AutoClassifier
|
|
1052
|
+
* `__init__()` - Instantiate an object of AutoClassifier with given parameters.
|
|
1053
|
+
* `fit()` - Perform fit on specified data and target column.
|
|
1054
|
+
* `leaderboard()` - Get the leaderboard for the AutoClassifier. Presents diverse models, feature
|
|
1055
|
+
selection method, and performance metrics.
|
|
1056
|
+
* `leader()` - Show best performing model and its details such as feature
|
|
1057
|
+
selection method, and performance metrics.
|
|
1058
|
+
* `predict()` - Perform prediction on the data using the best model or the model of user's
|
|
1059
|
+
choice from the leaderboard.
|
|
1060
|
+
* `generate_custom_config()` - Generate custom config JSON file required for customized
|
|
1061
|
+
run of AutoClassifier.
|
|
1062
|
+
|
|
1063
|
+
* ###### teradataml: DataFrame
|
|
1064
|
+
* `fillna` - Replace the null values in a column with the value specified.
|
|
1065
|
+
* Data Manipulation
|
|
1066
|
+
* `cube()` - Analyzes data by grouping it into multiple dimensions.
|
|
1067
|
+
* `rollup()` - Analyzes a set of data across a single dimension with more than one level of detail.
|
|
1068
|
+
* `replace()` - Replaces the values for columns.
|
|
1069
|
+
|
|
1070
|
+
* ###### teradataml: Script and Apply
|
|
1071
|
+
* `deploy()` - Function deploys the model, generated after `execute_script()`, in database or user
|
|
1072
|
+
environment in lake. The function is available in both Script and Apply.
|
|
1073
|
+
|
|
1074
|
+
* ###### teradataml: DataFrameColumn
|
|
1075
|
+
* `fillna` - Replaces every occurrence of null value in column with the value specified.
|
|
1076
|
+
|
|
1077
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
1078
|
+
* _Date Time Functions_
|
|
1079
|
+
* `DataFrameColumn.week_start()` - Returns the first date or timestamp of the week that begins immediately before the specified date or timestamp value in a column as a literal.
|
|
1080
|
+
* `DataFrameColumn.week_begin()` - It is an alias for `DataFrameColumn.week_start()` function.
|
|
1081
|
+
* `DataFrameColumn.week_end()` - Returns the last date or timestamp of the week that ends immediately after the specified date or timestamp value in a column as a literal.
|
|
1082
|
+
* `DataFrameColumn.month_start()` - Returns the first date or timestamp of the month that begins immediately before the specified date or timestamp value in a column or as a literal.
|
|
1083
|
+
* `DataFrameColumn.month_begin()` - It is an alias for `DataFrameColumn.month_start()` function.
|
|
1084
|
+
* `DataFrameColumn.month_end()` - Returns the last date or timestamp of the month that ends immediately after the specified date or timestamp value in a column or as a literal.
|
|
1085
|
+
* `DataFrameColumn.year_start()` - Returns the first date or timestamp of the year that begins immediately before the specified date or timestamp value in a column or as a literal.
|
|
1086
|
+
* `DataFrameColumn.year_begin()` - It is an alias for `DataFrameColumn.year_start()` function.
|
|
1087
|
+
* `DataFrameColumn.year_end()` - Returns the last date or timestamp of the year that ends immediately after the specified date or timestamp value in a column or as a literal.
|
|
1088
|
+
* `DataFrameColumn.quarter_start()` - Returns the first date or timestamp of the quarter that begins immediately before the specified date or timestamp value in a column as a literal.
|
|
1089
|
+
* `DataFrameColumn.quarter_begin()` - It is an alias for `DataFrameColumn.quarter_start()` function.
|
|
1090
|
+
* `DataFrameColumn.quarter_end()` - Returns the last date or timestamp of the quarter that ends immediately after the specified date or timestamp value in a column as a literal.
|
|
1091
|
+
* `DataFrameColumn.last_sunday()` - Returns the date or timestamp of Sunday that falls immediately before the specified date or timestamp value in a column as a literal.
|
|
1092
|
+
* `DataFrameColumn.last_monday()` - Returns the date or timestamp of Monday that falls immediately before the specified date or timestamp value in a column as a literal.
|
|
1093
|
+
* `DataFrameColumn.last_tuesday()` - Returns the date or timestamp of Tuesday that falls immediately before the specified date or timestamp value in a column as a literal.
|
|
1094
|
+
* `DataFrameColumn.last_wednesday()` - Returns the date or timestamp of Wednesday that falls immediately before specified date or timestamp value in a column as a literal.
|
|
1095
|
+
* `DataFrameColumn.last_thursday()` - Returns the date or timestamp of Thursday that falls immediately before the specified date or timestamp value in a column as a literal.
|
|
1096
|
+
* `DataFrameColumn.last_friday()` - Returns the date or timestamp of Friday that falls immediately before specified date or timestamp value in a column as a literal.
|
|
1097
|
+
* `DataFrameColumn.last_saturday()` - Returns the date or timestamp of Saturday that falls immediately before specified date or timestamp value in a column as a literal.
|
|
1098
|
+
* `DataFrameColumn.day_of_week()` - Returns the number of days from the beginning of the week to the specified date or timestamp value in a column as a literal.
|
|
1099
|
+
* `DataFrameColumn.day_of_month()` - Returns the number of days from the beginning of the month to the specified date or timestamp value in a column as a literal.
|
|
1100
|
+
* `DataFrameColumn.day_of_year()` - Returns the number of days from the beginning of the year to the specified date or timestamp value in a column as a literal.
|
|
1101
|
+
* `DataFrameColumn.day_of_calendar()` - Returns the number of days from the beginning of the business calendar to the specified date or timestamp value in a column as a literal.
|
|
1102
|
+
* `DataFrameColumn.week_of_month()` - Returns the number of weeks from the beginning of the month to the specified date or timestamp value in a column as a literal.
|
|
1103
|
+
* `DataFrameColumn.week_of_quarter()` - Returns the number of weeks from the beginning of the quarter to the specified date or timestamp value in a column as a literal.
|
|
1104
|
+
* `DataFrameColumn.week_of_year()` - Returns the number of weeks from the beginning of the year to the specified date or timestamp value in a column as a literal.
|
|
1105
|
+
* `DataFrameColumn.week_of_calendar()` - Returns the number of weeks from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
|
|
1106
|
+
* `DataFrameColumn.month_of_year()` - Returns the number of months from the beginning of the year to the specified date or timestamp value in a column as a literal.
|
|
1107
|
+
* `DataFrameColumn.month_of_calendar()` - Returns the number of months from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
|
|
1108
|
+
* `DataFrameColumn.month_of_quarter()` - Returns the number of months from the beginning of the quarter to the specified date or timestamp value in a column as a literal.
|
|
1109
|
+
* `DataFrameColumn.quarter_of_year()` - Returns the number of quarters from the beginning of the year to the specified date or timestamp value in a column as a literal.
|
|
1110
|
+
* `DataFrameColumn.quarter_of_calendar()` - Returns the number of quarters from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
|
|
1111
|
+
* `DataFrameColumn.year_of_calendar()` - Returns the year of the specified date or timestamp value in a column as a literal.
|
|
1112
|
+
* `DataFrameColumn.day_occurrence_of_month()` - Returns the nth occurrence of the weekday in the month for the specified date or timestamp value in a column as a literal.
|
|
1113
|
+
* `DataFrameColumn.year()` - Returns the integer value for year in the specified date or timestamp value in a column as a literal.
|
|
1114
|
+
* `DataFrameColumn.month()` - Returns the integer value for month in the specified date or timestamp value in a column as a literal.
|
|
1115
|
+
* `DataFrameColumn.hour()` - Returns the integer value for hour in the specified timestamp value in a column as a literal.
|
|
1116
|
+
* `DataFrameColumn.minute()` - Returns the integer value for minute in the specified timestamp value in a column as a literal.
|
|
1117
|
+
* `DataFrameColumn.second()` - Returns the integer value for seconds in the specified timestamp value in a column as a literal.
|
|
1118
|
+
* `DataFrameColumn.week()` - Returns the number of weeks from the beginning of the year to the specified date or timestamp value in a column as a literal.
|
|
1119
|
+
* `DataFrameColumn.next_day()` - Returns the date of the first weekday specified as 'day_value' that is later than the specified date or timestamp value in a column as a literal.
|
|
1120
|
+
* `DataFrameColumn.months_between()` - Returns the number of months between value in specified date or timestamp value in a column as a literal and date or timestamp value in argument.
|
|
1121
|
+
* `DataFrameColumn.add_months()` - Adds an integer number of months to specified date or timestamp value in a column as a literal.
|
|
1122
|
+
* `DataFrameColumn.oadd_months()` - Adds an integer number of months, date or timestamp value in specified date or timestamp value in a column as a literal.
|
|
1123
|
+
* `DataFrameColumn.to_date()` - Function converts a string-like representation of a DATE or PERIOD type to Date type.
|
|
1124
|
+
* _String Functions_
|
|
1125
|
+
* `DataFrameColumn.concat()` - Function to concatenate the columns with a separator.
|
|
1126
|
+
* `DataFrameColumn.like()` - Function to match the string pattern. String match is case sensitive.
|
|
1127
|
+
* `DataFrameColumn.ilike()` - Function to match the string pattern. String match is not case sensitive.
|
|
1128
|
+
* `DataFrameColumn.substr()` - Returns the substring from a string column.
|
|
1129
|
+
* `DataFrameColumn.startswith()` - Function to check if the column value starts with the specified value or not.
|
|
1130
|
+
* `DataFrameColumn.endswith()` - Function to check if the column value ends with the specified value or not.
|
|
1131
|
+
* `DataFrameColumn.format()` - Function to format the values in column based on formatter.
|
|
1132
|
+
* `DataFrameColumn.to_char()` - Function converts numeric type or datetype to character type.
|
|
1133
|
+
* `DataFrameColumn.trim()` - Function trims the string values in the column.
|
|
1134
|
+
* _Regular Arithmetic Functions_
|
|
1135
|
+
* `DataFrameColumn.cbrt()` - Computes the cube root of values in the column.
|
|
1136
|
+
* `DataFrameColumn.hex()` - Computes the Hexadecimal from decimal for the values in the column.
|
|
1137
|
+
* `DataFrameColumn.hypot()` - Computes the hypotenuse for the values between two columns.
|
|
1138
|
+
* `DataFrameColumn.unhex()` - Computes the decimal from Hexadecimal for the values in the column.
|
|
1139
|
+
* _Bit Byte Manipulation Functions_
|
|
1140
|
+
* `DataFrameColumn.from_byte()` - Encodes a sequence of bits into a sequence of characters.
|
|
1141
|
+
* _Comparison Functions_
|
|
1142
|
+
* `DataFrameColumn.greatest()` - Returns the greatest values from columns.
|
|
1143
|
+
* `DataFrameColumn.least()` - Returns the least values from columns.
|
|
1144
|
+
* Behaviour of `DataFrameColumn.replace()` is changed.
|
|
1145
|
+
* Behaviour of `DataFrameColumn.to_byte()` is changed. It now decodes a sequence of characters in a given encoding into a sequence of bits.
|
|
1146
|
+
* Behaviour of `DataFrameColumn.trunc()` is changed. It now accepts Date type columns.
|
|
1147
|
+
|
|
1148
|
+
* ##### Bug Fixes
|
|
1149
|
+
* Argument `url_encode` is no longer used in `create_context()` and is deprecated.
|
|
1150
|
+
* **Important notes**
|
|
1151
|
+
* Users do not need to encode the password even if the password contains special characters.
|
|
1152
|
+
* Pass the password to the `create_context()` function argument `password` as it is without changing special characters.
|
|
1153
|
+
* `fillna()` in VAL transformation now allows replacing NULL values with an empty string.
|
|
1154
|
+
|
|
1155
|
+
* ##### Updates
|
|
1156
|
+
* Support for following deprecated functionality is removed:
|
|
1157
|
+
* ML Engine functions
|
|
1158
|
+
* STO and APPLY sandbox feature support for testing the script.
|
|
1159
|
+
* sandbox_container_utils is removed. Following methods can no longer be used:
|
|
1160
|
+
* `setup_sandbox_env()`
|
|
1161
|
+
* `copy_files_from_container()`
|
|
1162
|
+
* `cleanup_sandbox_env()`
|
|
1163
|
+
* Model Cataloging APIs can no longer be used:
|
|
1164
|
+
* `describe_model()`
|
|
1165
|
+
* `delete_model()`
|
|
1166
|
+
* `list_models()`
|
|
1167
|
+
* `publish_model()`
|
|
1168
|
+
* `retrieve_model()`
|
|
1169
|
+
* `save_model()`
|
|
1170
|
+
* `DataFrame.join()`
|
|
1171
|
+
* Arguments `lsuffix` and `rsuffix` now add suffixes to new column names for join operation.
|
|
1172
|
+
* `DataFrame.describe()`
|
|
1173
|
+
* New argument `columns` is added to generate statistics on only those columns instead of all applicable columns.
|
|
1174
|
+
* `DataFrame.groupby()`
|
|
1175
|
+
* Supports `CUBE` and `ROLLUP` with additional optional argument `option`.
|
|
1176
|
+
* `DataFrame.column.window()`
|
|
1177
|
+
* Supports ColumnExpressions for `partition_columns` and `order_columns` arguments.
|
|
1178
|
+
* `DataFrame.column.contains()` allows ColumnExpressions for `pattern` argument.
|
|
1179
|
+
* `DataFrame.window()`
|
|
1180
|
+
* Supports ColumnExpressions for `partition_columns` and `order_columns` arguments.
|
|
1181
|
+
|
|
1182
|
+
#### teradataml 17.20.00.07
|
|
1183
|
+
* ##### New Features/Functionality
|
|
1184
|
+
* ###### Open Analytics Framework (OpenAF) APIs:
|
|
1185
|
+
* Manage all user environments.
|
|
1186
|
+
* `create_env()`:
|
|
1187
|
+
* new argument `conda_env` is added to create a conda environment.
|
|
1188
|
+
* `list_user_envs()`:
|
|
1189
|
+
* User can list conda environment(s) by using filter with new argument `conda_env`.
|
|
1190
|
+
* Conda environment(s) can be managed using APIs for installing, updating, removing files/libraries.
|
|
1191
|
+
* ##### Bug Fixes
|
|
1192
|
+
* `columns` argument for `FillNa` function is made optional.
|
|
1193
|
+
|
|
1194
|
+
#### teradataml 17.20.00.06
|
|
1195
|
+
* ##### New Features/Functionality
|
|
1196
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
1197
|
+
* `ColumnExpression.nulls_first()` - Displays NULL values at first.
|
|
1198
|
+
* `ColumnExpression.nulls_last()` - Displays NULL values at last.
|
|
1199
|
+
* _Bit Byte Manipulation Functions_
|
|
1200
|
+
* `DataFrameColumn.bit_and()` - Returns the logical AND operation on the bits from
|
|
1201
|
+
the column and corresponding bits from the argument.
|
|
1202
|
+
* `DataFrameColumn.bit_get()` - Returns the bit specified by input argument from the column and
|
|
1203
|
+
returns either 0 or 1 to indicate the value of that bit.
|
|
1204
|
+
* `DataFrameColumn.bit_or()` - Returns the logical OR operation on the bits from the column and
|
|
1205
|
+
corresponding bits from the argument.
|
|
1206
|
+
* `DataFrameColumn.bit_xor()` - Returns the bitwise XOR operation on the binary representation of the
|
|
1207
|
+
column and corresponding bits from the argument.
|
|
1208
|
+
* `DataFrameColumn.bitand()` - It is an alias for `DataFrameColumn.bit_and()` function.
|
|
1209
|
+
* `DataFrameColumn.bitnot()` - Returns a bitwise complement on the binary representation of the column.
|
|
1210
|
+
* `DataFrameColumn.bitor()` - It is an alias for `DataFrameColumn.bit_or()` function.
|
|
1211
|
+
* `DataFrameColumn.bitwise_not()` - It is an alias for `DataFrameColumn.bitnot()` function.
|
|
1212
|
+
* `DataFrameColumn.bitwiseNOT()` - It is an alias for `DataFrameColumn.bitnot()` function.
|
|
1213
|
+
* `DataFrameColumn.bitxor()` - It is an alias for `DataFrameColumn.bit_xor()` function.
|
|
1214
|
+
* `DataFrameColumn.countset()` - Returns the count of the binary bits within the column that are either set to 1
|
|
1215
|
+
or set to 0, depending on the input argument value.
|
|
1216
|
+
* `DataFrameColumn.getbit()` - It is an alias for `DataFrameColumn.bit_get()` function.
|
|
1217
|
+
* `DataFrameColumn.rotateleft()` - Returns an expression rotated to the left by the specified number of bits,
|
|
1218
|
+
with the most significant bits wrapping around to the right.
|
|
1219
|
+
* `DataFrameColumn.rotateright()` - Returns an expression rotated to the right by the specified number of bits,
|
|
1220
|
+
with the least significant bits wrapping around to the left.
|
|
1221
|
+
* `DataFrameColumn.setbit()` - Sets the value of the bit specified by input argument to the value
|
|
1222
|
+
of column.
|
|
1223
|
+
* `DataFrameColumn.shiftleft()` - Returns the expression when value in column is shifted by the specified
|
|
1224
|
+
number of bits to the left.
|
|
1225
|
+
* `DataFrameColumn.shiftright()` - Returns the expression when column expression is shifted by the specified
|
|
1226
|
+
number of bits to the right.
|
|
1227
|
+
* `DataFrameColumn.subbitstr()` - Extracts a bit substring from the column expression based on the specified
|
|
1228
|
+
bit position.
|
|
1229
|
+
* `DataFrameColumn.to_byte()` - Converts a numeric data type to the Vantage byte representation
|
|
1230
|
+
(byte value) of the column expression value.
|
|
1231
|
+
|
|
1232
|
+
* _Regular Expression Functions_
|
|
1233
|
+
* `DataFrameColumn.regexp_instr()` - Searches string value in column for a match to value specified in argument.
|
|
1234
|
+
* `DataFrameColumn.regexp_replace()` - Replaces the portions of string value in a column that matches the value
|
|
1235
|
+
specified regex string and replaces with the replace string.
|
|
1236
|
+
* `DataFrameColumn.regexp_similar()` - Compares value in column to value in argument and returns integer value.
|
|
1237
|
+
* `DataFrameColumn.regexp_substr()` - Extracts a substring from column that matches a regular expression
|
|
1238
|
+
specified in the input argument.
|
|
1239
|
+
|
|
1240
|
+
* ###### Open Analytics Framework (OpenAF) APIs:
|
|
1241
|
+
* Manage all user environments.
|
|
1242
|
+
* `create_env()`:
|
|
1243
|
+
* User can create one or more user environments using the newly added argument `template` by providing specifications in a template json file. The new feature allows user to create a complete user environment, including file and library installation, in just a single function call.
|
|
1244
|
+
* UserEnv Class – Manage individual user environment.
|
|
1245
|
+
* Properties:
|
|
1246
|
+
* `models` - Supports listing of models in user environment.
|
|
1247
|
+
* Methods:
|
|
1248
|
+
* `install_model()` - Install a model in user environment.
|
|
1249
|
+
* `uninstall_model()` - Uninstall a model from user environment.
|
|
1250
|
+
* `snapshot()` - Take the snapshot of the user environment.
|
|
1251
|
+
|
|
1252
|
+
* ###### teradataml: Bring Your Own Model
|
|
1253
|
+
* _New Functions_
|
|
1254
|
+
* `DataRobotPredict()` - Score the data in Vantage using the model trained externally in datarobot and stored
|
|
1255
|
+
in Vantage.
|
|
1256
|
+
|
|
1257
|
+
* ##### Updates
|
|
1258
|
+
* `DataFrame.describe()`
|
|
1259
|
+
* Method now accepts an argument `statistics`, which specifies the aggregate operation to be performed.
|
|
1260
|
+
* `DataFrame.sort()`
|
|
1261
|
+
* Method now accepts ColumnExpressions as well.
|
|
1262
|
+
* Enables sorting using NULLS FIRST and NULLS LAST.
|
|
1263
|
+
* `view_log()` downloads the Apply query logs based on query id.
|
|
1264
|
+
* Arguments which accept floating point numbers will also accept integers for `Analytics Database Analytic Functions`.
|
|
1265
|
+
* Argument `ignore_nulls` added to `DataFrame.plot()` to ignore the null values while plotting the data.
|
|
1266
|
+
* `DataFrame.sample()`
|
|
1267
|
+
* Method supports column stratification.
|
|
1268
|
+
|
|
1269
|
+
* ##### Bug Fixes
|
|
1270
|
+
* `DataFrameColumn.cast()` accepts all teradatasqlalchemy types.
|
|
1271
|
+
* Minor bug fix related to `DataFrame.merge()`.
|
|
1272
|
+
|
|
1273
|
+
#### teradataml 17.20.00.05
|
|
1274
|
+
* ##### New Features/Functionality
|
|
1275
|
+
* ###### teradataml: Hyperparameter-Tuning - Technique to identify best model parameters.
|
|
1276
|
+
Hyperparameter tuning is an optimization method to determine the optimal set of
|
|
1277
|
+
hyperparameters for the given dataset and learning model. teradataml hyperparameter tuning feature
|
|
1278
|
+
offers best model identification, parallel execution, early stopping feature, best data identification,
|
|
1279
|
+
model evaluation, model prediction, live logging, input data hyper-parameterization, input data sampling,
|
|
1280
|
+
numerous scoring functions, hyper-parameterization for non-model trainer functions.
|
|
1281
|
+
* `GridSearch`
|
|
1282
|
+
GridSearch is an exhaustive search algorithm that covers all possible
|
|
1283
|
+
parameter values to identify optimal hyperparameters.
|
|
1284
|
+
* Methods of GridSearch
|
|
1285
|
+
* `__init__()` - Instantiate an object of GridSearch for given model function and parameters.
|
|
1286
|
+
* `evaluate()` - Function to perform evaluation on the given teradataml DataFrame using default model.
|
|
1287
|
+
* `fit()` - Function to perform hyperparameter-tuning for given hyperparameters and model on teradataml DataFrame.
|
|
1288
|
+
* `get_error_log()` - Useful to get the error log if model execution failed, using the model identifier.
|
|
1289
|
+
* `get_input_data()` - Useful to get the input data using the data identifier, when input data is also parameterized.
|
|
1290
|
+
* `get_model()` - Returns the trained model for the given model identifier.
|
|
1291
|
+
* `get_parameter_grid()` - Returns the hyperparameter space used for hyperparameter optimization.
|
|
1292
|
+
* `is_running()` - Returns the execution status of hyperparameter tuning.
|
|
1293
|
+
* `predict()` - Function to perform prediction on the given teradataml DataFrame using default model.
|
|
1294
|
+
* `set_model()` - Function to update the default model.
|
|
1295
|
+
* Properties of GridSearch
|
|
1296
|
+
* `best_data_id` - Returns the best data identifier used for model training.
|
|
1297
|
+
* `best_model` - Returns the best trained model.
|
|
1298
|
+
* `best_model_id` - Returns the identifier for best model.
|
|
1299
|
+
* `best_params_` - Returns the best set of hyperparameters.
|
|
1300
|
+
* `best_sampled_data_` - Returns the best sampled data used to train the best model.
|
|
1301
|
+
* `best_score_` - Returns the best trained model score.
|
|
1302
|
+
* `model_stats` - Returns the model evaluation reports.
|
|
1303
|
+
* `models` - Returns the metadata of all the models.
|
|
1304
|
+
* `RandomSearch`
|
|
1305
|
+
RandomSearch algorithm performs random sampling on hyperparameter
|
|
1306
|
+
space to identify optimal hyperparameters.
|
|
1307
|
+
* Methods of RandomSearch
|
|
1308
|
+
* `__init__()` - Instantiate an object of RandomSearch for given model function and parameters.
|
|
1309
|
+
* `evaluate()` - Function to perform evaluation on the given teradataml DataFrame using default model.
|
|
1310
|
+
* `fit()` - Function to perform hyperparameter-tuning for given hyperparameters and model on teradataml DataFrame.
|
|
1311
|
+
* `get_error_log()` - Useful to get the error log if model execution failed, using the model identifier.
|
|
1312
|
+
* `get_input_data()` - Useful to get the input data using the data identifier, when input data is also parameterized.
|
|
1313
|
+
* `get_model()` - Returns the trained model for the given model identifier.
|
|
1314
|
+
* `get_parameter_grid()` - Returns the hyperparameter space used for hyperparameter optimization.
|
|
1315
|
+
* `is_running()` - Returns the execution status of hyperparameter tuning.
|
|
1316
|
+
* `predict()` - Function to perform prediction on the given teradataml DataFrame using default model.
|
|
1317
|
+
* `set_model()` - Function to update the default model.
|
|
1318
|
+
* Properties of RandomSearch
|
|
1319
|
+
* `best_data_id` - Returns the best data identifier used for model training.
|
|
1320
|
+
* `best_model` - Returns the best trained model.
|
|
1321
|
+
* `best_model_id` - Returns the identifier for best model.
|
|
1322
|
+
* `best_params_` - Returns the best set of hyperparameters.
|
|
1323
|
+
* `best_sampled_data_` - Returns the best sampled data used to train the best model.
|
|
1324
|
+
* `best_score_` - Returns the best trained model score.
|
|
1325
|
+
* `model_stats` - Returns the model evaluation reports.
|
|
1326
|
+
* `models` - Returns the metadata of all the models.
|
|
1327
|
+
|
|
1328
|
+
* ###### teradataml: Analytic Functions
|
|
1329
|
+
teradataml has different functions to generate a model, predict, transform and evaluate. Previously, all these functions had to be invoked individually, i.e., predict(), evaluate(), transform() could not be invoked using the model trainer function output. This enhancement enables the user to invoke these functions as methods of the model trainer function. Below is the list of functions updated with this enhancement:
|
|
1330
|
+
* Analytics Database Analytic Functions
|
|
1331
|
+
* `BincodeFit()` - Supports `transform()` method.
|
|
1332
|
+
* `DecisionForest()` - Supports `predict()`, `evaluate()` methods.
|
|
1333
|
+
* `Fit()` - Supports `transform()` method.
|
|
1334
|
+
* `GLM()` - Supports `predict()`, `evaluate()` methods.
|
|
1335
|
+
* `GLMPerSegment()` - Supports `predict()`, `evaluate()` methods.
|
|
1336
|
+
* `KMeans()` - Supports `predict()` method.
|
|
1337
|
+
* `KNN()` - Supports `predict()`, `evaluate()` methods.
|
|
1338
|
+
* `NaiveBayesTextClassifierTrainer()` - Supports `predict()`, `evaluate()` methods.
|
|
1339
|
+
* `NonLinearCombineFit()` - Supports `transform()` method.
|
|
1340
|
+
* `OneClassSVM()` - Supports `predict()` method.
|
|
1341
|
+
* `OneHotEncodingFit()` - Supports `transform()` method.
|
|
1342
|
+
* `OrdinalEncodingFit()` - Supports `transform()` method.
|
|
1343
|
+
* `OutlierFilterFit()` - Supports `transform()` method.
|
|
1344
|
+
* `PolynomialFeaturesFit()` - Supports `transform()` method.
|
|
1345
|
+
* `RandomProjectionFit()` - Supports `transform()` method.
|
|
1346
|
+
* `RowNormalizeFit()` - Supports `transform()` method.
|
|
1347
|
+
* `ScaleFit()` - Supports `transform()` method.
|
|
1348
|
+
* `SimpleImputeFit()` - Supports `transform()` method.
|
|
1349
|
+
* `SVM()` - Supports `predict()`, `evaluate()` methods.
|
|
1350
|
+
* `TargetEncodingFit()` - Supports `transform()` method.
|
|
1351
|
+
* `XGBoost()` - Supports `predict()`, `evaluate()` methods.
|
|
1352
|
+
* Time Series Analytic (UAF) Functions
|
|
1353
|
+
* `ArimaEstimate()` - Supports `forecast()`, `validate()` methods.
|
|
1354
|
+
* `DFFT()` - Supports `convolve()`, `inverse()` methods.
|
|
1355
|
+
* `IDFFT()` - Supports `inverse()` method.
|
|
1356
|
+
* `DFFT2()` - Supports `convolve()`, `inverse()` methods.
|
|
1357
|
+
* `IDFFT2()` - Supports `inverse()` method.
|
|
1358
|
+
* `DIFF()` - Supports `inverse()` method.
|
|
1359
|
+
* `UNDIFF()` - Supports `inverse()` method.
|
|
1360
|
+
* `SeasonalNormalize()` - Supports `inverse()` method.
|
|
1361
|
+
|
|
1362
|
+
* ###### teradataml: DataFrame
|
|
1363
|
+
* New Functions
|
|
1364
|
+
* `DataFrame.plot()` - Generates the below type of plots on teradataml DataFrame.
|
|
1365
|
+
* line - Generates line plot.
|
|
1366
|
+
* bar - Generates bar plot.
|
|
1367
|
+
* scatter - Generates scatter plot.
|
|
1368
|
+
* corr - Generates correlation plot.
|
|
1369
|
+
* wiggle - Generates a wiggle plot.
|
|
1370
|
+
* mesh - Generates a mesh plot.
|
|
1371
|
+
* `DataFrame.itertuples()` - iterate over teradataml DataFrame rows as namedtuples or list.
|
|
1372
|
+
* ###### teradataml: GeoDataFrame
|
|
1373
|
+
* New Functions
|
|
1374
|
+
* `GeoDataFrame.plot()` - Generate the below type of plots on teradataml GeoDataFrame.
|
|
1375
|
+
* line - Generates line plot.
|
|
1376
|
+
* bar - Generates bar plot.
|
|
1377
|
+
* scatter - Generates scatter plot.
|
|
1378
|
+
* corr - Generates correlation plot.
|
|
1379
|
+
* wiggle - Generates a wiggle plot.
|
|
1380
|
+
* mesh - Generates a mesh plot.
|
|
1381
|
+
* geometry - Generates plot on geospatial data.
|
|
1382
|
+
* Plot:
|
|
1383
|
+
* `Axis` - Generates the axis for plot.
|
|
1384
|
+
* `Figure` - Generates the figure for plot.
|
|
1385
|
+
* `subplots` - Helps in generating multiple plots on a single `Figure`.
|
|
1386
|
+
* Bring Your Own Model (BYOM) Function:
|
|
1387
|
+
* `DataikuPredict` - Score the data in Vantage using the model trained externally in Dataiku UI and stored in Vantage.
|
|
1388
|
+
* `async_run_status()` - Function to check the status of asynchronous run(s) using unique run id(s).
|
|
1389
|
+
|
|
1390
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
1391
|
+
* _Regular Arithmetic Functions_
|
|
1392
|
+
* `DataFrameColumn.abs()` - Computes the absolute value.
|
|
1393
|
+
* `DataFrameColumn.ceil()` - Returns the ceiling value of the column.
|
|
1394
|
+
* `DataFrameColumn.ceiling()` - It is an alias for `DataFrameColumn.ceil()` function.
|
|
1395
|
+
* `DataFrameColumn.degrees()` - Converts radians value from the column to degrees.
|
|
1396
|
+
* `DataFrameColumn.exp()` - Raises e (the base of natural logarithms) to the power of the value in the column, where e = 2.71828182845905.
|
|
1397
|
+
* `DataFrameColumn.floor()` - Returns the largest integer equal to or less than the value in the column.
|
|
1398
|
+
* `DataFrameColumn.ln()` - Computes the natural logarithm of values in column.
|
|
1399
|
+
* `DataFrameColumn.log10()` - Computes the base 10 logarithm.
|
|
1400
|
+
* `DataFrameColumn.mod()` - Returns the modulus of the column.
|
|
1401
|
+
* `DataFrameColumn.pmod()` - It is an alias for `DataFrameColumn.mod()` function.
|
|
1402
|
+
* `DataFrameColumn.nullifzero()` - Converts data from zero to null to avoid problems with division by zero.
|
|
1403
|
+
* `DataFrameColumn.pow()` - Computes the power of the column raised to expression or constant.
|
|
1404
|
+
* `DataFrameColumn.power()` - It is an alias for `DataFrameColumn.pow()` function.
|
|
1405
|
+
* `DataFrameColumn.radians()` - Converts degree value from the column to radians.
|
|
1406
|
+
* `DataFrameColumn.round()` - Returns the rounded off value.
|
|
1407
|
+
* `DataFrameColumn.sign()` - Returns the sign.
|
|
1408
|
+
* `DataFrameColumn.signum()` - It is an alias for `DataFrameColumn.sign()` function.
|
|
1409
|
+
* `DataFrameColumn.sqrt()` - Computes the square root of values in the column.
|
|
1410
|
+
* `DataFrameColumn.trunc()` - Provides the truncated value of columns.
|
|
1411
|
+
* `DataFrameColumn.width_bucket()` - Returns the number of the partition to which column is assigned.
|
|
1412
|
+
* `DataFrameColumn.zeroifnull()` - Converts data from null to zero to avoid problems with null.
|
|
1413
|
+
* _Trigonometric Functions_
|
|
1414
|
+
* `DataFrameColumn.acos()` - Returns the arc-cosine value.
|
|
1415
|
+
* `DataFrameColumn.asin()` - Returns the arc-sine value.
|
|
1416
|
+
* `DataFrameColumn.atan()` - Returns the arc-tangent value.
|
|
1417
|
+
* `DataFrameColumn.atan2()` - Returns the arc-tangent value based on x and y coordinates.
|
|
1418
|
+
* `DataFrameColumn.cos()` - Returns the cosine value.
|
|
1419
|
+
* `DataFrameColumn.sin()` - Returns the sine value.
|
|
1420
|
+
* `DataFrameColumn.tan()` - Returns the tangent value.
|
|
1421
|
+
* _Hyperbolic Functions_
|
|
1422
|
+
* `DataFrameColumn.acosh()` - Returns the inverse hyperbolic cosine value.
|
|
1423
|
+
* `DataFrameColumn.asinh()` - Returns the inverse hyperbolic sine value.
|
|
1424
|
+
* `DataFrameColumn.atanh()` - Returns the inverse hyperbolic tangent value.
|
|
1425
|
+
* `DataFrameColumn.cosh()` - Returns the hyperbolic cosine value.
|
|
1426
|
+
* `DataFrameColumn.sinh()` - Returns the hyperbolic sine value.
|
|
1427
|
+
* `DataFrameColumn.tanh()` - Returns the hyperbolic tangent value.
|
|
1428
|
+
* _String Functions_
|
|
1429
|
+
* `DataFrameColumn.ascii()` - Returns the decimal representation of the first character in column.
|
|
1430
|
+
* `DataFrameColumn.char2hexint()` - Returns the hexadecimal representation for a character string in a column.
|
|
1431
|
+
* `DataFrameColumn.chr()` - Returns the Latin ASCII character of a given numeric code value in column.
|
|
1432
|
+
* `DataFrameColumn.char()` - It is an alias for `DataFrameColumn.chr()` function.
|
|
1433
|
+
* `DataFrameColumn.character_length()` - Returns the number of characters in the column.
|
|
1434
|
+
* `DataFrameColumn.char_length()` - It is an alias for `DataFrameColumn.character_length()` function.
|
|
1435
|
+
* `DataFrameColumn.edit_distance()` - Returns the minimum number of edit operations required to
|
|
1436
|
+
transform string in a column into string specified in argument.
|
|
1437
|
+
* `DataFrameColumn.index()` - Returns the position of a string in a column where string specified in argument starts.
|
|
1438
|
+
* `DataFrameColumn.initcap()` - Modifies a string column and returns the string with the first character
|
|
1439
|
+
of each word in uppercase.
|
|
1440
|
+
* `DataFrameColumn.instr()` - Searches the string in a column for occurrences of search string passed as argument.
|
|
1441
|
+
* `DataFrameColumn.lcase()` - Returns a character string identical to string values in column,
|
|
1442
|
+
with all uppercase letters replaced with their lowercase equivalents.
|
|
1443
|
+
* `DataFrameColumn.left()` - Truncates string in a column to a specified number of characters desired from
|
|
1444
|
+
the left side of the string.
|
|
1445
|
+
* `DataFrameColumn.length()` - It is an alias for `DataFrameColumn.character_length()` function.
|
|
1446
|
+
* `DataFrameColumn.levenshtein()` - It is an alias for `DataFrameColumn.edit_distance()` function.
|
|
1447
|
+
* `DataFrameColumn.locate()` - Returns the position of the first occurrence of a string in a column within
|
|
1448
|
+
string in argument.
|
|
1449
|
+
* `DataFrameColumn.lower()` - It is an alias for `DataFrameColumn.lcase()` function.
|
|
1450
|
+
* `DataFrameColumn.lpad()` - Returns the string in a column padded to the left with the characters specified
|
|
1451
|
+
in argument so that the resulting string has length specified in argument.
|
|
1452
|
+
* `DataFrameColumn.ltrim()` - Returns the string in a column, with its left-most characters removed up
|
|
1453
|
+
to the first character that is not in the string specified in argument.
|
|
1454
|
+
* `DataFrameColumn.ngram()` - Returns the number of n-gram matches between string in a column,
|
|
1455
|
+
and string specified in argument.
|
|
1456
|
+
* `DataFrameColumn.nvp()` - Extracts the value of a name-value pair where the name in the pair matches
|
|
1457
|
+
the name and the number of the occurrence specified.
|
|
1458
|
+
* `DataFrameColumn.oreplace()` - Replaces every occurrence of search string in the column.
|
|
1459
|
+
* `DataFrameColumn.otranslate()` - Returns string in a column with every occurrence of each character in
|
|
1460
|
+
string in argument replaced with the corresponding character in another argument.
|
|
1461
|
+
* `DataFrameColumn.replace()` - It is an alias for `DataFrameColumn.oreplace()` function.
|
|
1462
|
+
* `DataFrameColumn.reverse()` - Returns the reverse of string in column.
|
|
1463
|
+
* `DataFrameColumn.right()` - Truncates input string to a specified number of characters desired from
|
|
1464
|
+
the right side of the string.
|
|
1465
|
+
* `DataFrameColumn.rpad()` - Returns the string in a column padded to the right with the characters specified
|
|
1466
|
+
in argument so the resulting string has length specified in argument.
|
|
1467
|
+
* `DataFrameColumn.rtrim()` - Returns the string in column, with its right-most characters removed up
|
|
1468
|
+
to the first character that is not in the string specified in argument.
|
|
1469
|
+
* `DataFrameColumn.soundex()` - Returns a character string that represents the Soundex code for
|
|
1470
|
+
string in a column.
|
|
1471
|
+
* `DataFrameColumn.string_cs()` - Returns a heuristically derived integer value that can be used to determine
|
|
1472
|
+
which KANJI1-compatible client character set was used to encode string in a column.
|
|
1473
|
+
* `DataFrameColumn.translate()` - It is an alias for `DataFrameColumn.otranslate()` function.
|
|
1474
|
+
* `DataFrameColumn.upper()` - Returns a character string with all lowercase letters in a column replaced
|
|
1475
|
+
with their uppercase equivalents.
|
|
1476
|
+
|
|
1477
|
+
* ##### teradataml Options
|
|
1478
|
+
* Configuration Options
|
|
1479
|
+
* `configure.indb_install_location`
|
|
1480
|
+
Specifies the installation location of In-DB Python package.
|
|
1481
|
+
|
|
1482
|
+
* ##### Updates
|
|
1483
|
+
* Open Analytics Framework (OpenAF) APIs:
|
|
1484
|
+
* `set_auth_token()`
|
|
1485
|
+
* `set_auth_token()` does not accept username and password anymore. Instead, function opens up a browser session and user should authenticate in browser.
|
|
1486
|
+
* After token expiry, teradataml will open a browser and user needs to authenticate again.
|
|
1487
|
+
* If client machine does not have browser, then user should copy the URL posted by teradataml and authenticate themselves.
|
|
1488
|
+
* Security fixes - `auth_token` is not set or retrieved from the `configure` option anymore.
|
|
1489
|
+
* Manage all user environments.
|
|
1490
|
+
* `create_env()` - supports creation of R environment.
|
|
1491
|
+
* `remove_env()` - Supports removal of remote R environment.
|
|
1492
|
+
* `remove_all_envs()` - Supports removal of all remote R environments.
|
|
1493
|
+
* `remove_env()` and `remove_all_envs()` support asynchronous calls.
|
|
1494
|
+
* UserEnv Class – Supports managing of R remote environments.
|
|
1495
|
+
* Properties:
|
|
1496
|
+
* `libs` - Supports listing of libraries in R remote environment.
|
|
1497
|
+
* Methods:
|
|
1498
|
+
* `install_lib()` - Supports installing of libraries in remote R environment.
|
|
1499
|
+
* `uninstall_lib()` - Supports uninstalling of libraries in remote R environment.
|
|
1500
|
+
* `update_lib()` - Supports updating of libraries in remote R environment.
|
|
1501
|
+
* Unbounded Array Framework (UAF) Functions:
|
|
1502
|
+
* `ArimaEstimate()`
|
|
1503
|
+
* Added support for `CSS` algorithm via `algorithm` argument.
|
|
1504
|
+
|
|
1505
|
+
* ##### Bug Fixes
|
|
1506
|
+
* Installation location of In-DB 2.0.0 package is changed. Script() will now work with both 2.0.0 and previous version.
|
|
1507
|
+
|
|
1508
|
+
## Release Notes:
|
|
1509
|
+
#### teradataml 17.20.00.04
|
|
1510
|
+
* ##### New Features/Functionality
|
|
1511
|
+
* teradataml is now compatible with SQLAlchemy 2.0.X
|
|
1512
|
+
* **Important notes** when user has sqlalchemy version >= 2.0:
|
|
1513
|
+
* Users will not be able to run the `execute()` method on SQLAlchemy engine object returned by
|
|
1514
|
+
`get_context()` and `create_context()` teradataml functions. This is because SQLAlchemy has
|
|
1515
|
+
removed the support for `execute()` method on the engine object. Thus, user scripts where
|
|
1516
|
+
`get_context().execute()` and `create_context().execute()` are used, Teradata recommends to
|
|
1517
|
+
replace those with either `execute_sql()` function exposed by teradataml or `exec_driver_sql()`
|
|
1518
|
+
method on the `Connection` object returned by `get_connection()` function in teradataml.
|
|
1519
|
+
* Now `get_connection().execute()` accepts only executable sqlalchemy object. Refer to
|
|
1520
|
+
`sqlalchemy.engine.base.execute()` for more details.
|
|
1521
|
+
* Teradata recommends to use either `execute_sql()` function exposed by teradataml or
|
|
1522
|
+
`exec_driver_sql()` method on the `Connection` object returned by `get_connection()`
|
|
1523
|
+
function in teradataml, in such cases.
|
|
1524
|
+
* New utility function `execute_sql()` is added to execute the SQL.
|
|
1525
|
+
* Extending compatibility for MAC with ARM processors.
|
|
1526
|
+
* Added support for floor division (//) between two teradataml DataFrame Columns.
|
|
1527
|
+
* Analytics Database Analytic Functions:
|
|
1528
|
+
* `GLMPerSegment()`
|
|
1529
|
+
* `GLMPredictPerSegment()`
|
|
1530
|
+
* `OneClassSVM()`
|
|
1531
|
+
* `OneClassSVMPredict()`
|
|
1532
|
+
* `SVM()`
|
|
1533
|
+
* `SVMPredict()`
|
|
1534
|
+
* `TargetEncodingFit()`
|
|
1535
|
+
* `TargetEncodingTransform()`
|
|
1536
|
+
* `TrainTestSplit()`
|
|
1537
|
+
* `WordEmbeddings()`
|
|
1538
|
+
* `XGBoost()`
|
|
1539
|
+
* `XGBoostPredict()`
|
|
1540
|
+
|
|
1541
|
+
* ###### teradataml Options
|
|
1542
|
+
* Display Options
|
|
1543
|
+
* `display.geometry_column_length`
|
|
1544
|
+
Option to display the default length of geometry column in GeoDataFrame.
|
|
1545
|
+
|
|
1546
|
+
* ##### Updates
|
|
1547
|
+
* `set_auth_token()` function can generate the client id automatically based on org_id when user does not specify it.
|
|
1548
|
+
* Analytics Database Analytic Functions:
|
|
1549
|
+
* `ColumnTransformer()`
|
|
1550
|
+
* Does not allow list values for arguments - `onehotencoding_fit_data` and `ordinalencoding_fit_data`.
|
|
1551
|
+
* `OrdinalEncodingFit()`
|
|
1552
|
+
* New arguments added - `category_data`, `target_column_names`, `categories_column`, `ordinal_values_column`.
|
|
1553
|
+
* Allows the list of values for arguments - `target_column`, `start_value`, `default_value`.
|
|
1554
|
+
* `OneHotEncodingFit()`
|
|
1555
|
+
* New arguments added - `category_data`, `approach`, `target_columns`, `categories_column`, `category_counts`.
|
|
1556
|
+
* Allows the list of values for arguments - `target_column`, `other_column`.
|
|
1557
|
+
|
|
1558
|
+
* ##### Bug Fixes
|
|
1559
|
+
* `DataFrame.sample()` method output is now deterministic.
|
|
1560
|
+
* `copy_to_sql()` now preserves the rows of the table even when the view content is copied to the same table name.
|
|
1561
|
+
* `list_user_envs()` does not raise warning when no user environments found.
|
|
1562
|
+
|
|
1563
|
+
## Release Notes:
|
|
1564
|
+
#### teradataml 17.20.00.03
|
|
1565
|
+
|
|
1566
|
+
* ##### Updates
|
|
1567
|
+
* DataFrame.join
|
|
1568
|
+
* New arguments `lprefix` and `rprefix` added.
|
|
1569
|
+
* Behavior of arguments `lsuffix` and `rsuffix` will be changed in future, use new arguments instead.
|
|
1570
|
+
* New and old affix arguments can now be used independently.
|
|
1571
|
+
* Analytic functions can be imported regardless of context creation.
|
|
1572
|
+
Import after create context constraint is now removed.
|
|
1573
|
+
* `ReadNOS` and `WriteNOS` now accept dictionary value for `authorization` and `row_format` arguments.
|
|
1574
|
+
* `WriteNOS` supports writing CSV files to external store.
|
|
1575
|
+
* Following model cataloging APIs will be deprecated in future:
|
|
1576
|
+
* describe_model
|
|
1577
|
+
* delete_model
|
|
1578
|
+
* list_models
|
|
1579
|
+
* publish_model
|
|
1580
|
+
* retrieve_model
|
|
1581
|
+
* save_model
|
|
1582
|
+
|
|
1583
|
+
* ##### Bug Fixes
|
|
1584
|
+
* `copy_to_sql()` bug related to NaT value has been fixed.
|
|
1585
|
+
* Tooltip on PyCharm IDE now points to SQLE.
|
|
1586
|
+
* `value` argument of `FillNa()`, a Vantage Analytic Library function supports special characters.
|
|
1587
|
+
* `case` function accepts DataFrame column as value in `whens` argument.
|
|
1588
|
+
|
|
1589
|
+
## Release Notes:
|
|
1590
|
+
#### teradataml 17.20.00.02
|
|
1591
|
+
* ##### New Features/Functionality
|
|
1592
|
+
* ###### teradataml: Open Analytics
|
|
1593
|
+
* New Functions
|
|
1594
|
+
* `set_auth_token()` - Sets the JWT token automatically for using Open AF APIs.
|
|
1595
|
+
|
|
1596
|
+
* ###### teradataml Options
|
|
1597
|
+
* Display Options
|
|
1598
|
+
* `display.suppress_vantage_runtime_warnings`
|
|
1599
|
+
Suppresses the VantageRuntimeWarning raised by teradataml, when set to True.
|
|
1600
|
+
|
|
1601
|
+
* ##### Updates
|
|
1602
|
+
* SimpleImputeFit function arguments `stats_columns` and `stats` are made to be optional.
|
|
1603
|
+
* New argument `table_format` is added to ReadNOS().
|
|
1604
|
+
* Argument `full_scan` is changed to `scan_pct` in ReadNOS().
|
|
1605
|
+
|
|
1606
|
+
* ##### Bug Fixes
|
|
1607
|
+
* Minor bug fix related to read_csv.
|
|
1608
|
+
* APPLY and `DataFrame.apply()` supports hash by and local order by.
|
|
1609
|
+
* Output column names are changed for DataFrame.dtypes and DataFrame.tdtypes.
|
|
1610
|
+
|
|
1611
|
+
## Release Notes:
|
|
1612
|
+
#### teradataml 17.20.00.01
|
|
1613
|
+
* ##### New Features/Functionality
|
|
1614
|
+
* ###### teradataml: DataFrame
|
|
1615
|
+
* New Functions
|
|
1616
|
+
* `DataFrame.pivot()` - Rotate data from rows into columns to create easy-to-read DataFrames.
|
|
1617
|
+
* `DataFrame.unpivot()` - Rotate data from columns into rows to create easy-to-read DataFrames.
|
|
1618
|
+
* `DataFrame.drop_duplicate()` - Drop duplicate rows from teradataml DataFrame.
|
|
1619
|
+
* New properties
|
|
1620
|
+
* `DataFrame.is_art` - Check whether teradataml DataFrame is created on an Analytic Result Table, i.e., ART table or not.
|
|
1621
|
+
|
|
1622
|
+
* ###### teradataml: Unbounded Array Framework (UAF) Functions:
|
|
1623
|
+
* New Functions
|
|
1624
|
+
* New Functions Supported on Database Versions: 17.20.x.x
|
|
1625
|
+
* MODEL PREPARATION AND PARAMETER ESTIMATION functions:
|
|
1626
|
+
1. `ACF()`
|
|
1627
|
+
2. `ArimaEstimate()`
|
|
1628
|
+
3. `ArimaValidate()`
|
|
1629
|
+
4. `DIFF()`
|
|
1630
|
+
5. `LinearRegr()`
|
|
1631
|
+
6. `MultivarRegr()`
|
|
1632
|
+
7. `PACF()`
|
|
1633
|
+
8. `PowerTransform()`
|
|
1634
|
+
9. `SeasonalNormalize()`
|
|
1635
|
+
10. `Smoothma()`
|
|
1636
|
+
11. `UNDIFF()`
|
|
1637
|
+
12. `Unnormalize()`
|
|
1638
|
+
* SERIES FORECASTING functions:
|
|
1639
|
+
1. `ArimaForecast()`
|
|
1640
|
+
2. `DTW()`
|
|
1641
|
+
3. `HoltWintersForecaster()`
|
|
1642
|
+
4. `MAMean()`
|
|
1643
|
+
5. `SimpleExp()`
|
|
1644
|
+
* DATA PREPARATION functions:
|
|
1645
|
+
1. `BinaryMatrixOp()`
|
|
1646
|
+
2. `BinarySeriesOp()`
|
|
1647
|
+
3. `GenseriesFormula()`
|
|
1648
|
+
4. `MatrixMultiply()`
|
|
1649
|
+
5. `Resample()`
|
|
1650
|
+
* DIAGNOSTIC STATISTICAL TEST functions:
|
|
1651
|
+
1. `BreuschGodfrey()`
|
|
1652
|
+
2. `BreuschPaganGodfrey()`
|
|
1653
|
+
3. `CumulPeriodogram()`
|
|
1654
|
+
4. `DickeyFuller()`
|
|
1655
|
+
5. `DurbinWatson()`
|
|
1656
|
+
6. `FitMetrics()`
|
|
1657
|
+
7. `GoldfeldQuandt()`
|
|
1658
|
+
8. `Portman()`
|
|
1659
|
+
9. `SelectionCriteria()`
|
|
1660
|
+
10. `SignifPeriodicities()`
|
|
1661
|
+
11. `SignifResidmean()`
|
|
1662
|
+
12. `WhitesGeneral()`
|
|
1663
|
+
* TEMPORAL AND SPATIAL functions:
|
|
1664
|
+
1. `Convolve()`
|
|
1665
|
+
2. `Convolve2()`
|
|
1666
|
+
3. `DFFT()`
|
|
1667
|
+
4. `DFFT2()`
|
|
1668
|
+
5. `DFFT2Conv()`
|
|
1669
|
+
6. `DFFTConv()`
|
|
1670
|
+
7. `GenseriesSinusoids()`
|
|
1671
|
+
8. `IDFFT()`
|
|
1672
|
+
9. `IDFFT2()`
|
|
1673
|
+
10. `LineSpec()`
|
|
1674
|
+
11. `PowerSpec()`
|
|
1675
|
+
* GENERAL UTILITY functions:
|
|
1676
|
+
1. `ExtractResults()`
|
|
1677
|
+
2. `InputValidator()`
|
|
1678
|
+
3. `MInfo()`
|
|
1679
|
+
4. `SInfo()`
|
|
1680
|
+
5. `TrackingOp()`
|
|
1681
|
+
|
|
1682
|
+
* New Features: Inputs to Unbounded Array Framework (UAF) functions
|
|
1683
|
+
* `TDAnalyticResult()` - Allows to prepare function output generated by UAF functions to be passed.
|
|
1684
|
+
* `TDGenSeries()` - Allows to generate a series, that can be passed to a UAF function.
|
|
1685
|
+
* `TDMatrix()` - Represents a Matrix in time series, that can be created from a teradataml DataFrame.
|
|
1686
|
+
* `TDSeries()` - Represents a Series in time series, that can be created from a teradataml DataFrame.
|
|
1687
|
+
|
|
1688
|
+
* ##### Updates
|
|
1689
|
+
* Native Object Store (NOS) functions support authorization by specifying authorization object.
|
|
1690
|
+
* `display_analytic_functions()` categorizes the analytic functions based on function type.
|
|
1691
|
+
* ColumnTransformer accepts multiple values for arguments nonlinearcombine_fit_data,
|
|
1692
|
+
onehotencoding_fit_data, ordinalencoding_fit_data.
|
|
1693
|
+
|
|
1694
|
+
* ##### Bug Fixes
|
|
1695
|
+
* Redundant warnings thrown by teradataml are suppressed.
|
|
1696
|
+
* OpenAF is supported when context is created with JWT token.
|
|
1697
|
+
* New argument "match_column_order" added to copy_to_sql, that allows DataFrame loading with any column order.
|
|
1698
|
+
* `copy_to_sql` updated to map data type timezone(tzinfo) to TIMESTAMP(timezone=True), instead of VARCHAR.
|
|
1699
|
+
* Improved performance for DataFrame.sum and DataFrameColumn.sum functions.
|
|
1700
|
+
|
|
1701
|
+
## Release Notes:
|
|
1702
|
+
#### teradataml 17.20.00.00
|
|
1703
|
+
* ##### New Features/Functionality
|
|
1704
|
+
* ###### teradataml: Analytics Database Analytic Functions
|
|
1705
|
+
* _New Functions_
|
|
1706
|
+
* ###### New Functions Supported on Database Versions: 17.20.x.x
|
|
1707
|
+
* `ANOVA()`
|
|
1708
|
+
* `ClassificationEvaluator()`
|
|
1709
|
+
* `ColumnTransformer()`
|
|
1710
|
+
* `DecisionForest()`
|
|
1711
|
+
* `GLM()`
|
|
1712
|
+
* `GetFutileColumns()`
|
|
1713
|
+
* `KMeans()`
|
|
1714
|
+
* `KMeansPredict()`
|
|
1715
|
+
* `NaiveBayesTextClassifierTrainer()`
|
|
1716
|
+
* `NonLinearCombineFit()`
|
|
1717
|
+
* `NonLinearCombineTransform()`
|
|
1718
|
+
* `OrdinalEncodingFit()`
|
|
1719
|
+
* `OrdinalEncodingTransform()`
|
|
1720
|
+
* `RandomProjectionComponents()`
|
|
1721
|
+
* `RandomProjectionFit()`
|
|
1722
|
+
* `RandomProjectionTransform()`
|
|
1723
|
+
* `RegressionEvaluator()`
|
|
1724
|
+
* `ROC()`
|
|
1725
|
+
* `SentimentExtractor()`
|
|
1726
|
+
* `Silhouette()`
|
|
1727
|
+
* `TDGLMPredict()`
|
|
1728
|
+
* `TextParser()`
|
|
1729
|
+
* `VectorDistance()`
|
|
1730
|
+
* _Updates_
|
|
1731
|
+
* `display_analytic_functions()` categorizes the analytic functions based on function type.
|
|
1732
|
+
* Users can provide range value for columns argument.
|
|
1733
|
+
|
|
1734
|
+
* ###### teradataml: Open Analytics
|
|
1735
|
+
* Manage all user environments.
|
|
1736
|
+
* `list_base_envs()` - list the available python base versions.
|
|
1737
|
+
* `create_env()` - create a new user environment.
|
|
1738
|
+
* `get_env()` - get existing user environment.
|
|
1739
|
+
* `list_user_envs()` - list the available user environments.
|
|
1740
|
+
* `remove_env()` - delete user environment.
|
|
1741
|
+
* `remove_all_envs()` - delete all the user environments.
|
|
1742
|
+
* UserEnv Class – Manage individual user environment.
|
|
1743
|
+
* Properties
|
|
1744
|
+
* `files` - Get files in user environment.
|
|
1745
|
+
* `libs` - Get libraries in user environment.
|
|
1746
|
+
* Methods
|
|
1747
|
+
* `install_file()` - Install a file in user environment.
|
|
1748
|
+
* `remove_file()` - Remove a file in user environment.
|
|
1749
|
+
* `install_lib()` - Install a library in user environment.
|
|
1750
|
+
* `update_lib()` - Update a library in user environment.
|
|
1751
|
+
* `uninstall_lib()` - Uninstall a library in user environment.
|
|
1752
|
+
* `status()` - Check the status of
|
|
1753
|
+
* file installation
|
|
1754
|
+
* library installation
|
|
1755
|
+
* library update
|
|
1756
|
+
* library uninstallation
|
|
1757
|
+
* `refresh()` - Refresh the environment details in local client.
|
|
1758
|
+
* Apply Class – Execute a user script on VantageCloud Lake.
|
|
1759
|
+
* `__init__()` - Instantiate an object of apply for script execution.
|
|
1760
|
+
* `install_file()` - Install a file in user environment.
|
|
1761
|
+
* `remove_file()` - Remove a file in user environment.
|
|
1762
|
+
* `set_data()` – Reset data and related arguments.
|
|
1763
|
+
* `execute_script()` – Executes Python script.
|
|
1764
|
+
|
|
1765
|
+
* ###### teradataml: DataFrame
|
|
1766
|
+
* _New Functions_
|
|
1767
|
+
* `DataFrame.apply()` - Execute a user defined Python function on VantageCloud Lake.
|
|
1768
|
+
|
|
1769
|
+
* ###### teradataml: Bring Your Own Model
|
|
1770
|
+
* _New Functions_
|
|
1771
|
+
* `ONNXPredict()` - Score using model trained externally on ONNX and stored in Vantage.
|
|
1772
|
+
|
|
1773
|
+
* ###### teradataml: Options
|
|
1774
|
+
* _New Functions_
|
|
1775
|
+
* `set_config_params()` - New API to set all config params in one go.
|
|
1776
|
+
* _New Configuration Options_
|
|
1777
|
+
* For Open Analytics support.
|
|
1778
|
+
* ues_url – User Environment Service URL for VantageCloud Lake.
|
|
1779
|
+
* auth_token – Authentication token to connect to VantageCloud Lake.
|
|
1780
|
+
* certificate_file – Path to a CA_BUNDLE file or directory with certificates of trusted CAs.
|
|
1781
|
+
|
|
1782
|
+
* ##### Updates
|
|
1783
|
+
* `accumulate` argument is working for `ScaleTransform()`.
|
|
1784
|
+
* Following functions have `accumulate` argument added on Database Versions: 17.20.x.x
|
|
1785
|
+
* `ConvertTo()`
|
|
1786
|
+
* `GetRowsWithoutMissingValues()`
|
|
1787
|
+
* `GetRowsWithoutMissingValues()`
|
|
1788
|
+
* `OutlierFilterFit()` supports multiple output.
|
|
1789
|
+
* For `OutlierFilterFit()` function below arguments are optional in teradataml 17.20.x.x
|
|
1790
|
+
* `lower_percentile`
|
|
1791
|
+
* `upper_percentile`
|
|
1792
|
+
* `outlier_method`
|
|
1793
|
+
* `replacement_value`
|
|
1794
|
+
* `percentile_method`
|
|
1795
|
+
* Analytics Database analytic functions – In line help, i.e., help() for the functions
|
|
1796
|
+
is available.
|
|
1797
|
+
|
|
1798
|
+
* ##### Bug Fixes
|
|
1799
|
+
* Vantage Analytic Library FillNa() function: Now `columns` argument is required.
|
|
1800
|
+
* `output_responses` argument in MLE function `DecisionTreePredict()`, does not allow empty string.
|
|
1801
|
+
* teradataml closes docker sandbox environment properly.
|
|
1802
|
+
* Users can create context using JWT token.
|
|
1803
|
+
|
|
1804
|
+
#### teradataml 17.10.00.02
|
|
1805
|
+
* ##### New Features/Functionality
|
|
1806
|
+
* ###### Database Utility
|
|
1807
|
+
* `list_td_reserved_keywords()` - Validates if the specified string is a Teradata reserved
|
|
1808
|
+
keyword or not, else lists down all the Teradata reserved keywords.
|
|
1809
|
+
|
|
1810
|
+
* ##### Updates
|
|
1811
|
+
* ###### DataFrame
|
|
1812
|
+
* _Updates_
|
|
1813
|
+
* Multiple columns can be selected using slice operator ([]).
|
|
1814
|
+
|
|
1815
|
+
* ###### Script
|
|
1816
|
+
* _Updates_
|
|
1817
|
+
* A warning will be raised, when Teradata reserved keyword is used in Script local mode.
|
|
1818
|
+
|
|
1819
|
+
* ##### Bug Fixes
|
|
1820
|
+
* Numeric overflow issue observed for describe(), sum(), csum(), and mean() has been fixed.
|
|
1821
|
+
* Error messages are updated for SQLE function arguments accepting multiple datatypes.
|
|
1822
|
+
* Error messages are updated for SQLE function arguments volatile and persist arguments when
|
|
1823
|
+
non-boolean value is provided.
|
|
1824
|
+
* DataFrame sample() method can handle column names with special characters like space, hyphen,
|
|
1825
|
+
period etc.
|
|
1826
|
+
* In-DB SQLE functions can be loaded for any locale setting.
|
|
1827
|
+
* `create_context()` - Password containing special characters requires URL encoding as per
|
|
1828
|
+
https://docs.microfocus.com/OMi/10.62/Content/OMi/ExtGuide/ExtApps/URL_encoding.html.
|
|
1829
|
+
teradataml has added a fix to take care of the URL encoding of the password while creating a context.
|
|
1830
|
+
Also, a new argument is added to give more control over the URL encoding to be done at the time of context creation.
|
|
1831
|
+
|
|
1832
|
+
#### teradataml 17.10.00.01
|
|
1833
|
+
* ##### New Features/Functionality
|
|
1834
|
+
* ###### Geospatial
|
|
1835
|
+
The Geospatial feature in teradataml enables data manipulation, exploration and analysis on tables, views, and queries on Teradata Vantage that contains Geospatial data.
|
|
1836
|
+
* ###### Geometry Types
|
|
1837
|
+
* Point
|
|
1838
|
+
* LineString
|
|
1839
|
+
* Polygon
|
|
1840
|
+
* MultiPoint
|
|
1841
|
+
* MultiLineString
|
|
1842
|
+
* MultiPolygon
|
|
1843
|
+
* GeometryCollection
|
|
1844
|
+
* GeoSequence
|
|
1845
|
+
* ###### teradataml GeoDataFrame
|
|
1846
|
+
* Properties
|
|
1847
|
+
* columns
|
|
1848
|
+
* dtypes
|
|
1849
|
+
* geometry
|
|
1850
|
+
* iloc
|
|
1851
|
+
* index
|
|
1852
|
+
* loc
|
|
1853
|
+
* shape
|
|
1854
|
+
* size
|
|
1855
|
+
* tdtypes
|
|
1856
|
+
* Geospatial Specific Properties
|
|
1857
|
+
* ###### Properties for all Types of Geometries
|
|
1858
|
+
* boundary
|
|
1859
|
+
* centroid
|
|
1860
|
+
* convex_hull
|
|
1861
|
+
* coord_dim
|
|
1862
|
+
* dimension
|
|
1863
|
+
* geom_type
|
|
1864
|
+
* is_3D
|
|
1865
|
+
* is_empty
|
|
1866
|
+
* is_simple
|
|
1867
|
+
* is_valid
|
|
1868
|
+
* max_x
|
|
1869
|
+
* max_y
|
|
1870
|
+
* max_z
|
|
1871
|
+
* min_x
|
|
1872
|
+
* min_y
|
|
1873
|
+
* min_z
|
|
1874
|
+
* srid
|
|
1875
|
+
* ###### Properties for Point Geometry
|
|
1876
|
+
* x
|
|
1877
|
+
* y
|
|
1878
|
+
* z
|
|
1879
|
+
* ###### Properties for LineString Geometry
|
|
1880
|
+
* is_closed_3D
|
|
1881
|
+
* is_closed
|
|
1882
|
+
* is_ring
|
|
1883
|
+
* ###### Properties for Polygon Geometry
|
|
1884
|
+
* area
|
|
1885
|
+
* exterior
|
|
1886
|
+
* perimeter
|
|
1887
|
+
* Methods
|
|
1888
|
+
* `__getattr__()`
|
|
1889
|
+
* `__getitem__()`
|
|
1890
|
+
* `__init__()`
|
|
1891
|
+
* `__repr__()`
|
|
1892
|
+
* `assign()`
|
|
1893
|
+
* `concat()`
|
|
1894
|
+
* `count()`
|
|
1895
|
+
* `drop()`
|
|
1896
|
+
* `dropna()`
|
|
1897
|
+
* `filter()`
|
|
1898
|
+
* `from_query()`
|
|
1899
|
+
* `from_table()`
|
|
1900
|
+
* `get()`
|
|
1901
|
+
* `get_values()`
|
|
1902
|
+
* `groupby()`
|
|
1903
|
+
* `head()`
|
|
1904
|
+
* `info()`
|
|
1905
|
+
* `join()`
|
|
1906
|
+
* `keys()`
|
|
1907
|
+
* `merge()`
|
|
1908
|
+
* `sample()`
|
|
1909
|
+
* `select()`
|
|
1910
|
+
* `set_index()`
|
|
1911
|
+
* `show_query()`
|
|
1912
|
+
* `sort()`
|
|
1913
|
+
* `sort_index()`
|
|
1914
|
+
* `squeeze()`
|
|
1915
|
+
* `tail()`
|
|
1916
|
+
* `to_csv()`
|
|
1917
|
+
* `to_pandas()`
|
|
1918
|
+
* `to_sql()`
|
|
1919
|
+
* Geospatial Specific Methods
|
|
1920
|
+
* ###### Methods for All Types of Geometry
|
|
1921
|
+
* `buffer()`
|
|
1922
|
+
* `contains()`
|
|
1923
|
+
* `crosses()`
|
|
1924
|
+
* `difference()`
|
|
1925
|
+
* `disjoint()`
|
|
1926
|
+
* `distance()`
|
|
1927
|
+
* `distance_3D()`
|
|
1928
|
+
* `envelope()`
|
|
1929
|
+
* `geom_equals()`
|
|
1930
|
+
* `intersection()`
|
|
1931
|
+
* `intersects()`
|
|
1932
|
+
* `make_2D()`
|
|
1933
|
+
* `mbb()`
|
|
1934
|
+
* `mbr()`
|
|
1935
|
+
* `overlaps()`
|
|
1936
|
+
* `relates()`
|
|
1937
|
+
* `set_exterior()`
|
|
1938
|
+
* `set_srid()`
|
|
1939
|
+
* `simplify()`
|
|
1940
|
+
* `sym_difference()`
|
|
1941
|
+
* `to_binary()`
|
|
1942
|
+
* `to_text()`
|
|
1943
|
+
* `touches()`
|
|
1944
|
+
* `transform()`
|
|
1945
|
+
* `union()`
|
|
1946
|
+
* `within()`
|
|
1947
|
+
* `wkb_geom_to_sql()`
|
|
1948
|
+
* `wkt_geom_to_sql()`
|
|
1949
|
+
* ###### Methods for Point Geometry
|
|
1950
|
+
* `spherical_buffer()`
|
|
1951
|
+
* `spherical_distance()`
|
|
1952
|
+
* `spheroidal_buffer()`
|
|
1953
|
+
* `spheroidal_distance()`
|
|
1954
|
+
* `set_x()`
|
|
1955
|
+
* `set_y()`
|
|
1956
|
+
* `set_z()`
|
|
1957
|
+
* ###### Methods for LineString Geometry
|
|
1958
|
+
* `end_point()`
|
|
1959
|
+
* `length()`
|
|
1960
|
+
* `length_3D()`
|
|
1961
|
+
* `line_interpolate_point()`
|
|
1962
|
+
* `num_points()`
|
|
1963
|
+
* `point()`
|
|
1964
|
+
* `start_point()`
|
|
1965
|
+
* ###### Methods for Polygon Geometry
|
|
1966
|
+
* `interiors()`
|
|
1967
|
+
* `num_interior_ring()`
|
|
1968
|
+
* `point_on_surface()`
|
|
1969
|
+
* ###### Methods for GeometryCollection Geometry
|
|
1970
|
+
* `geom_component()`
|
|
1971
|
+
* `num_geometry()`
|
|
1972
|
+
* ###### Methods for GeoSequence Geometry
|
|
1973
|
+
* `clip()`
|
|
1974
|
+
* `get_final_timestamp()`
|
|
1975
|
+
* `get_init_timestamp()`
|
|
1976
|
+
* `get_link()`
|
|
1977
|
+
* `get_user_field()`
|
|
1978
|
+
* `get_user_field_count()`
|
|
1979
|
+
* `point_heading()`
|
|
1980
|
+
* `set_link()`
|
|
1981
|
+
* `speed()`
|
|
1982
|
+
* ###### Filtering Functions and Methods
|
|
1983
|
+
* `intersects_mbb()`
|
|
1984
|
+
* `mbb_filter()`
|
|
1985
|
+
* `mbr_filter()`
|
|
1986
|
+
* `within_mbb()`
|
|
1987
|
+
* ###### teradataml GeoDataFrameColumn
|
|
1988
|
+
* Geospatial Specific Properties
|
|
1989
|
+
* ###### Properties for all Types of Geometries
|
|
1990
|
+
* boundary
|
|
1991
|
+
* centroid
|
|
1992
|
+
* convex_hull
|
|
1993
|
+
* coord_dim
|
|
1994
|
+
* dimension
|
|
1995
|
+
* geom_type
|
|
1996
|
+
* is_3D
|
|
1997
|
+
* is_empty
|
|
1998
|
+
* is_simple
|
|
1999
|
+
* is_valid
|
|
2000
|
+
* max_x
|
|
2001
|
+
* max_y
|
|
2002
|
+
* max_z
|
|
2003
|
+
* min_x
|
|
2004
|
+
* min_y
|
|
2005
|
+
* min_z
|
|
2006
|
+
* srid
|
|
2007
|
+
* ###### Properties for Point Geometry
|
|
2008
|
+
* x
|
|
2009
|
+
* y
|
|
2010
|
+
* z
|
|
2011
|
+
* ###### Properties for LineString Geometry
|
|
2012
|
+
* is_closed_3D
|
|
2013
|
+
* is_closed
|
|
2014
|
+
* is_ring
|
|
2015
|
+
* ###### Properties for Polygon Geometry
|
|
2016
|
+
* area
|
|
2017
|
+
* exterior
|
|
2018
|
+
* perimeter
|
|
2019
|
+
* Geospatial Specific Methods
|
|
2020
|
+
* ###### Methods for All Types of Geometry
|
|
2021
|
+
* `buffer()`
|
|
2022
|
+
* `contains()`
|
|
2023
|
+
* `crosses()`
|
|
2024
|
+
* `difference()`
|
|
2025
|
+
* `disjoint()`
|
|
2026
|
+
* `distance()`
|
|
2027
|
+
* `distance_3D()`
|
|
2028
|
+
* `envelope()`
|
|
2029
|
+
* `geom_equals()`
|
|
2030
|
+
* `intersection()`
|
|
2031
|
+
* `intersects()`
|
|
2032
|
+
* `make_2D()`
|
|
2033
|
+
* `mbb()`
|
|
2034
|
+
* `mbr()`
|
|
2035
|
+
* `overlaps()`
|
|
2036
|
+
* `relates()`
|
|
2037
|
+
* `set_exterior()`
|
|
2038
|
+
* `set_srid()`
|
|
2039
|
+
* `simplify()`
|
|
2040
|
+
* `sym_difference()`
|
|
2041
|
+
* `to_binary()`
|
|
2042
|
+
* `to_text()`
|
|
2043
|
+
* `touches()`
|
|
2044
|
+
* `transform()`
|
|
2045
|
+
* `union()`
|
|
2046
|
+
* `within()`
|
|
2047
|
+
* `wkb_geom_to_sql()`
|
|
2048
|
+
* `wkt_geom_to_sql()`
|
|
2049
|
+
* ###### Methods for Point Geometry
|
|
2050
|
+
* `spherical_buffer()`
|
|
2051
|
+
* `spherical_distance()`
|
|
2052
|
+
* `spheroidal_buffer()`
|
|
2053
|
+
* `spheroidal_distance()`
|
|
2054
|
+
* `set_x()`
|
|
2055
|
+
* `set_y()`
|
|
2056
|
+
* `set_z()`
|
|
2057
|
+
* ###### Methods for LineString Geometry
|
|
2058
|
+
* `end_point()`
|
|
2059
|
+
* `length()`
|
|
2060
|
+
* `length_3D()`
|
|
2061
|
+
* `line_interpolate_point()`
|
|
2062
|
+
* `num_points()`
|
|
2063
|
+
* `point()`
|
|
2064
|
+
* `start_point()`
|
|
2065
|
+
* ###### Methods for Polygon Geometry
|
|
2066
|
+
* `interiors()`
|
|
2067
|
+
* `num_interior_ring()`
|
|
2068
|
+
* `point_on_surface()`
|
|
2069
|
+
* ###### Methods for GeometryCollection Geometry
|
|
2070
|
+
* `geom_component()`
|
|
2071
|
+
* `num_geometry()`
|
|
2072
|
+
* ###### Methods for GeoSequence Geometry
|
|
2073
|
+
* `clip()`
|
|
2074
|
+
* `get_final_timestamp()`
|
|
2075
|
+
* `get_init_timestamp()`
|
|
2076
|
+
* `get_link()`
|
|
2077
|
+
* `get_user_field()`
|
|
2078
|
+
* `get_user_field_count()`
|
|
2079
|
+
* `point_heading()`
|
|
2080
|
+
* `set_link()`
|
|
2081
|
+
* `speed()`
|
|
2082
|
+
* ###### Filtering Functions and Methods
|
|
2083
|
+
* `intersects_mbb()`
|
|
2084
|
+
* `mbb_filter()`
|
|
2085
|
+
* `mbr_filter()`
|
|
2086
|
+
* `within_mbb()`
|
|
2087
|
+
|
|
2088
|
+
* ###### teradataml DataFrame
|
|
2089
|
+
* _New Functions_
|
|
2090
|
+
* `to_csv()`
|
|
2091
|
+
|
|
2092
|
+
* ###### teradataml: SQLE Engine Analytic Functions
|
|
2093
|
+
* _New Functions_
|
|
2094
|
+
* Newly added SQLE functions are accessible only after establishing the connection to Vantage.
|
|
2095
|
+
* `display_analytic_functions()` API displays all the available SQLE Analytic functions based on database version.
|
|
2096
|
+
* ###### Functions Supported on DatabaseVersions: 16.20.x.x, 17.10.x.x, 17.05.x.x
|
|
2097
|
+
* `Antiselect()`
|
|
2098
|
+
* `Attribution()`
|
|
2099
|
+
* `DecisionForestPredict()`
|
|
2100
|
+
* `DecisionTreePredict()`
|
|
2101
|
+
* `GLMPredict()`
|
|
2102
|
+
* `MovingAverage()`
|
|
2103
|
+
* `NaiveBayesPredict()`
|
|
2104
|
+
* `NaiveBayesTextClassifierPredict()`
|
|
2105
|
+
* `NGramSplitter()`
|
|
2106
|
+
* `NPath()`
|
|
2107
|
+
* `Pack()`
|
|
2108
|
+
* `Sessionize()`
|
|
2109
|
+
* `StringSimilarity()`
|
|
2110
|
+
* `SVMParsePredict()`
|
|
2111
|
+
* `Unpack()`
|
|
2112
|
+
* ###### Functions Supported on DatabaseVersions: 17.10.x.x
|
|
2113
|
+
* `Antiselect()`
|
|
2114
|
+
* `Attribution()`
|
|
2115
|
+
* `BincodeFit()`
|
|
2116
|
+
* `BincodeTransform()`
|
|
2117
|
+
* `CategoricalSummary()`
|
|
2118
|
+
* `ChiSq()`
|
|
2119
|
+
* `ColumnSummary()`
|
|
2120
|
+
* `ConvertTo()`
|
|
2121
|
+
* `DecisionForestPredict()`
|
|
2122
|
+
* `DecisionTreePredict()`
|
|
2123
|
+
* `GLMPredict()`
|
|
2124
|
+
* `FillRowId()`
|
|
2125
|
+
* `FTest()`
|
|
2126
|
+
* `Fit()`
|
|
2127
|
+
* `Transform()`
|
|
2128
|
+
* `GetRowsWithMissingValues()`
|
|
2129
|
+
* `GetRowsWithoutMissingValues()`
|
|
2130
|
+
* `MovingAverage()`
|
|
2131
|
+
* `Histogram()`
|
|
2132
|
+
* `NaiveBayesPredict()`
|
|
2133
|
+
* `NaiveBayesTextClassifierPredict()`
|
|
2134
|
+
* `NGramSplitter()`
|
|
2135
|
+
* `NPath()`
|
|
2136
|
+
* `NumApply()`
|
|
2137
|
+
* `OneHotEncodingFit()`
|
|
2138
|
+
* `OneHotEncodingTransform()`
|
|
2139
|
+
* `OutlierFilterFit()`
|
|
2140
|
+
* `OutlierFilterTransform()`
|
|
2141
|
+
* `Pack()`
|
|
2142
|
+
* `PolynomialFeaturesFit()`
|
|
2143
|
+
* `PolynomialFeaturesTransform()`
|
|
2144
|
+
* `QQNorm()`
|
|
2145
|
+
* `RoundColumns()`
|
|
2146
|
+
* `RowNormalizeFit()`
|
|
2147
|
+
* `RowNormalizeTransform()`
|
|
2148
|
+
* `ScaleFit()`
|
|
2149
|
+
* `ScaleTransform()`
|
|
2150
|
+
* `Sessionize()`
|
|
2151
|
+
* `SimpleImputeFit()`
|
|
2152
|
+
* `SimpleImputeTransform()`
|
|
2153
|
+
* `StrApply()`
|
|
2154
|
+
* `StringSimilarity()`
|
|
2155
|
+
* `SVMParsePredict()`
|
|
2156
|
+
* `UniVariateStatistics()`
|
|
2157
|
+
* `Unpack()`
|
|
2158
|
+
* `WhichMax()`
|
|
2159
|
+
* `WhichMin()`
|
|
2160
|
+
* `ZTest()`
|
|
2161
|
+
|
|
2162
|
+
* ###### teradataml: General Functions
|
|
2163
|
+
* _New Functions_
|
|
2164
|
+
* Data Transfer Utility
|
|
2165
|
+
* `read_csv()`
|
|
2166
|
+
|
|
2167
|
+
* ###### Operators
|
|
2168
|
+
* _New Functions_
|
|
2169
|
+
* Table Operators
|
|
2170
|
+
* `read_nos()`
|
|
2171
|
+
* `write_nos()`
|
|
2172
|
+
|
|
2173
|
+
* ###### teradataml: Bring Your Own Model
|
|
2174
|
+
* _New Functions_
|
|
2175
|
+
* Model Cataloging
|
|
2176
|
+
* `get_license()`
|
|
2177
|
+
* `set_byom_catalog()`
|
|
2178
|
+
* `set_license()`
|
|
2179
|
+
|
|
2180
|
+
* ##### Updates
|
|
2181
|
+
* ###### teradataml: General Functions
|
|
2182
|
+
* Data Transfer Utility
|
|
2183
|
+
* `copy_to_sql()` - New argument "chunksize" added to load data in chunks.
|
|
2184
|
+
* Following Data Transfer Utility Functions updated to specify the number of Teradata sessions to open for data transfer using "open_sessions" argument:
|
|
2185
|
+
* `fastexport()`
|
|
2186
|
+
* `fastload()`
|
|
2187
|
+
* `to_pandas()`
|
|
2188
|
+
|
|
2189
|
+
* ###### Operators
|
|
2190
|
+
* Following Set Operator Functions updated to work with Geospatial data:
|
|
2191
|
+
* `concat()`
|
|
2192
|
+
* `td_intersect()`
|
|
2193
|
+
* `td_except()`
|
|
2194
|
+
* `td_minus()`
|
|
2195
|
+
|
|
2196
|
+
* ###### teradataml: Bring Your Own Model
|
|
2197
|
+
* Model cataloging APIs mentioned below are updated to use session level parameters set by `set_byom_catalog()` and `set_license()` such as table name, schema name and license details respectively.
|
|
2198
|
+
* `delete_byom()`
|
|
2199
|
+
* `list_byom()`
|
|
2200
|
+
* `retrieve_byom()`
|
|
2201
|
+
* `save_byom()`
|
|
2202
|
+
* `view_log()` - Allows user to view BYOM logs.
|
|
2203
|
+
|
|
2204
|
+
* ##### Bug Fixes
|
|
2205
|
+
* CS0733758 - `db_python_package_details()` function is fixed to support latest STO release for pip and Python aliases used.
|
|
2206
|
+
* DataFrame `print()` issue related to `Response Row size is greater than the 1MB allowed maximum.` has been fixed to print data with a large number of columns.
|
|
2207
|
+
* New parameter "chunksize" is added to `DataFrame.to_sql()` and `copy_to_sql()` to fix the issue where the function was failing with error - "Request requires too many SPOOL files.". Reducing the chunksize below the default value results in a successful operation.
|
|
2208
|
+
* `remove_context()` is fixed to remove the active connection from database.
|
|
2209
|
+
* Support added to specify the number of Teradata data transfer sessions to open for data transfer using `fastexport()` and `fastload()` functions.
|
|
2210
|
+
* `DataFrame.to_sql()` is fixed to support temporary table when default database differs from the username.
|
|
2211
|
+
* `DataFrame.to_pandas()` now by default supports data transfer using the regular method. This change allows the user to transfer data when utility throttles are configured, i.e., when the TASM configuration does not support data export using FastExport.
|
|
2212
|
+
* `save_byom()` now notifies the user if a VARCHAR column value is trimmed because the data passed to the API is longer than the length of the VARCHAR column.
|
|
2213
|
+
* Standard error can now be captured for `DataFrame.map_row()` and `DataFrame.map_partition()` when executed in LOCAL mode.
|
|
2214
|
+
* Vantage Analytic Library - Underlying SQL can be retrieved using newly added arguments "gen_sql"/"gen_sql_only" for the functions. Query can be viewed with the help of `show_query()`.
|
|
2215
|
+
* Documentation example has been fixed for `fastexport()` to show the correct import statement.
|
|
2216
|
+
|
|
2217
|
+
|
|
2218
|
+
#### teradataml 17.00.00.05
|
|
2219
|
+
Fixed [CS0733758] db_python_package_details() fails on recent STO release due to changes in pip and python aliases.
|
|
2220
|
+
|
|
2221
|
+
|
|
2222
|
+
#### teradataml 17.00.00.04
|
|
2223
|
+
* ##### New Features/Functionality
|
|
2224
|
+
* ###### Analytic Functions
|
|
2225
|
+
* Bring Your Own Analytics Functions
|
|
2226
|
+
The BYOM feature in Vantage provides flexibility to score the data in Vantage using external models using following BYOM functions:
|
|
2227
|
+
* `H2OPredict()` - Score using model trained externally in H2O and stored in Vantage.
|
|
2228
|
+
* `PMMLPredict()` - Score using model trained externally in PMML and stored in Vantage.
|
|
2229
|
+
* BYOM Model Catalog APIs
|
|
2230
|
+
* `save_byom()` - Save externally trained models in Teradata Vantage.
|
|
2231
|
+
* `delete_byom()` - Delete a model from the user specified table in Teradata Vantage.
|
|
2232
|
+
* `list_byom()` - List models.
|
|
2233
|
+
* `retrieve_byom()` - Function to retrieve a saved model.
|
|
2234
|
+
* Vantage Analytic Library Functions
|
|
2235
|
+
* _New Functions_
|
|
2236
|
+
* `XmlToHtmlReport()` - Transforms XML output of VAL functions to HTML.
|
|
2237
|
+
* ###### teradataml DataFrame
|
|
2238
|
+
* `DataFrame.window()` - Generates Window object on a teradataml DataFrame to run window aggregate functions.
|
|
2239
|
+
* `DataFrame.csum()` - Returns column-wise cumulative sum for rows in the partition of the dataframe.
|
|
2240
|
+
* `DataFrame.mavg()` - Returns moving average for the current row and the preceding rows.
|
|
2241
|
+
* `DataFrame.mdiff()` - Returns moving difference for the current row and the preceding rows.
|
|
2242
|
+
* `DataFrame.mlinreg()` - Returns moving linear regression for the current row and the preceding rows.
|
|
2243
|
+
* `DataFrame.msum()` - Returns moving sum for the current row and the preceding rows.
|
|
2244
|
+
* _Regular Aggregate Functions_
|
|
2245
|
+
* `DataFrame.corr()` - Returns the Sample Pearson product moment correlation coefficient.
|
|
2246
|
+
* `DataFrame.covar_pop()` - Returns the population covariance.
|
|
2247
|
+
* `DataFrame.covar_samp()` - Returns the sample covariance.
|
|
2248
|
+
* `DataFrame.regr_avgx()` - Returns the mean of the independent variable.
|
|
2249
|
+
* `DataFrame.regr_avgy()` - Returns the mean of the dependent variable.
|
|
2250
|
+
* `DataFrame.regr_count()` - Returns the count of the dependent and independent variable arguments.
|
|
2251
|
+
* `DataFrame.regr_intercept()` - Returns the intercept of the univariate linear regression line.
|
|
2252
|
+
* `DataFrame.regr_r2()` - Returns the coefficient of determination.
|
|
2253
|
+
* `DataFrame.regr_slope()` - Returns the slope of the univariate linear regression line.
|
|
2254
|
+
* `DataFrame.regr_sxx()` - Returns the sum of the squares of the independent variable expression.
|
|
2255
|
+
* `DataFrame.regr_sxy()` - Returns the sum of the products of the independent variable and the dependent variable.
|
|
2256
|
+
* `DataFrame.regr_syy()` - Returns the sum of the squares of the dependent variable expression.
|
|
2257
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
2258
|
+
* `ColumnExpression.window()` - Generates Window object on a teradataml DataFrameColumn to run window aggregate functions.
|
|
2259
|
+
* `ColumnExpression.desc()` - Sorts ColumnExpression in descending order.
|
|
2260
|
+
* `ColumnExpression.asc()` - Sorts ColumnExpression in ascending order.
|
|
2261
|
+
* `ColumnExpression.distinct()` - Removes duplicate value from ColumnExpression.
|
|
2262
|
+
* _Regular Aggregate Functions_
|
|
2263
|
+
* `ColumnExpression.corr()` - Returns the Sample Pearson product moment correlation coefficient.
|
|
2264
|
+
* `ColumnExpression.count()` - Returns the column-wise count.
|
|
2265
|
+
* `ColumnExpression.covar_pop()` - Returns the population covariance.
|
|
2266
|
+
* `ColumnExpression.covar_samp()` - Returns the sample covariance.
|
|
2267
|
+
* `ColumnExpression.kurtosis()` - Returns kurtosis value for a column.
|
|
2268
|
+
* `ColumnExpression.median()` - Returns column-wise median value.
|
|
2269
|
+
* `ColumnExpression.max()` - Returns the column-wise max value.
|
|
2270
|
+
* `ColumnExpression.mean()` - Returns the column-wise average value.
|
|
2271
|
+
* `ColumnExpression.min()` - Returns the column-wise min value.
|
|
2272
|
+
* `ColumnExpression.regr_avgx()` - Returns the mean of the independent variable.
|
|
2273
|
+
* `ColumnExpression.regr_avgy()` - Returns the mean of the dependent variable.
|
|
2274
|
+
* `ColumnExpression.regr_count()` - Returns the count of the dependent and independent variable arguments.
|
|
2275
|
+
* `ColumnExpression.regr_intercept()` - Returns the intercept of the univariate linear regression line.
|
|
2276
|
+
* `ColumnExpression.regr_r2()` - Returns the coefficient of determination.
|
|
2277
|
+
* `ColumnExpression.regr_slope()` - Returns the slope of the univariate linear regression line.
|
|
2278
|
+
* `ColumnExpression.regr_sxx()` - Returns the sum of the squares of the independent variable expression.
|
|
2279
|
+
* `ColumnExpression.regr_sxy()` - Returns the sum of the products of the independent variable and the dependent variable.
|
|
2280
|
+
* `ColumnExpression.regr_syy()` - Returns the sum of the squares of the dependent variable expression.
|
|
2281
|
+
* `ColumnExpression.skew()` - Returns skew value for a column.
|
|
2282
|
+
* `ColumnExpression.std()` - Returns the column-wise population/sample standard deviation.
|
|
2283
|
+
* `ColumnExpression.sum()` - Returns the column-wise sum.
|
|
2284
|
+
* `ColumnExpression.var()` - Returns the column-wise population/sample variance.
|
|
2285
|
+
* `ColumnExpression.percentile()` - Returns the column-wise percentile.
|
|
2286
|
+
* ###### teradataml Window - Window Aggregate Functions
|
|
2287
|
+
Following set of _Window Aggregate Functions_ return the results over a specified window which can be of any type:
|
|
2288
|
+
* Cumulative/Expanding window
|
|
2289
|
+
* Moving/Rolling window
|
|
2290
|
+
* Contracting/Remaining window
|
|
2291
|
+
* Grouping window
|
|
2292
|
+
_Window Aggregate Functions_
|
|
2293
|
+
* `Window.corr()` - Returns the Sample Pearson product moment correlation coefficient.
|
|
2294
|
+
* `Window.count()` - Returns the count.
|
|
2295
|
+
* `Window.covar_pop()` - Returns the population covariance.
|
|
2296
|
+
* `Window.covar_samp()` - Returns the sample covariance.
|
|
2297
|
+
* `Window.cume_dist()` - Returns the cumulative distribution of values.
|
|
2298
|
+
* `Window.dense_rank()` - Returns the ordered ranking of all the rows.
|
|
2299
|
+
* `Window.first_value()` - Returns the first value of an ordered set of values.
|
|
2300
|
+
* `Window.lag()` - Returns data from the row preceding the current row at a specified offset value.
|
|
2301
|
+
* `Window.last_value()` - Returns the last value of an ordered set of values.
|
|
2302
|
+
* `Window.lead()` - Returns data from the row following the current row at a specified offset value.
|
|
2303
|
+
* `Window.max()` - Returns the column-wise max value.
|
|
2304
|
+
* `Window.mean()` - Returns the column-wise average value.
|
|
2305
|
+
* `Window.min()` - Returns the column-wise min value.
|
|
2306
|
+
* `Window.percent_rank()` - Returns the relative rank of all the rows.
|
|
2307
|
+
* `Window.rank()` - Returns the rank (1 … n) of all the rows.
|
|
2308
|
+
* `Window.regr_avgx()` - Returns the mean of the independent variable arguments.
|
|
2309
|
+
* `Window.regr_avgy()` - Returns the mean of the dependent variable arguments.
|
|
2310
|
+
* `Window.regr_count()` - Returns the count of the dependent and independent variable arguments.
|
|
2311
|
+
* `Window.regr_intercept()` - Returns the intercept of the univariate linear regression line.
|
|
2312
|
+
* `Window.regr_r2()` - Returns the coefficient of determination.
|
|
2313
|
+
* `Window.regr_slope()` - Returns the slope of the univariate linear regression line.
|
|
2314
|
+
* `Window.regr_sxx()` - Returns the sum of the squares of the independent variable expression.
|
|
2315
|
+
* `Window.regr_sxy()` - Returns the sum of the products of the independent variable and the dependent variable.
|
|
2316
|
+
* `Window.regr_syy()` - Returns the sum of the squares of the dependent variable expression.
|
|
2317
|
+
* `Window.row_number()` - Returns the sequential row number.
|
|
2318
|
+
* `Window.std()` - Returns the column-wise population/sample standard deviation.
|
|
2319
|
+
* `Window.sum()` - Returns the column-wise sum.
|
|
2320
|
+
* `Window.var()` - Returns the column-wise population/sample variance.
|
|
2321
|
+
* ###### General functions
|
|
2322
|
+
* _New functions_
|
|
2323
|
+
* `fastexport()` - Exports teradataml DataFrame to Pandas DataFrame using FastExport data transfer protocol.
|
|
2324
|
+
* ###### teradataml Options
|
|
2325
|
+
* Display Options
|
|
2326
|
+
* `display.blob_length`
|
|
2327
|
+
Specifies default display length of BLOB column in teradataml DataFrame.
|
|
2328
|
+
* Configuration Options
|
|
2329
|
+
* `configure.temp_table_database`
|
|
2330
|
+
Specifies database name for storing the tables created internally.
|
|
2331
|
+
* `configure.temp_view_database`
|
|
2332
|
+
Specifies database name for storing the views created internally.
|
|
2333
|
+
* `configure.byom_install_location`
|
|
2334
|
+
Specifies the install location for the BYOM functions.
|
|
2335
|
+
* `configure.val_install_location`
|
|
2336
|
+
Specifies the install location for the Vantage Analytic Library functions.
|
|
2337
|
+
* ##### Updates
|
|
2338
|
+
* ###### teradataml DataFrame
|
|
2339
|
+
* `to_pandas()` -
|
|
2340
|
+
* Support added to transfer data to Pandas DataFrame using fastexport protocol improving the performance.
|
|
2341
|
+
* Support added for other arguments similar to Pandas `read_sql()`:
|
|
2342
|
+
* `coerce_float`
|
|
2343
|
+
* `parse_dates`
|
|
2344
|
+
* ###### Analytic functions
|
|
2345
|
+
* Vantage Analytic Library Functions
|
|
2346
|
+
* Support added to accept datetime.date object for literals/values in
|
|
2347
|
+
following transformation functions:
|
|
2348
|
+
* `FillNa()`
|
|
2349
|
+
* `Binning()`
|
|
2350
|
+
* `OneHotEncoder()`
|
|
2351
|
+
* `LabelEncoder()`
|
|
2352
|
+
* All transformation functions now support accepting
|
|
2353
|
+
teradatasqlalchemy datatypes as input to "datatype" argument for
|
|
2354
|
+
casting the result.
|
|
2355
|
+
* ##### Bug Fixes.
|
|
2356
|
+
* CS0249633 - Support added for teradataml to work with user/database/tablename
|
|
2357
|
+
containing period (.).
|
|
2358
|
+
* CS0086594 - Use of dbc.tablesvx versus dbc.tablesv in teradatasqlalchemy.
|
|
2359
|
+
* IPython integration to print the teradataml DataFrames in pretty format.
|
|
2360
|
+
* teradataml DataFrame APIs now support column names same as that of Teradata
|
|
2361
|
+
reserved keywords.
|
|
2362
|
+
* Issue has been fixed for duplicate rows being loaded via teradataml
|
|
2363
|
+
fastload() API.
|
|
2364
|
+
* VAL - Empty string now can be passed as input for recoding values using
|
|
2365
|
+
LabelEncoder.
|
|
2366
|
+
* teradataml extension with SQLAlchemy functions:
|
|
2367
|
+
* mod() function is fixed to return correct datatype.
|
|
2368
|
+
* sum() function is fixed to return correct datatype.
|
|
2369
|
+
|
|
2370
|
+
|
|
2371
|
+
#### teradataml 17.00.00.03
|
|
2372
|
+
- New release of SQLAlchemy 1.4.x introduced a backward compatibility issue. A fix has been carried out so that teradataml can support the latest SQLAlchemy changes.
|
|
2373
|
+
- Other minor bug fixes.
|
|
2374
|
+
|
|
2375
|
+
#### teradataml 17.00.00.02
|
|
2376
|
+
Fixed the internal library load issue related to the GCC version discrepancies on CentOS platform.
|
|
2377
|
+
|
|
2378
|
+
#### teradataml 17.00.00.01
|
|
2379
|
+
* ##### New Features/Functionality
|
|
2380
|
+
* ###### Analytic Functions
|
|
2381
|
+
* Vantage Analytic Library
|
|
2382
|
+
teradataml now supports executing analytic functions offered by Vantage Analytic Library.
|
|
2383
|
+
These functions are available via new 'valib' sub-package of teradataml.
|
|
2384
|
+
Following functions are added as part of this:
|
|
2385
|
+
* Association Rules:
|
|
2386
|
+
* `Association()`
|
|
2387
|
+
* Descriptive Statistics:
|
|
2388
|
+
* `AdaptiveHistogram()`
|
|
2389
|
+
* `Explore()`
|
|
2390
|
+
* `Frequency()`
|
|
2391
|
+
* `Histogram()`
|
|
2392
|
+
* `Overlaps()`
|
|
2393
|
+
* `Statistics()`
|
|
2394
|
+
* `TextAnalyzer()`
|
|
2395
|
+
* `Values()`
|
|
2396
|
+
* Decision Tree:
|
|
2397
|
+
* `DecisionTree()`
|
|
2398
|
+
* `DecisionTreePredict()`
|
|
2399
|
+
* `DecisionTreeEvaluator()`
|
|
2400
|
+
* Fast K-Means Clustering:
|
|
2401
|
+
* `KMeans()`
|
|
2402
|
+
* `KMeansPredict()`
|
|
2403
|
+
* Linear Regression:
|
|
2404
|
+
* `LinReg()`
|
|
2405
|
+
* `LinRegPredict()`
|
|
2406
|
+
* Logistic Regression:
|
|
2407
|
+
* `LogReg()`
|
|
2408
|
+
* `LogRegPredict()`
|
|
2409
|
+
* `LogRegEvaluator()`
|
|
2410
|
+
* Factor Analysis:
|
|
2411
|
+
* `PCA()`
|
|
2412
|
+
* `PCAPredict()`
|
|
2413
|
+
* `PCAEvaluator()`
|
|
2414
|
+
* Matrix Building:
|
|
2415
|
+
* `Matrix()`
|
|
2416
|
+
* Statistical Tests:
|
|
2417
|
+
* `BinomialTest()`
|
|
2418
|
+
* `ChiSquareTest()`
|
|
2419
|
+
* `KSTest()`
|
|
2420
|
+
* `ParametricTest()`
|
|
2421
|
+
* `RankTest()`
|
|
2422
|
+
* Variable Transformation:
|
|
2423
|
+
* `Transform()`
|
|
2424
|
+
* Transformation Techniques supported for variable transformation:
|
|
2425
|
+
* `Binning()` - Perform bin coding to replace a continuous numeric column with a
|
|
2426
|
+
categorical one to produce ordinal values.
|
|
2427
|
+
* `Derive()` - Perform free-form transformation done using arithmetic formula.
|
|
2428
|
+
* `FillNa()` - Perform missing value/null replacement transformations.
|
|
2429
|
+
* `LabelEncoder()` - Re-express categorical column values into a new coding scheme.
|
|
2430
|
+
* `MinMaxScalar()` - Rescale data limiting the upper and lower boundaries.
|
|
2431
|
+
* `OneHotEncoder()` - Re-express a categorical data element as one or more
|
|
2432
|
+
numeric data elements, creating a binary numeric field for each
|
|
2433
|
+
categorical data value.
|
|
2434
|
+
* `Retain()` - Copy one or more columns into the final analytic data set.
|
|
2435
|
+
* `Sigmoid()` - Rescale data using sigmoid or s-shaped functions.
|
|
2436
|
+
* `ZScore()` - Rescale data using Z-Score values.
|
|
2437
|
+
* ML Engine Functions (mle)
|
|
2438
|
+
* Correlation2
|
|
2439
|
+
* NaiveBayesTextClassifier2
|
|
2440
|
+
* ###### DataFrame
|
|
2441
|
+
* _New Functions_
|
|
2442
|
+
* `DataFrame.map_row()` - Function to apply a user defined function to each row in the
|
|
2443
|
+
teradataml DataFrame.
|
|
2444
|
+
* `DataFrame.map_partition()` - Function to apply a user defined function to a group or
|
|
2445
|
+
partition of rows in the teradataml DataFrame.
|
|
2446
|
+
* _New Property_
|
|
2447
|
+
* `DataFrame.tdtypes` - Get the teradataml DataFrame metadata containing column names and
|
|
2448
|
+
corresponding teradatasqlalchemy types.
|
|
2449
|
+
* ###### General functions
|
|
2450
|
+
* _New functions_
|
|
2451
|
+
* Database Utility Functions
|
|
2452
|
+
* `db_python_package_details()` - Lists the details of Python packages installed on Vantage.
|
|
2453
|
+
* General Utility Functions
|
|
2454
|
+
* `print_options()`
|
|
2455
|
+
* `view_log()`
|
|
2456
|
+
* `setup_sandbox_env()`
|
|
2457
|
+
* `copy_files_from_container()`
|
|
2458
|
+
* `cleanup_sandbox_env()`
|
|
2459
|
+
* ##### Updates
|
|
2460
|
+
* ###### `create_context()`
|
|
2461
|
+
* Supports all connection parameters supported by teradatasql.connect().
|
|
2462
|
+
* ###### Script
|
|
2463
|
+
* `test_script()` can now be executed in 'local' mode, i.e., outside of the sandbox.
|
|
2464
|
+
* `Script.setup_sto_env()` is deprecated. Use `setup_sandbox_env()` function instead.
|
|
2465
|
+
* Added support for using "quotechar" argument.
|
|
2466
|
+
* ###### Analytic functions
|
|
2467
|
+
* _Updates_
|
|
2468
|
+
* Visit teradataml User Guide to know more about the updates done to ML Engine analytic
|
|
2469
|
+
functions. Following types of updates are done to several functions:
|
|
2470
|
+
* New arguments are added, which are supported only on Vantage Version 1.3.
|
|
2471
|
+
* Default value has been updated for a few function arguments.
|
|
2472
|
+
* Few arguments were required, but now they are optional.
|
|
2473
|
+
* ##### Minor Bug Fixes.
|
|
2474
|
+
|
|
2475
|
+
#### teradataml 17.00.00.00
|
|
2476
|
+
* ##### New Features/Functionality
|
|
2477
|
+
* ###### Model Cataloging - Functionality to catalog model metadata and related information in the Model Catalog.
|
|
2478
|
+
* `save_model()` - Save a teradataml Analytic Function model.
|
|
2479
|
+
* `retrieve_model()` - Retrieve a saved model.
|
|
2480
|
+
* `list_model()` - List accessible models.
|
|
2481
|
+
* `describe_model()` - List the details of a model.
|
|
2482
|
+
* `delete_model()` - Remove a model from Model Catalog.
|
|
2483
|
+
* `publish_model()` - Share a model.
|
|
2484
|
+
* ###### Script - An interface to the SCRIPT table operator object in the Advanced SQL Engine.
|
|
2485
|
+
Interface offers execution in two modes:
|
|
2486
|
+
* Test/Debug - to test user scripts locally in a containerized environment.
|
|
2487
|
+
Supporting methods:
|
|
2488
|
+
* `setup_sto_env()` - Set up test environment.
|
|
2489
|
+
* `test_script()` - Test user script in containerized environment.
|
|
2490
|
+
* `set_data()` - Set test data parameters.
|
|
2491
|
+
* In-Database Script Execution - to execute user scripts in database.
|
|
2492
|
+
Supporting methods:
|
|
2493
|
+
* `execute_script()` - Execute user script in Vantage.
|
|
2494
|
+
* `install_file()` - Install or replace file in Database.
|
|
2495
|
+
* `remove_file()` - Remove installed file from Database.
|
|
2496
|
+
* `set_data()` - Set test data parameters.
|
|
2497
|
+
* ###### DataFrame
|
|
2498
|
+
* `DataFrame.show_query()` - Show underlying query for DataFrame.
|
|
2499
|
+
* Regular Aggregates
|
|
2500
|
+
* _New functions_
|
|
2501
|
+
* `kurtosis()` - Calculate the kurtosis value.
|
|
2502
|
+
* `skew()` - Calculate the skewness of the distribution.
|
|
2503
|
+
* _Updates_\
|
|
2504
|
+
New argument `distinct` is added to following aggregates to exclude duplicate values.
|
|
2505
|
+
* `count()`
|
|
2506
|
+
* `max()`
|
|
2507
|
+
* `mean()`
|
|
2508
|
+
* `min()`
|
|
2509
|
+
* `sum()`
|
|
2510
|
+
* `std()`
|
|
2511
|
+
* New argument `population` is added to calculate the population standard deviation.
|
|
2512
|
+
* `var()`
|
|
2513
|
+
* New argument `population` is added to calculate the population variance.
|
|
2514
|
+
* Time Series Aggregates
|
|
2515
|
+
* _New functions_
|
|
2516
|
+
* `kurtosis()` - Calculate the kurtosis value.
|
|
2517
|
+
* `count()` - Get the total number of values.
|
|
2518
|
+
* `max()` - Calculate the maximum value.
|
|
2519
|
+
* `mean()` - Calculate the average value.
|
|
2520
|
+
* `min()` - Calculate the minimum value.
|
|
2521
|
+
* `percentile()` - Calculate the desired percentile.
|
|
2522
|
+
* `skew()` - Calculate the skewness of the distribution.
|
|
2523
|
+
* `sum()` - Calculate the column-wise sum value.
|
|
2524
|
+
* `std()` - Calculate the sample and population standard deviation.
|
|
2525
|
+
* `var()` - Calculate the sample and population variance.
|
|
2526
|
+
* ###### General functions
|
|
2527
|
+
* _New functions_
|
|
2528
|
+
* Database Utility Functions
|
|
2529
|
+
* `db_drop_table()`
|
|
2530
|
+
* `db_drop_view()`
|
|
2531
|
+
* `db_list_tables()`
|
|
2532
|
+
* Vantage File Management Functions
|
|
2533
|
+
* `install_file()` - Install a file in Database.
|
|
2534
|
+
* `remove_file()` - Remove an installed file from Database.
|
|
2535
|
+
* _Updates_
|
|
2536
|
+
* `create_context()`
|
|
2537
|
+
* Support added for Stored Password Protection feature.
|
|
2538
|
+
* Kerberos authentication bug fix.
|
|
2539
|
+
* New argument `database` added to the `create_context()` API, which allows the user to specify the database to connect to.
|
|
2540
|
+
* ###### Analytic functions
|
|
2541
|
+
* _New functions_
|
|
2542
|
+
* `Betweenness`
|
|
2543
|
+
* `Closeness`
|
|
2544
|
+
* `FMeasure`
|
|
2545
|
+
* `FrequentPaths`
|
|
2546
|
+
* `IdentityMatch`
|
|
2547
|
+
* `Interpolator`
|
|
2548
|
+
* `ROC`
|
|
2549
|
+
* _Updates_
|
|
2550
|
+
* New methods are added to all analytic functions
|
|
2551
|
+
* `show_query()`
|
|
2552
|
+
* `get_build_time()`
|
|
2553
|
+
* `get_prediction_type()`
|
|
2554
|
+
* `get_target_column()`
|
|
2555
|
+
* New properties are added to analytic function's Formula argument
|
|
2556
|
+
* `response_column`
|
|
2557
|
+
* `numeric_columns`
|
|
2558
|
+
* `categorical_columns`
|
|
2559
|
+
* `all_columns`
|
|
2560
|
+
|
|
2561
|
+
#### teradataml 16.20.00.06
|
|
2562
|
+
Fixed the DataFrame data display corruption issue observed with certain analytic functions.
|
|
2563
|
+
|
|
2564
|
+
#### teradataml 16.20.00.05
|
|
2565
|
+
Compatible with Vantage 1.1.1.\
|
|
2566
|
+
The following ML Engine (`teradataml.analytics.mle`) functions have new and/or updated arguments to support the Vantage version:
|
|
2567
|
+
* `AdaBoostPredict`
|
|
2568
|
+
* `DecisionForestPredict`
|
|
2569
|
+
* `DecisionTreePredict`
|
|
2570
|
+
* `GLMPredict`
|
|
2571
|
+
* `LDA`
|
|
2572
|
+
* `NaiveBayesPredict`
|
|
2573
|
+
* `NaiveBayesTextClassifierPredict`
|
|
2574
|
+
* `SVMDensePredict`
|
|
2575
|
+
* `SVMSparse`
|
|
2576
|
+
* `SVMSparsePredict`
|
|
2577
|
+
* `XGBoostPredict`
|
|
2578
|
+
|
|
2579
|
+
#### teradataml 16.20.00.04
|
|
2580
|
+
* ##### Improvements
|
|
2581
|
+
* DataFrame creation is now quicker, impacting many APIs and Analytic functions.
|
|
2582
|
+
* Improved performance by reducing the number of intermediate queries issued to Teradata Vantage when not required.
|
|
2583
|
+
* The number of queries is reduced by combining multiple operations into a single step whenever possible, unless the user expects or demands to see the intermediate results.
|
|
2584
|
+
* The performance improvement is almost proportional to the number of chained and unexecuted operations on a teradataml DataFrame.
|
|
2585
|
+
* Reduced number of intermediate internal objects created on Vantage.
|
|
2586
|
+
* ##### New Features/Functionality
|
|
2587
|
+
* ###### General functions
|
|
2588
|
+
* _New functions_
|
|
2589
|
+
* `show_versions()` - to list the version of teradataml and dependencies installed.
|
|
2590
|
+
* `fastload()` - for high performance data loading of large amounts of data into a table on Vantage. Requires `teradatasql` version `16.20.0.48` or above.
|
|
2591
|
+
* Set operators:
|
|
2592
|
+
* `concat`
|
|
2593
|
+
* `td_intersect`
|
|
2594
|
+
* `td_except`
|
|
2595
|
+
* `td_minus`
|
|
2596
|
+
* `case()` - to help construct SQL CASE based expressions.
|
|
2597
|
+
* _Updates_
|
|
2598
|
+
* `copy_to_sql`
|
|
2599
|
+
* Added support to `copy_to_sql` to save multi-level index.
|
|
2600
|
+
* Corrected the type mapping for index when being saved.
|
|
2601
|
+
* `create_context()` updated to support 'JWT' logon mechanism.
|
|
2602
|
+
* ###### Analytic functions
|
|
2603
|
+
* _New functions_
|
|
2604
|
+
* `NERTrainer`
|
|
2605
|
+
* `NERExtractor`
|
|
2606
|
+
* `NEREvaluator`
|
|
2607
|
+
* `GLML1L2`
|
|
2608
|
+
* `GLML1L2Predict`
|
|
2609
|
+
* _Updates_
|
|
2610
|
+
* Added support to categorize numeric columns as categorical while using formula - `as_categorical()` in the `teradataml.common.formula` module.
|
|
2611
|
+
* ###### DataFrame
|
|
2612
|
+
* Added support to create DataFrame from Volatile and Primary Time Index tables.
|
|
2613
|
+
* `DataFrame.sample()` - to sample data.
|
|
2614
|
+
* `DataFrame.index` - Property to access `index_label` of DataFrame.
|
|
2615
|
+
* Functionality to process Time Series Data
|
|
2616
|
+
* Grouping/Resampling time series data:
|
|
2617
|
+
* `groupby_time()`
|
|
2618
|
+
* `resample()`
|
|
2619
|
+
* Time Series Aggregates:
|
|
2620
|
+
* `bottom()`
|
|
2621
|
+
* `count()`
|
|
2622
|
+
* `describe()`
|
|
2623
|
+
* `delta_t()`
|
|
2624
|
+
* `mad()`
|
|
2625
|
+
* `median()`
|
|
2626
|
+
* `mode()`
|
|
2627
|
+
* `first()`
|
|
2628
|
+
* `last()`
|
|
2629
|
+
* `top()`
|
|
2630
|
+
* DataFrame API and method argument validation added.
|
|
2631
|
+
* `DataFrame.info()` - Default value for `null_counts` argument updated from `None` to `False`.
|
|
2632
|
+
* `DataFrame.merge()` updated to accept column expressions along with column names for the `on`, `left_on`, and `right_on` arguments.
|
|
2633
|
+
* ###### DataFrame Column/ColumnExpression methods
|
|
2634
|
+
* `cast()` - to help cast the column to a specified type.
|
|
2635
|
+
* `isin()` and `~isin()` - to check the presence of values in a column.
|
|
2636
|
+
* ##### Removed deprecated Analytic functions
|
|
2637
|
+
* All the deprecated Analytic functions under the `teradataml.analytics` module have been removed.
|
|
2638
|
+
Newer versions of the functions are available under the `teradataml.analytics.mle` and the `teradataml.analytics.sqle` modules.
|
|
2639
|
+
The modules removed are:
|
|
2640
|
+
* `teradataml.analytics.Antiselect`
|
|
2641
|
+
* `teradataml.analytics.Arima`
|
|
2642
|
+
* `teradataml.analytics.ArimaPredictor`
|
|
2643
|
+
* `teradataml.analytics.Attribution`
|
|
2644
|
+
* `teradataml.analytics.ConfusionMatrix`
|
|
2645
|
+
* `teradataml.analytics.CoxHazardRatio`
|
|
2646
|
+
* `teradataml.analytics.CoxPH`
|
|
2647
|
+
* `teradataml.analytics.CoxSurvival`
|
|
2648
|
+
* `teradataml.analytics.DecisionForest`
|
|
2649
|
+
* `teradataml.analytics.DecisionForestEvaluator`
|
|
2650
|
+
* `teradataml.analytics.DecisionForestPredict`
|
|
2651
|
+
* `teradataml.analytics.DecisionTree`
|
|
2652
|
+
* `teradataml.analytics.DecisionTreePredict`
|
|
2653
|
+
* `teradataml.analytics.GLM`
|
|
2654
|
+
* `teradataml.analytics.GLMPredict`
|
|
2655
|
+
* `teradataml.analytics.KMeans`
|
|
2656
|
+
* `teradataml.analytics.NGrams`
|
|
2657
|
+
* `teradataml.analytics.NPath`
|
|
2658
|
+
* `teradataml.analytics.NaiveBayes`
|
|
2659
|
+
* `teradataml.analytics.NaiveBayesPredict`
|
|
2660
|
+
* `teradataml.analytics.NaiveBayesTextClassifier`
|
|
2661
|
+
* `teradataml.analytics.NaiveBayesTextClassifierPredict`
|
|
2662
|
+
* `teradataml.analytics.Pack`
|
|
2663
|
+
* `teradataml.analytics.SVMSparse`
|
|
2664
|
+
* `teradataml.analytics.SVMSparsePredict`
|
|
2665
|
+
* `teradataml.analytics.SentenceExtractor`
|
|
2666
|
+
* `teradataml.analytics.Sessionize`
|
|
2667
|
+
* `teradataml.analytics.TF`
|
|
2668
|
+
* `teradataml.analytics.TFIDF`
|
|
2669
|
+
* `teradataml.analytics.TextTagger`
|
|
2670
|
+
* `teradataml.analytics.TextTokenizer`
|
|
2671
|
+
* `teradataml.analytics.Unpack`
|
|
2672
|
+
* `teradataml.analytics.VarMax`
|
|
2673
|
+
|
|
2674
|
+
#### teradataml 16.20.00.03
|
|
2675
|
+
* Fixed the garbage collection issue observed with `remove_context()` when context is created using a SQLAlchemy engine.
|
|
2676
|
+
* Added 4 new Advanced SQL Engine (was NewSQL Engine) analytic functions supported only on Vantage 1.1:
|
|
2677
|
+
* `Antiselect`, `Pack`, `StringSimilarity`, and `Unpack`.
|
|
2678
|
+
* Updated the Machine Learning Engine `NGrams` function to work with Vantage 1.1.
|
|
2679
|
+
|
|
2680
|
+
#### teradataml 16.20.00.02
|
|
2681
|
+
* Python version 3.4.x will no longer be supported. The Python versions supported are 3.5.x, 3.6.x, and 3.7.x.
|
|
2682
|
+
* Major issue with the usage of formula argument in analytic functions with Python3.7 has been fixed, allowing this package to be used with Python3.7 or later.
|
|
2683
|
+
* Configurable alias name support for analytic functions has been added.
|
|
2684
|
+
* Support added to create_context (connect to Teradata Vantage) with different logon mechanisms.
|
|
2685
|
+
Logon mechanisms supported are: 'TD2', 'TDNEGO', 'LDAP' & 'KRB5'.
|
|
2686
|
+
* The copy_to_sql function and the DataFrame 'to_sql' method now provide the following additional functionality:
|
|
2687
|
+
* Create Primary Time Index tables.
|
|
2688
|
+
* Create set/multiset tables.
|
|
2689
|
+
* New DataFrame methods are added: 'median', 'var', 'squeeze', 'sort_index', 'concat'.
|
|
2690
|
+
* DataFrame method 'join' is now updated to make use of ColumnExpressions (df.column_name) for the 'on' clause as opposed to strings.
|
|
2691
|
+
* Series is supported as a first class object by calling squeeze on DataFrame.
|
|
2692
|
+
* Methods supported by teradataml Series are: 'head', 'unique', 'name', '\_\_repr__'.
|
|
2693
|
+
* Binary operations with teradataml Series are not yet supported. Try using Columns from teradataml.DataFrames.
|
|
2694
|
+
* Sample datasets and commands to load the same have been provided in the function examples.
|
|
2695
|
+
* New configuration property 'column_casesensitive_handler' has been added. It is useful when working with case-sensitive columns.
|
|
2696
|
+
|
|
2697
|
+
#### teradataml 16.20.00.01
|
|
2698
|
+
* New support has been added for Linux distributions: Red Hat 7+, Ubuntu 16.04+, CentOS 7+, SLES12+.
|
|
2699
|
+
* 16.20.00.01 now has over 100 analytic functions. These functions have been organized into their own packages for better control over which engine to execute the analytic function on. Due to these namespace changes, the old analytic functions have been deprecated and will be removed in a future release. See the Deprecations section in the Teradata Python Package User Guide for more information.
|
|
2700
|
+
* New DataFrame methods `shape`, `iloc`, `describe`, `get_values`, `merge`, and `tail`.
|
|
2701
|
+
* New Series methods for NA checking (`isnull`, `notnull`) and string processing (`lower`, `strip`, `contains`).
|
|
2702
|
+
|
|
2703
|
+
#### teradataml 16.20.00.00
|
|
2704
|
+
* `teradataml 16.20.00.00` is the first release version. Please refer to the _Teradata Python Package User Guide_ for a list of Limitations and Usage Considerations.
|
|
2705
|
+
|
|
2706
|
+
## Installation and Requirements
|
|
2707
|
+
|
|
2708
|
+
### Package Requirements:
|
|
2709
|
+
* Python 3.5 or later
|
|
2710
|
+
|
|
2711
|
+
Note: 32-bit Python is not supported.
|
|
2712
|
+
|
|
2713
|
+
### Minimum System Requirements:
|
|
2714
|
+
* Windows 7 (64Bit) or later
|
|
2715
|
+
* macOS 10.9 (64Bit) or later
|
|
2716
|
+
* Red Hat 7 or later versions
|
|
2717
|
+
* Ubuntu 16.04 or later versions
|
|
2718
|
+
* CentOS 7 or later versions
|
|
2719
|
+
* SLES 12 or later versions
|
|
2720
|
+
* Teradata Vantage Advanced SQL Engine:
|
|
2721
|
+
* Advanced SQL Engine 16.20 Feature Update 1 or later
|
|
2722
|
+
* For a Teradata Vantage system with the ML Engine:
|
|
2723
|
+
* Teradata Machine Learning Engine 08.00.03.01 or later
|
|
2724
|
+
|
|
2725
|
+
### Installation
|
|
2726
|
+
|
|
2727
|
+
Use pip to install the Teradata Python Package for Advanced Analytics.
|
|
2728
|
+
|
|
2729
|
+
Platform | Command
|
|
2730
|
+
-------------- | ---
|
|
2731
|
+
macOS/Linux | `pip install teradataml`
|
|
2732
|
+
Windows | `py -3 -m pip install teradataml`
|
|
2733
|
+
|
|
2734
|
+
When upgrading to a new version of the Teradata Python Package, you may need to use pip install's `--no-cache-dir` option to force the download of the new version.
|
|
2735
|
+
|
|
2736
|
+
Platform | Command
|
|
2737
|
+
-------------- | ---
|
|
2738
|
+
macOS/Linux | `pip install --no-cache-dir -U teradataml`
|
|
2739
|
+
Windows | `py -3 -m pip install --no-cache-dir -U teradataml`
|
|
2740
|
+
|
|
2741
|
+
## Using the Teradata Python Package
|
|
2742
|
+
|
|
2743
|
+
Your Python script must import the `teradataml` package in order to use the Teradata Python Package:
|
|
2744
|
+
|
|
2745
|
+
```
|
|
2746
|
+
>>> import teradataml as tdml
|
|
2747
|
+
>>> from teradataml import create_context, remove_context
|
|
2748
|
+
>>> create_context(host = 'hostname', username = 'user', password = 'password')
|
|
2749
|
+
>>> df = tdml.DataFrame('iris')
|
|
2750
|
+
>>> df
|
|
2751
|
+
|
|
2752
|
+
SepalLength SepalWidth PetalLength PetalWidth Name
|
|
2753
|
+
0 5.1 3.8 1.5 0.3 Iris-setosa
|
|
2754
|
+
1 6.9 3.1 5.1 2.3 Iris-virginica
|
|
2755
|
+
2 5.1 3.5 1.4 0.3 Iris-setosa
|
|
2756
|
+
3 5.9 3.0 4.2 1.5 Iris-versicolor
|
|
2757
|
+
4 6.0 2.9 4.5 1.5 Iris-versicolor
|
|
2758
|
+
5 5.0 3.5 1.3 0.3 Iris-setosa
|
|
2759
|
+
6 5.5 2.4 3.8 1.1 Iris-versicolor
|
|
2760
|
+
7 6.9 3.2 5.7 2.3 Iris-virginica
|
|
2761
|
+
8 4.4 3.0 1.3 0.2 Iris-setosa
|
|
2762
|
+
9 5.8 2.7 5.1 1.9 Iris-virginica
|
|
2763
|
+
|
|
2764
|
+
>>> df = df.select(['Name', 'SepalLength', 'PetalLength'])
|
|
2765
|
+
>>> df
|
|
2766
|
+
|
|
2767
|
+
Name SepalLength PetalLength
|
|
2768
|
+
0 Iris-versicolor 6.0 4.5
|
|
2769
|
+
1 Iris-versicolor 5.5 3.8
|
|
2770
|
+
2 Iris-virginica 6.9 5.7
|
|
2771
|
+
3 Iris-setosa 5.1 1.4
|
|
2772
|
+
4 Iris-setosa 5.1 1.5
|
|
2773
|
+
5 Iris-virginica 5.8 5.1
|
|
2774
|
+
6 Iris-virginica 6.9 5.1
|
|
2775
|
+
7 Iris-setosa 5.1 1.4
|
|
2776
|
+
8 Iris-virginica 7.7 6.7
|
|
2777
|
+
9 Iris-setosa 5.0 1.3
|
|
2778
|
+
|
|
2779
|
+
>>> df = df[(df.Name == 'Iris-setosa') & (df.PetalLength > 1.5)]
|
|
2780
|
+
>>> df
|
|
2781
|
+
|
|
2782
|
+
Name SepalLength PetalLength
|
|
2783
|
+
0 Iris-setosa 4.8 1.9
|
|
2784
|
+
1 Iris-setosa 5.4 1.7
|
|
2785
|
+
2 Iris-setosa 5.7 1.7
|
|
2786
|
+
3 Iris-setosa 5.0 1.6
|
|
2787
|
+
4 Iris-setosa 5.1 1.9
|
|
2788
|
+
5 Iris-setosa 4.8 1.6
|
|
2789
|
+
6 Iris-setosa 4.7 1.6
|
|
2790
|
+
7 Iris-setosa 5.1 1.6
|
|
2791
|
+
8 Iris-setosa 5.1 1.7
|
|
2792
|
+
9 Iris-setosa 4.8 1.6
|
|
2793
|
+
```
|
|
2794
|
+
|
|
2795
|
+
## Documentation
|
|
2796
|
+
|
|
2797
|
+
General product information, including installation instructions, is available in the [Teradata Documentation website](https://docs.teradata.com/search/documents?query=package+python+-lake&filters=category~%2522Programming+Reference%2522_%2522User+Guide%2522*prodname~%2522Teradata+Package+for+Python%2522_%2522Teradata+Python+Package%2522&sort=last_update&virtual-field=title_only&content-lang=)
|
|
2798
|
+
|
|
2799
|
+
## License
|
|
2800
|
+
|
|
2801
|
+
Use of the Teradata Python Package is governed by the *License Agreement for the Teradata Python Package for Advanced Analytics*.
|
|
2802
|
+
After installation, the `LICENSE` and `LICENSE-3RD-PARTY` files are located in the `teradataml` directory of the Python installation directory.
|
|
2803
|
+
|
|
2804
|
+
|