teradataml 20.0.0.0__py3-none-any.whl → 20.0.0.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- teradataml/LICENSE-3RD-PARTY.pdf +0 -0
- teradataml/LICENSE.pdf +0 -0
- teradataml/README.md +183 -0
- teradataml/__init__.py +6 -3
- teradataml/_version.py +2 -2
- teradataml/analytics/__init__.py +3 -2
- teradataml/analytics/analytic_function_executor.py +275 -40
- teradataml/analytics/analytic_query_generator.py +92 -0
- teradataml/analytics/byom/__init__.py +3 -2
- teradataml/analytics/json_parser/metadata.py +1 -0
- teradataml/analytics/json_parser/utils.py +17 -21
- teradataml/analytics/meta_class.py +40 -1
- teradataml/analytics/sqle/DecisionTreePredict.py +1 -1
- teradataml/analytics/sqle/__init__.py +10 -2
- teradataml/analytics/table_operator/__init__.py +3 -2
- teradataml/analytics/uaf/__init__.py +21 -2
- teradataml/analytics/utils.py +62 -1
- teradataml/analytics/valib.py +1 -1
- teradataml/automl/__init__.py +1553 -319
- teradataml/automl/custom_json_utils.py +139 -61
- teradataml/automl/data_preparation.py +276 -319
- teradataml/automl/data_transformation.py +163 -81
- teradataml/automl/feature_engineering.py +402 -239
- teradataml/automl/feature_exploration.py +9 -2
- teradataml/automl/model_evaluation.py +48 -51
- teradataml/automl/model_training.py +291 -189
- teradataml/catalog/byom.py +8 -8
- teradataml/catalog/model_cataloging_utils.py +1 -1
- teradataml/clients/auth_client.py +133 -0
- teradataml/clients/pkce_client.py +1 -1
- teradataml/common/aed_utils.py +3 -2
- teradataml/common/constants.py +48 -6
- teradataml/common/deprecations.py +13 -7
- teradataml/common/garbagecollector.py +156 -120
- teradataml/common/messagecodes.py +6 -1
- teradataml/common/messages.py +3 -1
- teradataml/common/sqlbundle.py +1 -1
- teradataml/common/utils.py +103 -11
- teradataml/common/wrapper_utils.py +1 -1
- teradataml/context/context.py +121 -31
- teradataml/data/advertising.csv +201 -0
- teradataml/data/bank_marketing.csv +11163 -0
- teradataml/data/bike_sharing.csv +732 -0
- teradataml/data/boston2cols.csv +721 -0
- teradataml/data/breast_cancer.csv +570 -0
- teradataml/data/complaints_test_tokenized.csv +353 -0
- teradataml/data/complaints_tokens_model.csv +348 -0
- teradataml/data/covid_confirm_sd.csv +83 -0
- teradataml/data/customer_segmentation_test.csv +2628 -0
- teradataml/data/customer_segmentation_train.csv +8069 -0
- teradataml/data/dataframe_example.json +10 -0
- teradataml/data/docs/sqle/docs_17_10/OneHotEncodingFit.py +3 -1
- teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +6 -0
- teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +5 -1
- teradataml/data/docs/sqle/docs_17_20/ANOVA.py +61 -1
- teradataml/data/docs/sqle/docs_17_20/CFilter.py +132 -0
- teradataml/data/docs/sqle/docs_17_20/ColumnTransformer.py +2 -0
- teradataml/data/docs/sqle/docs_17_20/FTest.py +105 -26
- teradataml/data/docs/sqle/docs_17_20/GLM.py +162 -1
- teradataml/data/docs/sqle/docs_17_20/GetFutileColumns.py +5 -3
- teradataml/data/docs/sqle/docs_17_20/KMeans.py +48 -1
- teradataml/data/docs/sqle/docs_17_20/NaiveBayes.py +162 -0
- teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +3 -2
- teradataml/data/docs/sqle/docs_17_20/OneHotEncodingFit.py +5 -0
- teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +6 -0
- teradataml/data/docs/sqle/docs_17_20/OutlierFilterFit.py +2 -0
- teradataml/data/docs/sqle/docs_17_20/Pivoting.py +279 -0
- teradataml/data/docs/sqle/docs_17_20/ROC.py +3 -2
- teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +13 -2
- teradataml/data/docs/sqle/docs_17_20/ScaleFit.py +119 -1
- teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +93 -1
- teradataml/data/docs/sqle/docs_17_20/Shap.py +197 -0
- teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +163 -1
- teradataml/data/docs/sqle/docs_17_20/TDNaiveBayesPredict.py +189 -0
- teradataml/data/docs/sqle/docs_17_20/TFIDF.py +142 -0
- teradataml/data/docs/sqle/docs_17_20/Unpivoting.py +216 -0
- teradataml/data/docs/sqle/docs_17_20/XGBoost.py +12 -4
- teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +7 -1
- teradataml/data/docs/sqle/docs_17_20/ZTest.py +72 -7
- teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -10
- teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/ArimaForecast.py +35 -5
- teradataml/data/docs/uaf/docs_17_20/ArimaValidate.py +3 -1
- teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +293 -0
- teradataml/data/docs/uaf/docs_17_20/AutoArima.py +354 -0
- teradataml/data/docs/uaf/docs_17_20/BreuschGodfrey.py +3 -2
- teradataml/data/docs/uaf/docs_17_20/BreuschPaganGodfrey.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/Convolve.py +13 -10
- teradataml/data/docs/uaf/docs_17_20/Convolve2.py +4 -1
- teradataml/data/docs/uaf/docs_17_20/CumulPeriodogram.py +5 -4
- teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +4 -4
- teradataml/data/docs/uaf/docs_17_20/DWT.py +235 -0
- teradataml/data/docs/uaf/docs_17_20/DWT2D.py +214 -0
- teradataml/data/docs/uaf/docs_17_20/DurbinWatson.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/ExtractResults.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +160 -0
- teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +9 -31
- teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +4 -2
- teradataml/data/docs/uaf/docs_17_20/IDFFT2.py +1 -8
- teradataml/data/docs/uaf/docs_17_20/IDWT.py +236 -0
- teradataml/data/docs/uaf/docs_17_20/IDWT2D.py +226 -0
- teradataml/data/docs/uaf/docs_17_20/IQR.py +134 -0
- teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/MAMean.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +297 -0
- teradataml/data/docs/uaf/docs_17_20/MatrixMultiply.py +15 -6
- teradataml/data/docs/uaf/docs_17_20/PACF.py +0 -1
- teradataml/data/docs/uaf/docs_17_20/Portman.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/Resample.py +9 -1
- teradataml/data/docs/uaf/docs_17_20/SAX.py +246 -0
- teradataml/data/docs/uaf/docs_17_20/SeasonalNormalize.py +17 -10
- teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/WhitesGeneral.py +3 -1
- teradataml/data/docs/uaf/docs_17_20/WindowDFFT.py +368 -0
- teradataml/data/dwt2d_dataTable.csv +65 -0
- teradataml/data/dwt_dataTable.csv +8 -0
- teradataml/data/dwt_filterTable.csv +3 -0
- teradataml/data/finance_data4.csv +13 -0
- teradataml/data/glm_example.json +28 -1
- teradataml/data/grocery_transaction.csv +19 -0
- teradataml/data/housing_train_segment.csv +201 -0
- teradataml/data/idwt2d_dataTable.csv +5 -0
- teradataml/data/idwt_dataTable.csv +8 -0
- teradataml/data/idwt_filterTable.csv +3 -0
- teradataml/data/insect2Cols.csv +61 -0
- teradataml/data/interval_data.csv +5 -0
- teradataml/data/jsons/paired_functions.json +14 -0
- teradataml/data/jsons/sqle/17.20/TD_ANOVA.json +99 -27
- teradataml/data/jsons/sqle/17.20/TD_CFilter.json +118 -0
- teradataml/data/jsons/sqle/17.20/TD_FTest.json +166 -83
- teradataml/data/jsons/sqle/17.20/TD_GLM.json +90 -14
- teradataml/data/jsons/sqle/17.20/TD_GLMPREDICT.json +48 -5
- teradataml/data/jsons/sqle/17.20/TD_GetFutileColumns.json +5 -3
- teradataml/data/jsons/sqle/17.20/TD_KMeans.json +31 -11
- teradataml/data/jsons/sqle/17.20/TD_NaiveBayes.json +193 -0
- teradataml/data/jsons/sqle/17.20/TD_NaiveBayesPredict.json +212 -0
- teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineFit.json +3 -2
- teradataml/data/jsons/sqle/17.20/TD_OneClassSVM.json +9 -9
- teradataml/data/jsons/sqle/17.20/TD_Pivoting.json +280 -0
- teradataml/data/jsons/sqle/17.20/TD_ROC.json +2 -1
- teradataml/data/jsons/sqle/17.20/TD_SVM.json +16 -16
- teradataml/data/jsons/sqle/17.20/TD_SVMPredict.json +19 -1
- teradataml/data/jsons/sqle/17.20/TD_ScaleFit.json +168 -15
- teradataml/data/jsons/sqle/17.20/TD_ScaleTransform.json +50 -1
- teradataml/data/jsons/sqle/17.20/TD_Shap.json +222 -0
- teradataml/data/jsons/sqle/17.20/TD_TFIDF.json +162 -0
- teradataml/data/jsons/sqle/17.20/TD_Unpivoting.json +235 -0
- teradataml/data/jsons/sqle/17.20/TD_XGBoost.json +25 -7
- teradataml/data/jsons/sqle/17.20/TD_XGBoostPredict.json +17 -4
- teradataml/data/jsons/sqle/17.20/TD_ZTest.json +157 -80
- teradataml/data/jsons/storedprocedure/17.20/TD_FILTERFACTORY1D.json +150 -0
- teradataml/data/jsons/uaf/17.20/TD_ACF.json +1 -18
- teradataml/data/jsons/uaf/17.20/TD_ARIMAESTIMATE.json +3 -16
- teradataml/data/jsons/uaf/17.20/TD_ARIMAFORECAST.json +0 -3
- teradataml/data/jsons/uaf/17.20/TD_ARIMAVALIDATE.json +5 -3
- teradataml/data/jsons/uaf/17.20/TD_ARIMAXESTIMATE.json +362 -0
- teradataml/data/jsons/uaf/17.20/TD_AUTOARIMA.json +469 -0
- teradataml/data/jsons/uaf/17.20/TD_BINARYMATRIXOP.json +0 -3
- teradataml/data/jsons/uaf/17.20/TD_BINARYSERIESOP.json +0 -2
- teradataml/data/jsons/uaf/17.20/TD_BREUSCH_GODFREY.json +2 -1
- teradataml/data/jsons/uaf/17.20/TD_BREUSCH_PAGAN_GODFREY.json +2 -5
- teradataml/data/jsons/uaf/17.20/TD_CONVOLVE.json +3 -6
- teradataml/data/jsons/uaf/17.20/TD_CONVOLVE2.json +1 -3
- teradataml/data/jsons/uaf/17.20/TD_CUMUL_PERIODOGRAM.json +0 -5
- teradataml/data/jsons/uaf/17.20/TD_DFFT.json +1 -4
- teradataml/data/jsons/uaf/17.20/TD_DFFT2.json +2 -7
- teradataml/data/jsons/uaf/17.20/TD_DFFT2CONV.json +1 -2
- teradataml/data/jsons/uaf/17.20/TD_DFFTCONV.json +0 -2
- teradataml/data/jsons/uaf/17.20/TD_DTW.json +3 -6
- teradataml/data/jsons/uaf/17.20/TD_DWT.json +173 -0
- teradataml/data/jsons/uaf/17.20/TD_DWT2D.json +160 -0
- teradataml/data/jsons/uaf/17.20/TD_FITMETRICS.json +1 -1
- teradataml/data/jsons/uaf/17.20/TD_GOLDFELD_QUANDT.json +16 -30
- teradataml/data/jsons/uaf/17.20/{TD_HOLT_WINTERS_FORECAST.json → TD_HOLT_WINTERS_FORECASTER.json} +1 -2
- teradataml/data/jsons/uaf/17.20/TD_IDFFT2.json +1 -15
- teradataml/data/jsons/uaf/17.20/TD_IDWT.json +162 -0
- teradataml/data/jsons/uaf/17.20/TD_IDWT2D.json +149 -0
- teradataml/data/jsons/uaf/17.20/TD_IQR.json +117 -0
- teradataml/data/jsons/uaf/17.20/TD_LINEAR_REGR.json +1 -1
- teradataml/data/jsons/uaf/17.20/TD_LINESPEC.json +1 -1
- teradataml/data/jsons/uaf/17.20/TD_MAMEAN.json +1 -3
- teradataml/data/jsons/uaf/17.20/TD_MATRIX2IMAGE.json +209 -0
- teradataml/data/jsons/uaf/17.20/TD_PACF.json +2 -2
- teradataml/data/jsons/uaf/17.20/TD_POWERSPEC.json +5 -5
- teradataml/data/jsons/uaf/17.20/TD_RESAMPLE.json +48 -28
- teradataml/data/jsons/uaf/17.20/TD_SAX.json +208 -0
- teradataml/data/jsons/uaf/17.20/TD_SEASONALNORMALIZE.json +12 -6
- teradataml/data/jsons/uaf/17.20/TD_SIMPLEEXP.json +0 -1
- teradataml/data/jsons/uaf/17.20/TD_TRACKINGOP.json +8 -8
- teradataml/data/jsons/uaf/17.20/TD_UNDIFF.json +1 -1
- teradataml/data/jsons/uaf/17.20/TD_UNNORMALIZE.json +1 -1
- teradataml/data/jsons/uaf/17.20/TD_WINDOWDFFT.json +400 -0
- teradataml/data/kmeans_example.json +5 -0
- teradataml/data/kmeans_table.csv +10 -0
- teradataml/data/load_example_data.py +8 -2
- teradataml/data/naivebayestextclassifier_example.json +1 -1
- teradataml/data/naivebayestextclassifierpredict_example.json +11 -0
- teradataml/data/onehot_encoder_train.csv +4 -0
- teradataml/data/openml_example.json +29 -0
- teradataml/data/peppers.png +0 -0
- teradataml/data/real_values.csv +14 -0
- teradataml/data/sax_example.json +8 -0
- teradataml/data/scale_attributes.csv +3 -0
- teradataml/data/scale_example.json +52 -1
- teradataml/data/scale_input_part_sparse.csv +31 -0
- teradataml/data/scale_input_partitioned.csv +16 -0
- teradataml/data/scale_input_sparse.csv +11 -0
- teradataml/data/scale_parameters.csv +3 -0
- teradataml/data/scripts/deploy_script.py +21 -2
- teradataml/data/scripts/sklearn/sklearn_fit.py +40 -37
- teradataml/data/scripts/sklearn/sklearn_fit_predict.py +22 -30
- teradataml/data/scripts/sklearn/sklearn_function.template +42 -24
- teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +23 -33
- teradataml/data/scripts/sklearn/sklearn_neighbors.py +19 -28
- teradataml/data/scripts/sklearn/sklearn_score.py +32 -32
- teradataml/data/scripts/sklearn/sklearn_transform.py +85 -42
- teradataml/data/star_pivot.csv +8 -0
- teradataml/data/templates/open_source_ml.json +2 -1
- teradataml/data/teradataml_example.json +97 -1
- teradataml/data/timestamp_data.csv +4 -0
- teradataml/data/titanic_dataset_unpivoted.csv +19 -0
- teradataml/data/uaf_example.json +55 -1
- teradataml/data/unpivot_example.json +15 -0
- teradataml/data/url_data.csv +9 -0
- teradataml/data/windowdfft.csv +16 -0
- teradataml/data/ztest_example.json +16 -0
- teradataml/dataframe/copy_to.py +9 -4
- teradataml/dataframe/data_transfer.py +125 -64
- teradataml/dataframe/dataframe.py +575 -57
- teradataml/dataframe/dataframe_utils.py +47 -9
- teradataml/dataframe/fastload.py +273 -90
- teradataml/dataframe/functions.py +339 -0
- teradataml/dataframe/row.py +160 -0
- teradataml/dataframe/setop.py +2 -2
- teradataml/dataframe/sql.py +740 -18
- teradataml/dataframe/window.py +1 -1
- teradataml/dbutils/dbutils.py +324 -18
- teradataml/geospatial/geodataframe.py +1 -1
- teradataml/geospatial/geodataframecolumn.py +1 -1
- teradataml/hyperparameter_tuner/optimizer.py +13 -13
- teradataml/lib/aed_0_1.dll +0 -0
- teradataml/opensource/sklearn/_sklearn_wrapper.py +254 -122
- teradataml/options/__init__.py +16 -5
- teradataml/options/configure.py +39 -6
- teradataml/options/display.py +2 -2
- teradataml/plot/axis.py +4 -4
- teradataml/scriptmgmt/UserEnv.py +26 -19
- teradataml/scriptmgmt/lls_utils.py +120 -16
- teradataml/table_operators/Script.py +4 -5
- teradataml/table_operators/TableOperator.py +160 -26
- teradataml/table_operators/table_operator_util.py +88 -41
- teradataml/table_operators/templates/dataframe_udf.template +63 -0
- teradataml/telemetry_utils/__init__.py +0 -0
- teradataml/telemetry_utils/queryband.py +52 -0
- teradataml/utils/validators.py +41 -3
- {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/METADATA +191 -6
- {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/RECORD +263 -185
- {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/WHEEL +0 -0
- {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/top_level.txt +0 -0
- {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/zip-safe +0 -0
@@ -24,6 +24,7 @@ import teradataml.context.context as tdmlctx
 from collections import OrderedDict, namedtuple
 from sqlalchemy.sql import ClauseElement
 from teradataml import execute_sql
+from teradataml import GarbageCollector
 from teradataml.dataframe.sql import _MetaExpression
 from teradataml.dataframe.sql_interfaces import ColumnExpression
 from teradataml.dataframe.sql_functions import case
@@ -41,6 +42,7 @@ from teradataml.dataframe.indexer import _LocationIndexer
 from teradataml.common.aed_utils import AedUtils
 from teradataml.options.display import display
 from teradataml.dataframe.copy_to import copy_to_sql
+from teradataml.dataframe.row import _Row
 from teradataml.dataframe.setop import concat
 from teradataml.plot.plot import _Plot
 from teradataml.scriptmgmt.UserEnv import UserEnv
@@ -52,7 +54,9 @@ from teradatasql import OperationalError
 from teradataml.dataframe.window import Window
 from teradataml.dataframe.data_transfer import _DataTransferUtils
 from teradataml.common.bulk_exposed_utils import _validate_unimplemented_function
-from
+from teradataml.telemetry_utils.queryband import collect_queryband
+from teradataml.options.configure import configure
+from teradataml.utils.internal_buffer import _InternalBuffer

 # TODO use logger when available on master branch
 # logger = teradatapylog.getLogger()
@@ -150,6 +154,11 @@ class DataFrame():
         # This attribute added to add setter for columns property,
         # it is required when setting columns from groupby
         self._columns = None
+        # This attribute stores the internal AED query and avoid multiple
+        # calls to AED utility function aed_show_query()
+        self._aed_query = None
+        # This attribute stores the type of query stored in self._aed_query.
+        self._is_full_query = None

         # Property to determine if table is an ART table or not.
         self._is_art = None
@@ -417,6 +426,130 @@ class DataFrame():

         return df

+    def create_temp_view(self, name):
+        """
+        DESCRIPTION:
+            Creates a temporary view for session on the DataFrame.
+
+        PARAMETERS:
+            name:
+                Required Argument.
+                Specifies the name of the temporary view.
+                Type: str
+
+        RETURNS:
+            None
+
+        RAISES:
+            OperationalError (When view already exists).
+
+        EXAMPLES:
+            # Load the data to run the example.
+            >>> load_example_data("dataframe", "admissions_train")
+            >>> df = DataFrame("admissions_train")
+            >>> df
+               masters   gpa     stats programming  admitted
+            id
+            38     yes  2.65  Advanced    Beginner         1
+            7      yes  2.33    Novice      Novice         1
+            26     yes  3.57  Advanced    Advanced         1
+            17      no  3.83  Advanced    Advanced         1
+            34     yes  3.85  Advanced    Beginner         0
+            13      no  4.00  Advanced      Novice         1
+            32     yes  3.46  Advanced    Beginner         0
+            11      no  3.13  Advanced    Advanced         1
+            15     yes  4.00  Advanced    Advanced         1
+            36      no  3.00  Advanced      Novice         0
+
+            # Example 1: Create view 'new_admissions'.
+            >>> df.create_temp_view("new_admissions")
+            >>> new_df = DataFrame("new_admissions")
+            >>> new_df
+               masters   gpa     stats programming  admitted
+            id
+            38     yes  2.65  Advanced    Beginner         1
+            7      yes  2.33    Novice      Novice         1
+            26     yes  3.57  Advanced    Advanced         1
+            17      no  3.83  Advanced    Advanced         1
+            34     yes  3.85  Advanced    Beginner         0
+            13      no  4.00  Advanced      Novice         1
+            32     yes  3.46  Advanced    Beginner         0
+            11      no  3.13  Advanced    Advanced         1
+            15     yes  4.00  Advanced    Advanced         1
+            36      no  3.00  Advanced      Novice         0
+        """
+        # Validating Arguments
+        arg_type_matrix = []
+        arg_type_matrix.append(["name", name, False, (str), True])
+        _Validators._validate_function_arguments(arg_type_matrix)
+
+        GarbageCollector._add_to_garbagecollector(name, TeradataConstants.TERADATA_VIEW)
+        UtilFuncs._create_view(name, self.show_query())
+
+    def materialize(self):
+        """
+        DESCRIPTION:
+            Method to materialize teradataml DataFrame into a database object.
+            Notes:
+                * DataFrames are materialized in either view/table/volatile table,
+                  which is decided and taken care by teradataml.
+                * If user wants to materialize object into specific database object
+                  such as table/volatile table, use 'to_sql()' or 'copy_to_sql()' or
+                  'fastload()' functions.
+                * Materialized object is garbage collected at the end of the session.
+
+        PARAMETERS:
+            None
+
+        RETURNS:
+            DataFrame
+
+        EXAMPLES:
+            >>> load_example_data("dataframe", "admissions_train")
+            >>> df = DataFrame("admissions_train")
+            >>> df
+               masters   gpa     stats programming  admitted
+            id
+            13      no  4.00  Advanced      Novice         1
+            26     yes  3.57  Advanced    Advanced         1
+            5       no  3.44    Novice      Novice         0
+            19     yes  1.98  Advanced    Advanced         0
+            15     yes  4.00  Advanced    Advanced         1
+            40     yes  3.95    Novice    Beginner         0
+            7      yes  2.33    Novice      Novice         1
+            22     yes  3.46    Novice    Beginner         0
+            36      no  3.00  Advanced      Novice         0
+            38     yes  2.65  Advanced    Beginner         1
+
+            # Example 1: Perform operations on teradataml DataFrame
+            # and materializeit in a database object.
+            >>> df2 = df.get([["id", "masters", "gpa"]])
+
+            # Initially table_name will be None.
+            >>> df2._table_name
+
+            >>> df2.materialize()
+               masters   gpa
+            id
+            15     yes  4.00
+            7      yes  2.33
+            22     yes  3.46
+            17      no  3.83
+            13      no  4.00
+            38     yes  2.65
+            26     yes  3.57
+            5       no  3.44
+            34     yes  3.85
+            40     yes  3.95
+
+            # After materialize(), view name will be assigned.
+            >>> df2._table_name
+            '"ALICE"."ml__select__172077355985236"'
+            >>>
+        """
+        self.__execute_node_and_set_table_name(self._nodeid, self._metaexpr)
+        return self
+
     @collect_queryband(queryband="DF_fillna")
     def fillna(self, value=None, columns=None, literal_value=False):
         """
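The two methods added above are thin conveniences over the lazy-evaluation machinery. A minimal end-to-end sketch, assuming an active Vantage connection (host and credentials below are placeholders):

```python
# Sketch of the new create_temp_view() and materialize() methods,
# based on the docstrings in this hunk; connection details are placeholders.
from teradataml import create_context, DataFrame, load_example_data

create_context(host="<host>", username="<user>", password="<password>")
load_example_data("dataframe", "admissions_train")

df = DataFrame("admissions_train")

# Register the DataFrame's SQL as a session-scoped view; the view is added
# to the garbage collector, so it is dropped when the session ends.
df.create_temp_view("new_admissions")
print(DataFrame("new_admissions"))

# Force the lazy node tree to execute and bind the result to a DB object;
# materialize() returns the same DataFrame, so calls can be chained.
df2 = df.get([["id", "masters", "gpa"]]).materialize()
print(df2._table_name)  # now populated, e.g. '"ALICE"."ml__select__..."'
```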
@@ -5017,7 +5150,7 @@ class DataFrame():
                     'median', 'var'

                 Acceptable formats for function(s) are
-                string, dictionary
+                string, dictionary, list of strings/functions/ColumnExpression or ColumnExpression.

                 Accepted combinations are:
                 1. String function name
@@ -5025,12 +5158,57 @@ class DataFrame():
                 3. Dictionary containing column name as key and
                    aggregate function name (string or list of
                    strings) as value
+                4. ColumnExpression built using the aggregate functions.
+                5. List of ColumnExpression built using the aggregate functions.
+
+                Note:
+                    * The name of the output columns are generated based on aggregate functions and column names.
+                      For Example,
+                          1. "func" passed as a string.
+                             >>> df.agg('mean')
+                             Assume that the column names of the dataframe are employee_no, first_name, marks, dob, joined_date.
+                             After the above operation, the output column names are:
+                             mean_employee_no, mean_marks, mean_dob, mean_joined_date
+
+                          2. "func" passed as a list of string functions.
+                             >>> df.agg(['min', 'sum'])
+                             Assume that the column names of the dataframe are employee_no, first_name, marks, dob, joined_date.
+                             After the above operation, the output column names are:
+                             min_employee_no, sum_employee_no, min_first_name, min_marks, sum_marks, min_dob, min_joined_date
+
+                          3. "func" passed as a dictionary containing column name as key and aggregate function name as value.
+                             >>> df.agg({'employee_no' : ['min', 'sum', 'var'], 'first_name' : ['min']})
+                             Output column names after the above operation are:
+                             min_employee_no, sum_employee_no, var_employee_no, min_first_name
+
+                          4. "func" passed as a ColumnExpression built using the aggregate functions.
+                             >>> df.agg(df.first_name.count())
+                             Output column name after the above operation is:
+                             count(first_name)
+
+                          5. "func" passed as a list of ColumnExpression built using the aggregate functions.
+                             >>> df.agg([df.employee_no.min(), df.first_name.count()])
+                             Output column names after the above operation are:
+                             min(employee_no), count(first_name)
+
+                    * On ColumnExpression or list of ColumnExpression alias() can be used to
+                      return the output columns with aliased name.
+                      For Example,
+                          >>> df.agg(df.first_name.count().alias("total_names"))
+                          Output column name after the above operation is:
+                          total_names
+
+                          >>> df.agg([df.joined_date.min().alias("min_date"), df.first_name.count().alias("total_names")])
+                          Output column names after the above operation are:
+                          min_date, total_names

         RETURNS:
             teradataml DataFrame object with operations
             mentioned in parameter 'func' performed on specified
             columns.
+
         RAISES:
             TeradataMLException
                 1. TDMLDF_AGGREGATE_FAILED - If operations on given columns
@@ -5072,8 +5250,8 @@ class DataFrame():
                    valid datatype.

                 Possible error message:
-                Invalid type(s) passed to argument 'func', should be:
-
+                Invalid type(s) passed to argument 'func', should be:
+                ['str, dict, ColumnExpression or list of values of type(s): str, ColumnExpression'].

         EXAMPLES :
             # Load the data to run the example.
@@ -5090,21 +5268,49 @@ class DataFrame():
            112          None       None   None  18/12/05
            >>>

-           #
+           # Get the minimum, sum and variance of employee number and minimum and mean of name,
+           # by passing dictionary of column names to string function/list of string functions as parameter.
            >>> df.agg({'employee_no' : ['min', 'sum', 'var'], 'first_name' : ['min', 'mean']})
-
-
+              min_employee_no  sum_employee_no  var_employee_no min_first_name
+           0              100              313        44.333333           abcd

-           #
+           # Get the minimum and sum of all the columns in the dataframe,
+           # by passing list of string functions as parameter.
            >>> df.agg(['min', 'sum'])
-
-
+              min_employee_no  sum_employee_no min_first_name min_marks sum_marks min_dob min_joined_date
+           0              100              313           abcd      None      None    None      1902-05-12

-           #
+           # Get the mean of all the columns in the dataframe, by passing string function as parameter.
            >>> df.agg('mean')
               mean_employee_no mean_marks mean_dob mean_joined_date
            0        104.333333       None     None         60/12/04

+           # Get the total names in the dataframe, by running count() on the "first_name"
+           # and passing ColumnExpression as parameter.
+           >>> df.agg(df.first_name.count())
+              count(first_name)
+           0                  2
+
+           # Get the minimum of joining date and total of names in the dataframe,
+           # by running min() on joined_date and count() on the "first_name"
+           # and passing list of ColumnExpression as parameter.
+           >>> df.agg([df.employee_no.min(), df.first_name.count()])
+              min(employee_no)  count(first_name)
+           0               100                  2
+
+           # Get the total names in the dataframe, by running count() on the "first_name" and
+           # use alias() to have the output column named as "total_names".
+           >>> df.agg(df.first_name.count().alias("total_names"))
+              total_names
+           0            2
+
+           # Get the minimum of joining date and total names in the dataframe,
+           # by running min() on joined_date and count() on the "first_name" and
+           # use alias() to have the output column named as "min_date" and "total_names".
+           >>> df.agg([df.joined_date.min().alias("min_date"), df.first_name.count().alias("total_names")])
+              min_date  total_names
+           0  02/12/05            2
+
            # Select only subset of columns from the DataFrame.
            >>> df1 = df.select(['employee_no', 'first_name', 'joined_date'])

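Taken together, the extended agg() now accepts ColumnExpressions alongside the existing string and dict forms. A compact sketch of all five accepted shapes, assuming a table with the columns used in the docstring above (employee_no, first_name, marks, dob, joined_date; the table name is illustrative):

```python
# Sketch of the extended agg() signatures from this hunk; "employee_info"
# is a hypothetical table with the columns named in the docstring above.
from teradataml import DataFrame

df = DataFrame("employee_info")

df.agg('mean')                                   # 1. string function name
df.agg(['min', 'sum'])                           # 2. list of string functions
df.agg({'employee_no': ['min', 'sum', 'var']})   # 3. dict: column -> function(s)
df.agg(df.first_name.count())                    # 4. single ColumnExpression
df.agg([df.employee_no.min(),                    # 5. list of ColumnExpressions,
        df.first_name.count().alias("total_names")])  # optionally aliased
```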
@@ -5145,9 +5351,9 @@ class DataFrame():
            raise TeradataMlException(Messages.get_message(MessageCodes.MISSING_ARGS, "func"),
                                      MessageCodes.MISSING_ARGS)

-        if not isinstance(func, str
+        if not isinstance(func, (str, list, dict, ColumnExpression)):
            raise TeradataMlException(Messages.get_message(MessageCodes.UNSUPPORTED_DATATYPE,
-
+                                     'func', ['str, dict, ColumnExpression or list of values of type(s): str, ColumnExpression']),
                                      MessageCodes.UNSUPPORTED_DATATYPE)

        return self._get_dataframe_aggregate(func)
@@ -5169,6 +5375,8 @@ class DataFrame():
                 3. Dictionary containing column name as key and
                    aggregate function name (string or list of
                    strings) as value
+                4. ColumnExpression built using the aggregate functions.
+                5. List of ColumnExpression built using the aggregate functions.

             **kwargs: Keyword arguments. Mainly used for Time Series Aggragates.

@@ -5345,7 +5553,9 @@ class DataFrame():
                result = self._check_numeric_overflow(agg_df)
        """
        try:
-
+            # Printing the DF will actually run underlying select query and
+            # will brought up numeric overflow if any. Only materializing won't work.
+            print(result_df)
            return False
        except TeradataMlException as tme:
            if "Numeric overflow occurred during computation" in str(tme):
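The comment added in this hunk records a subtle evaluation detail: materializing the frame never runs the SELECT, so the check prints it to force execution. A minimal standalone sketch of that pattern (function name is illustrative):

```python
# Sketch of the evaluation trick _check_numeric_overflow() relies on:
# printing a teradataml DataFrame executes the underlying SELECT, which is
# what surfaces a numeric overflow; materializing alone would not.
from teradataml.common.exceptions import TeradataMlException

def has_numeric_overflow(agg_df) -> bool:
    try:
        print(agg_df)  # triggers the SELECT against Vantage
        return False
    except TeradataMlException as tme:
        if "Numeric overflow occurred during computation" in str(tme):
            return True
        raise  # any other failure is not an overflow; re-raise it
```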
@@ -5481,18 +5691,73 @@ class DataFrame():
        EXAMPLES:
            self.__get_data_columns()
        """
-
-
-
+        if not self._table_name:
+            if not self._aed_query:
+                self.__generate_aed_query()
+            # TODO: Check the length of query and if it fails, create a view in catch block.
+            # Address in this JIRA: https://teradata-pe.atlassian.net/browse/ELE-6922
+            query = repr(self._metaexpr) + ' FROM ( ' + self._aed_query + ' ) as temp_table'
+        else:
+            query = repr(self._metaexpr) + ' FROM ' + self._table_name

        if self._orderby is not None:
            query += ' ORDER BY ' + self._orderby

+        query += ';'
        # Execute the query and get the results in a list.
        self.__data, self.__data_columns = UtilFuncs._execute_query(query=query, fetchWarnings=True)

        return self.__data, self.__data_columns

+    def __generate_aed_query(self, full_query=False):
+        """
+        DESCRIPTION:
+            Internal function to return underlying SQL for the teradataml
+            DataFrame. It is the same SQL that is used to view the data for
+            a teradataml DataFrame.
+
+        PARAMETERS:
+            full_query:
+                Optional Argument.
+                Specifies if the complete query for the dataframe should be returned.
+                When this parameter is set to True, query for the dataframe is returned
+                with respect to the base dataframe's table (from_table() or from_query())
+                or from the output tables of analytical functions (if there are any in the
+                workflow). This query may or may not be directly used to retrieve data
+                for the dataframe upon which the function is called.
+                When this parameter is not used, string returned is the query already used
+                or will be used to retrieve data for the teradataml DataFrame.
+                Default Value: False
+                Types: bool
+
+        RETURNS:
+            String representing the underlying SQL query for the teradataml DataFrame.
+
+        RAISES:
+            None.
+
+        EXAMPLES:
+            self.__generate_aed_query()
+        """
+        # Run aed call only when _aed_query is None or
+        # the type of current stored query (full/short) is not matching
+        # with asked query type.
+        if (not self._aed_query) or (not self._is_full_query == full_query):
+            node_id = self._nodeid
+
+            if isinstance(self, (DataFrameGroupBy, DataFrameGroupByTime)):
+                # If dataframe is either of type groupby or groupbytime
+                # then get its parent dataframe nodeid and return queries
+                # for the same
+                node_id = self._aed_utils._aed_get_parent_nodeids(self._nodeid)[0]

+            queries = self._aed_utils._aed_show_query(node_id, query_with_reference_to_top=full_query)
+            # Store query and type of query in class attributes to avoid future runs.
+            self._aed_query = queries[0][0]
+            self._is_full_query = full_query
+
+        return self._aed_query
+
     @collect_queryband(queryband="DF_select")
     def select(self, select_expression):
        """
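The caching that __generate_aed_query() introduces is a memoize-by-flag pattern: recompute only when the cache is empty or the cached flavor (full vs. short query) differs from the one requested. A self-contained sketch of just that pattern, with illustrative names rather than the library's internals:

```python
# Standalone sketch of the query-caching pattern added above; QueryCache
# and its builder callable are illustrative stand-ins, not teradataml API.
class QueryCache:
    def __init__(self, builder):
        self._builder = builder      # callable: (full_query: bool) -> str
        self._query = None           # cached SQL text
        self._is_full_query = None   # flavor of the cached text

    def get(self, full_query=False):
        # Rebuild only on a cache miss or a flavor mismatch.
        if self._query is None or self._is_full_query != full_query:
            self._query = self._builder(full_query)
            self._is_full_query = full_query
        return self._query

cache = QueryCache(lambda full: "SELECT * FROM base_t" if full else "SELECT * FROM t")
assert cache.get() == cache.get()            # second call hits the cache
assert cache.get(True) != cache.get(False)   # flavor change triggers a rebuild
```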
@@ -7032,6 +7297,97 @@ class DataFrame():
        if function_name is None or function_name in VANTAGE_FUNCTION_ARGTYPE_DEPENDENT_MAPPER:
            self.__execute_node_and_set_table_name(self._nodeid)
        return True
+
+    def _assign_udf(self, udf_expr):
+        """
+        DESCRIPTION:
+            Internal function for DataFrame.assign() to execute the udf using
+            Script Table Operator and create new column for teradataml DataFrame.
+
+        PARAMETER:
+            udf_expr:
+                Required Argument.
+                Specifies a dictionary of column name to UDF expressions.
+                Types: dict
+
+        RETURNS:
+            teradataml DataFrame
+
+        RAISES:
+            None.
+
+        EXAMPLES:
+            self._assign_udf(udf_expr)
+        """
+
+        df = self
+        env_name = None
+        # Create a dictionary of env_name to list of output columns to be run on that env.
+        env_mapper = OrderedDict()
+
+        exec_mode = 'REMOTE' if UtilFuncs._is_lake() else 'IN-DB'
+        if exec_mode == 'REMOTE':
+            if _InternalBuffer.get("auth_token") is None:
+                raise TeradataMlException(Messages.get_message(
+                    MessageCodes.FUNC_EXECUTION_FAILED, "'udf'", 'Authentication token is required to run udf. Set token using set_auth_token().'),
+                    MessageCodes.FUNC_EXECUTION_FAILED)
+            else:
+                for colname, col in udf_expr.items():
+                    env_name = UtilFuncs._get_env_name(col)
+                    # Store the env_name and its corresponding output column
+                    if env_name in env_mapper:
+                        env_mapper[env_name].append(colname)
+                    else:
+                        env_mapper[env_name] = [colname]
+        else:
+            env_mapper[env_name] = udf_expr.keys()
+
+        for env_name, cols in env_mapper.items():
+            # Create a dictionary of output columns to column type.
+            returns = OrderedDict([(column.name, column.type) for column in df._metaexpr.c])
+            # Store the udf functions
+            user_function = []
+            # Create a dictionary of output column name to udf name
+            columns_definitions = {}
+            # Create a dictionary of output column name to udf arguments
+            function_args = {}
+            for colname, col in udf_expr.items():
+                delimiter = col._delimiter
+                quotechar = col._quotechar
+                if colname in cols:
+                    user_function.append(col._udf)
+                    function_args[colname] = col._udf_args if col._udf_args else ()
+                    returns[colname] = col.type
+                    columns_definitions[colname] = col._udf.__name__
+
+            tbl_operators = _TableOperatorUtils([],
+                                                df,
+                                                "udf",
+                                                user_function,
+                                                exec_mode,
+                                                chunk_size=None,
+                                                returns=returns,
+                                                delimiter=delimiter,
+                                                quotechar=quotechar,
+                                                num_rows=1,
+                                                auth=None,
+                                                data_partition_column=None,
+                                                data_hash_column=None,
+                                                data_order_column=None,
+                                                is_local_order=None,
+                                                nulls_first=None,
+                                                sort_ascending=None,
+                                                charset=None,
+                                                env_name = env_name,
+                                                style = "csv",
+                                                function_args=function_args,
+                                                columns_definitions=columns_definitions,
+                                                output_type_converters={
+                                                    col_name: _Dtypes._teradata_type_to_python_type(col_type)
+                                                    for col_name, col_type in returns.items()})
+
+            df = tbl_operators.execute()
+        return df

     @collect_queryband(queryband="DF_assign")
     def assign(self, drop_columns=False, **kwargs):
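Before launching one table-operator call per environment, _assign_udf() groups output columns by the environment each UDF targets. The grouping itself is the standard group-by-key dict idiom; an equivalent minimal sketch with illustrative data:

```python
# Equivalent of the env_mapper grouping built in _assign_udf(), written with
# dict.setdefault(); the column-to-environment mapping here is illustrative.
from collections import OrderedDict

udf_envs = {"upper_stats": "test_udf", "len_sum": "test_udf", "flag": "other_env"}

env_mapper = OrderedDict()
for colname, env_name in udf_envs.items():
    env_mapper.setdefault(env_name, []).append(colname)

assert env_mapper == {"test_udf": ["upper_stats", "len_sum"],
                      "other_env": ["flag"]}
```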
@@ -7043,10 +7399,12 @@ class DataFrame():
             drop_columns:
                 Optional Argument.
                 If True, drop columns that are not specified in assign.
-
-                When DataFrame.assign() is run on DataFrame.groupby(), this argument
-
-
+                Notes:
+                    1. When DataFrame.assign() is run on DataFrame.groupby(), this argument
+                       is ignored. In such cases, all columns are dropped and only new columns
+                       and grouping columns are returned.
+                    2. Argument is ignored for UDF functions.
+
                 Default Value: False
                 Types: bool

@@ -7062,6 +7420,7 @@ class DataFrame():
                 * SQLAlchemy ClauseElements.
                   (See teradataml extension with SQLAlchemy in teradataml User Guide
                   and Function reference guide for more details)
+                * Function - udf.


         RETURNS:
@@ -7087,6 +7446,16 @@ class DataFrame():
                used, but the column used in such function must be a part of group by columns.
                See examples for teradataml extension with SQLAlchemy on using various
                functions with DataFrame.assign().
+            6. UDF expressions can run on both Vantage Cloud Lake leveraging Apply Table Operator
+               of Open Analytics Framework and Enterprise leveraging Vantage's Script Table Operator.
+            7. One can pass both regular expressions and udf expressions to this API.
+               However, regular expressions are computed first followed by udf expressions.
+               Hence the order of columns also maintained in same order.
+               Look at Example 18 to understand more.
+            8. While passing multiple udf expressions, one can not pass one column output
+               as another column input in the same ``assign`` call.
+            9. If user pass multiple udf expressions, delimiter and quotechar specified in
+               last udf expression are considered for processing.

        RAISES:
            1. ValueError - When a callable is passed as a value, or columns from different
@@ -7348,6 +7717,134 @@ class DataFrame():
            1  Advanced  2.886226  3.508750      84.21
            2    Novice  6.377775  3.559091      39.15
            >>>
+
+            #
+            # Executing user defined function (UDF) with assign()
+            #
+            # Example 15: Create two user defined functions to 'to_upper' and 'sum',
+            #             'to_upper' to get the values in 'accounts' to upper case and
+            #             'sum' to add length of string values in column 'accounts'
+            #             with column 'Feb' and store the result in Integer type column.
+            >>> @udf
+            ... def to_upper(s):
+            ...     if s is not None:
+            ...         return s.upper()
+            >>>
+            >>> from teradatasqlalchemy.types import INTEGER
+            >>> @udf(returns=INTEGER())
+            ... def sum(x, y):
+            ...     return len(x)+y
+            >>>
+            # Assign both Column Expressions returned by user defined functions
+            # to the DataFrame.
+            >>> res = df.assign(upper_stats = to_upper('accounts'), len_sum = sum('accounts', 'Feb'))
+            >>> res
+                          Feb    Jan    Mar    Apr  datetime upper_stats  len_sum
+            accounts
+            Blue Inc     90.0   50.0   95.0  101.0  17/01/04    BLUE INC       98
+            Red Inc     200.0  150.0  140.0    NaN  17/01/04     RED INC      207
+            Yellow Inc   90.0    NaN    NaN    NaN  17/01/04  YELLOW INC      100
+            Jones LLC   200.0  150.0  140.0  180.0  17/01/04   JONES LLC      209
+            Orange Inc  210.0    NaN    NaN  250.0  17/01/04  ORANGE INC      220
+            Alpha Co    210.0  200.0  215.0  250.0  17/01/04    ALPHA CO      218
+            >>>
+
+            # Example 16: Create a user defined function to add 4 to the 'datetime' column
+            #             and store the result in DATE type column.
+            >>> from teradatasqlalchemy.types import DATE
+            >>> import datetime
+            >>> @udf(returns=DATE())
+            ... def add_date(x, y):
+            ...     return (datetime.datetime.strptime(x, "%y/%m/%d")+datetime.timedelta(y)).strftime("%y/%m/%d")
+            >>>
+            # Assign the Column Expression returned by user defined function
+            # to the DataFrame.
+            >>> res = df.assign(new_date = add_date('datetime', 4))
+            >>> res
+                          Feb    Jan    Mar    Apr  datetime  new_date
+            accounts
+            Alpha Co    210.0  200.0  215.0  250.0  17/01/04  17/01/08
+            Blue Inc     90.0   50.0   95.0  101.0  17/01/04  17/01/08
+            Jones LLC   200.0  150.0  140.0  180.0  17/01/04  17/01/08
+            Orange Inc  210.0    NaN    NaN  250.0  17/01/04  17/01/08
+            Yellow Inc   90.0    NaN    NaN    NaN  17/01/04  17/01/08
+            Red Inc     200.0  150.0  140.0    NaN  17/01/04  17/01/08
+            >>>
+
+            # Example 17: Create a user defined functions to 'to_upper' to get
+            #             the values in 'accounts' to upper case and create a
+            #             new column with a string literal value.
+            >>> @udf
+            ... def to_upper(s):
+            ...     if s is not None:
+            ...         return s.upper()
+            >>>
+            # Assign both expressions to the DataFrame.
+            >>> res = df.assign(upper_stats = to_upper('accounts'), new_col = 'string')
+            >>> res
+                          Feb    Jan    Mar    Apr  datetime new_col upper_stats
+            accounts
+            Alpha Co    210.0  200.0  215.0  250.0  17/01/04  string    ALPHA CO
+            Blue Inc     90.0   50.0   95.0  101.0  17/01/04  string    BLUE INC
+            Yellow Inc   90.0    NaN    NaN    NaN  17/01/04  string  YELLOW INC
+            Jones LLC   200.0  150.0  140.0  180.0  17/01/04  string   JONES LLC
+            Red Inc     200.0  150.0  140.0    NaN  17/01/04  string     RED INC
+            Orange Inc  210.0    NaN    NaN  250.0  17/01/04  string  ORANGE INC
+            >>>
+
+            # Example 18: Create two user defined functions to 'to_upper' and 'sum'
+            #             and create new columns with string literal value and
+            #             arithmetic operation on column 'Feb'.
+            >>> @udf
+            ... def to_upper(s):
+            ...     if s is not None:
+            ...         return s.upper()
+            >>>
+            >>> from teradatasqlalchemy.types import INTEGER
+            >>> @udf(returns=INTEGER())
+            ... def sum(x, y):
+            ...     return len(x)+y
+            >>>
+            # Assign all expressions to the DataFrame.
+            >>> res = df.assign(upper_stats = to_upper('accounts'),new_col = 'abc',
+            ...                 len_sum = sum('accounts', 'Feb'), col_sum = df.Feb+1)
+            >>> res
+                          Feb    Jan    Mar    Apr  datetime  col_sum new_col upper_stats  len_sum
+            accounts
+            Blue Inc     90.0   50.0   95.0  101.0  17/01/04     91.0     abc    BLUE INC       98
+            Alpha Co    210.0  200.0  215.0  250.0  17/01/04    211.0     abc    ALPHA CO      218
+            Jones LLC   200.0  150.0  140.0  180.0  17/01/04    201.0     abc   JONES LLC      209
+            Yellow Inc   90.0    NaN    NaN    NaN  17/01/04     91.0     abc  YELLOW INC      100
+            Orange Inc  210.0    NaN    NaN  250.0  17/01/04    211.0     abc  ORANGE INC      220
+            Red Inc     200.0  150.0  140.0    NaN  17/01/04    201.0     abc     RED INC      207
+            >>>
+
+            # Example 19: Convert the values is 'accounts' column to upper case using a user
+            #             defined function on Vantage Cloud Lake.
+            # Create a Python 3.10.5 environment with given name and description in Vantage.
+            >>> env = create_env('test_udf', 'python_3.10.5', 'Test environment for UDF')
+            User environment 'test_udf' created.
+            >>>
+            # Create a user defined functions to 'to_upper' to get the values in upper case
+            # and pass the user env to run it on.
+            >>> from teradataml.dataframe.functions import udf
+            >>> @udf(env_name = env)
+            ... def to_upper(s):
+            ...     if s is not None:
+            ...         return s.upper()
+            >>>
+            # Assign the Column Expression returned by user defined function
+            # to the DataFrame.
+            >>> df.assign(upper_stats = to_upper('accounts'))
+                          Feb    Jan    Mar    Apr  datetime upper_stats
+            accounts
+            Alpha Co    210.0  200.0  215.0  250.0  17/01/04    ALPHA CO
+            Blue Inc     90.0   50.0   95.0  101.0  17/01/04    BLUE INC
+            Yellow Inc   90.0    NaN    NaN    NaN  17/01/04  YELLOW INC
+            Jones LLC   200.0  150.0  140.0  180.0  17/01/04   JONES LLC
+            Orange Inc  210.0    NaN    NaN  250.0  17/01/04  ORANGE INC
+            Red Inc     200.0  150.0  140.0    NaN  17/01/04     RED INC
+            >>>
         """
         # Argument validations
         awu_matrix = []
@@ -7393,13 +7890,35 @@ class DataFrame():
            msg = Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR)
            raise TeradataMlException(msg, MessageCodes.TDMLDF_INFO_ERROR)

-
-
-
-
-
-
-
+        # Create a dictionary of column name to udf expressions and
+        # column name to normal/regular expressions.
+        udf_expr = {}
+        regular_expr = {}
+        for colname, col in kwargs.items():
+            # If value passed in kwargs is a ColumnExpression and is a udf, store it.
+            if isinstance(col, ColumnExpression) and col._udf:
+                udf_expr[colname] = col
+            else:
+                regular_expr[colname] = col
+        df = self
+
+        # If kwargs contains both regular and udf expressions, first create new columns
+        # from normal/regular expressions then on the output dataframe create new columns
+        # from udf expression.
+        if bool(regular_expr):
+            try:
+                (new_meta, new_nodeid) = df._generate_assign_metaexpr_aed_nodeid(drop_columns, **regular_expr)
+                df = df._create_dataframe_from_node(new_nodeid, new_meta, df._index_label)
+            except Exception as err:
+                errcode = MessageCodes.TDMLDF_INFO_ERROR
+                msg = Messages.get_message(MessageCodes.TDMLDF_INFO_ERROR)
+                raise TeradataMlException(msg, errcode) from err
+
+        if bool(udf_expr):
+            df = df._assign_udf(udf_expr)
+
+        return df
+

     @collect_queryband(queryband="DF_get")
     def get(self, key):
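The new assign() body is a two-phase pipeline: partition kwargs into regular and UDF-backed expressions, apply the regular ones first, then run the UDFs on the result (which is why note 7 above fixes the column order). The partitioning step in isolation, with illustrative stand-ins for the library's expression types:

```python
# Sketch of the kwargs partitioning assign() now performs; the is_udf
# predicate and the string-tagged values are illustrative stand-ins.
def split_exprs(kwargs, is_udf):
    udf_expr, regular_expr = {}, {}
    for name, expr in kwargs.items():
        (udf_expr if is_udf(expr) else regular_expr)[name] = expr
    return regular_expr, udf_expr

regular, udfs = split_exprs(
    {"col_sum": 1, "upper_stats": "udf:to_upper"},
    lambda e: isinstance(e, str) and e.startswith("udf:"))
assert regular == {"col_sum": 1} and udfs == {"upper_stats": "udf:to_upper"}
```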
@@ -10013,9 +10532,10 @@ class DataFrame():
        case_when_then = {}
        list_of_fracs = frac

-        # When stratify column is passed for sample
-        #
-
+        # When stratify column is passed for sample or when seed is passed for
+        # reproducibilty of result then
+        # perform TrainTestSplit for data sampling.
        if stratify_column is not None or seed is not None:
            # Local import TrainTestSplit function.
            from teradataml.analytics.sqle import TrainTestSplit
@@ -10029,7 +10549,16 @@ class DataFrame():
                                           train_size=list_of_fracs[0],
                                           test_size=list_of_fracs[1],
                                           stratify_column=stratify_column,
-                                          seed=seed
+                                          seed=seed,
+                                          persist=True,
+                                          display_table_name=False)
+
+            # Retrieve the table name from TrainTestSplit_out object.
+            table_name = TrainTestSplit_out.result._table_name
+
+            # Add the table to garbage collector.
+            table_added = GarbageCollector._add_to_garbagecollector(table_name)
+
            # Retrieve the sampled result and updated the column name and values
            # for backward compatibility.
            _sampled_df = TrainTestSplit_out.result
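With this change, sample() delegates to TrainTestSplit whenever a stratify column or a seed is supplied, persisting the split table and registering it for garbage collection so repeated reads of the result are stable. A hedged usage sketch, assuming the connection and example data from earlier:

```python
# Sketch of reproducible sampling via the new TrainTestSplit path; assumes
# an active connection and the admissions_train example table loaded above.
from teradataml import DataFrame

df = DataFrame("admissions_train")

# 75/25 split, stratified on 'admitted' and reproducible across runs
# because seed routes the call through TD_TrainTestSplit with persist=True.
sampled = df.sample(frac=[0.75, 0.25], stratify_column="admitted", seed=42)
```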
@@ -10133,10 +10662,10 @@ class DataFrame():

        # Make this non-lazy. Added this in order to fix https://teradata-pe.atlassian.net/browse/ELE-6368
        # Cannot use __execute_node_and_set_table_name because self points to original df.
-        # Hence, setting the
+        # Hence, setting the _table_name with _execute_node_return_db_object_name.

        df = self._create_dataframe_from_node(sample_node_id, new_metaexpr, self._index_label)
-        df.
+        df._table_name = df_utils._execute_node_return_db_object_name(sample_node_id, new_metaexpr)

        return df

@@ -10267,26 +10796,14 @@ class DataFrame():
                    where admitted > 0) as temp_table SAMPLE 0.9'

        """
+        # Argument validations
+        awu_matrix = []
+        awu_matrix.append(["full_query", full_query, False, (bool)])
+        # Validate argument types
+        _Validators._validate_function_arguments(awu_matrix)

        try:
-
-            awu_matrix = []
-            awu_matrix.append(["full_query", full_query, False, (bool)])
-            # Validate argument types
-            _Validators._validate_function_arguments(awu_matrix)
-
-            node_id = self._nodeid
-
-            if isinstance(self, (DataFrameGroupBy, DataFrameGroupByTime)):
-                # If dataframe is either of type groupby or groupbytime
-                # then get it's parent dataframe nodeid and return queries
-                # for the same
-                node_id = self._aed_utils._aed_get_parent_nodeids(self._nodeid)[0]
-
-            queries = self._aed_utils._aed_show_query(node_id, query_with_reference_to_top=full_query)
-
-            return queries[0][0]
-
+            return self.__generate_aed_query(full_query)
        except TeradataMlException:
            raise

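show_query() is now a thin wrapper over the cached __generate_aed_query(), so repeated calls with the same full_query flag reuse the stored SQL text. A short usage sketch built on the docstring's own filter/sample example:

```python
# Sketch of show_query() after the refactor; mirrors the docstring example
# above ('where admitted > 0 ... SAMPLE 0.9') and assumes an active session.
from teradataml import DataFrame

df = DataFrame("admissions_train")
subset = df[df.admitted > 0].sample(frac=0.9)

print(subset.show_query())                 # SQL as it will actually run
print(subset.show_query(full_query=True))  # expanded back to the base table
```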
@@ -10296,7 +10813,7 @@ class DataFrame():
        except Exception as err:
            errcode = MessageCodes.TDMLDF_INFO_ERROR
            msg = Messages.get_message(errcode)
-           raise TeradataMlException(msg, errcode) from err
+            raise TeradataMlException(msg, errcode) from err

    @collect_queryband(queryband="DF_mapRow")
    def map_row(self,
@@ -13755,7 +14272,7 @@ class DataFrame():
                Types: int OR NoneType

        RETURNS:
-           iterator, an object to iterate over
+           iterator, an object to iterate over row in the DataFrame.

        RAISES:
            None
@@ -13804,9 +14321,10 @@ class DataFrame():
        cur = execute_sql(query)

        if name:
+            columns = [column[0] for column in cur.description]
            for rec in cur:
-
-                yield
+                row = _Row(columns=columns, values=rec)
+                yield row
        else:
            for rec in cur:
                yield rec
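The _Row wiring above backs the DataFrame row iterator: with a name set, each cursor record is wrapped in a _Row built from the cursor's column descriptions and values. A hedged sketch, assuming the iterator is DataFrame.itertuples() with name/num_rows parameters (the method name is not shown in this hunk):

```python
# Sketch of row iteration backed by the new _Row class; assumes the public
# entry point is DataFrame.itertuples(name=..., num_rows=...), which this
# hunk's context suggests but does not show directly.
from teradataml import DataFrame

df = DataFrame("admissions_train")
for row in df.itertuples(name="Row", num_rows=3):
    print(row)  # a _Row combining cursor column names with the record values
```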
@@ -16626,7 +17144,7 @@ class _TDUAF(DataFrame):
        # UAF Functions do not accept double quotes.
        db_name = UtilFuncs._extract_db_name(table_name)
        if db_name:
-            table_name = "{}.{}".format(db_name, UtilFuncs._extract_table_name(table_name))
+            table_name = '"{}"."{}"'.format(db_name, UtilFuncs._extract_table_name(table_name))
        else:
            table_name = UtilFuncs._extract_table_name(table_name)

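The fix quotes each part of the two-part name separately, so database or table names containing mixed case or special characters survive round-tripping. A quick standalone check of the new format string:

```python
# Quick check of the new two-part quoting for UAF table names; the sample
# names are illustrative.
db, tbl = "MyDB", "my table"
assert '"{}"."{}"'.format(db, tbl) == '"MyDB"."my table"'   # new behavior
assert "{}.{}".format(db, tbl) == "MyDB.my table"           # old, unquoted
```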