teradataml 20.0.0.2__py3-none-any.whl → 20.0.0.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- teradataml/LICENSE-3RD-PARTY.pdf +0 -0
- teradataml/README.md +315 -2
- teradataml/__init__.py +4 -0
- teradataml/_version.py +1 -1
- teradataml/analytics/analytic_function_executor.py +95 -8
- teradataml/analytics/byom/__init__.py +1 -1
- teradataml/analytics/json_parser/metadata.py +12 -3
- teradataml/analytics/json_parser/utils.py +7 -2
- teradataml/analytics/sqle/__init__.py +5 -1
- teradataml/analytics/table_operator/__init__.py +1 -1
- teradataml/analytics/uaf/__init__.py +1 -1
- teradataml/analytics/utils.py +4 -0
- teradataml/analytics/valib.py +18 -4
- teradataml/automl/__init__.py +51 -6
- teradataml/automl/data_preparation.py +59 -35
- teradataml/automl/data_transformation.py +58 -33
- teradataml/automl/feature_engineering.py +27 -12
- teradataml/automl/model_training.py +73 -46
- teradataml/common/constants.py +88 -29
- teradataml/common/garbagecollector.py +2 -1
- teradataml/common/messagecodes.py +19 -3
- teradataml/common/messages.py +6 -1
- teradataml/common/sqlbundle.py +64 -12
- teradataml/common/utils.py +246 -47
- teradataml/common/warnings.py +11 -0
- teradataml/context/context.py +161 -27
- teradataml/data/amazon_reviews_25.csv +26 -0
- teradataml/data/byom_example.json +11 -0
- teradataml/data/dataframe_example.json +18 -2
- teradataml/data/docs/byom/docs/DataRobotPredict.py +2 -2
- teradataml/data/docs/byom/docs/DataikuPredict.py +40 -1
- teradataml/data/docs/byom/docs/H2OPredict.py +2 -2
- teradataml/data/docs/byom/docs/ONNXEmbeddings.py +242 -0
- teradataml/data/docs/byom/docs/ONNXPredict.py +2 -2
- teradataml/data/docs/byom/docs/PMMLPredict.py +2 -2
- teradataml/data/docs/sqle/docs_17_20/NaiveBayes.py +1 -1
- teradataml/data/docs/sqle/docs_17_20/Shap.py +34 -6
- teradataml/data/docs/sqle/docs_17_20/TDNaiveBayesPredict.py +4 -4
- teradataml/data/docs/sqle/docs_17_20/TextParser.py +3 -3
- teradataml/data/docs/tableoperator/docs_17_20/Image2Matrix.py +118 -0
- teradataml/data/docs/uaf/docs_17_20/CopyArt.py +145 -0
- teradataml/data/docs/uaf/docs_17_20/DWT2D.py +4 -1
- teradataml/data/docs/uaf/docs_17_20/DickeyFuller.py +18 -21
- teradataml/data/hnsw_alter_data.csv +5 -0
- teradataml/data/hnsw_data.csv +10 -0
- teradataml/data/jsons/byom/h2opredict.json +1 -1
- teradataml/data/jsons/byom/onnxembeddings.json +266 -0
- teradataml/data/jsons/sqle/17.20/TD_Shap.json +0 -1
- teradataml/data/jsons/sqle/17.20/TD_TextParser.json +1 -1
- teradataml/data/jsons/sqle/20.00/TD_HNSW.json +296 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWPredict.json +206 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWSummary.json +32 -0
- teradataml/data/jsons/sqle/20.00/TD_KMeans.json +250 -0
- teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +266 -0
- teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +278 -0
- teradataml/data/jsons/storedprocedure/17.20/TD_COPYART.json +71 -0
- teradataml/data/jsons/tableoperator/17.20/IMAGE2MATRIX.json +53 -0
- teradataml/data/jsons/uaf/17.20/TD_DICKEY_FULLER.json +10 -19
- teradataml/data/jsons/uaf/17.20/TD_SAX.json +3 -1
- teradataml/data/jsons/uaf/17.20/TD_WINDOWDFFT.json +15 -5
- teradataml/data/medical_readings.csv +101 -0
- teradataml/data/patient_profile.csv +101 -0
- teradataml/data/scripts/lightgbm/dataset.template +157 -0
- teradataml/data/scripts/lightgbm/lightgbm_class_functions.template +247 -0
- teradataml/data/scripts/lightgbm/lightgbm_function.template +216 -0
- teradataml/data/scripts/lightgbm/lightgbm_sklearn.template +159 -0
- teradataml/data/scripts/sklearn/sklearn_fit.py +194 -167
- teradataml/data/scripts/sklearn/sklearn_fit_predict.py +136 -115
- teradataml/data/scripts/sklearn/sklearn_function.template +14 -19
- teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +155 -137
- teradataml/data/scripts/sklearn/sklearn_transform.py +129 -42
- teradataml/data/target_udt_data.csv +8 -0
- teradataml/data/templates/open_source_ml.json +3 -2
- teradataml/data/teradataml_example.json +8 -0
- teradataml/data/vectordistance_example.json +4 -0
- teradataml/dataframe/copy_to.py +8 -3
- teradataml/dataframe/data_transfer.py +11 -1
- teradataml/dataframe/dataframe.py +1049 -285
- teradataml/dataframe/dataframe_utils.py +152 -20
- teradataml/dataframe/functions.py +578 -35
- teradataml/dataframe/setop.py +11 -6
- teradataml/dataframe/sql.py +185 -16
- teradataml/dbutils/dbutils.py +1049 -115
- teradataml/dbutils/filemgr.py +48 -1
- teradataml/hyperparameter_tuner/optimizer.py +12 -1
- teradataml/lib/aed_0_1.dll +0 -0
- teradataml/opensource/__init__.py +1 -1
- teradataml/opensource/_base.py +1466 -0
- teradataml/opensource/_class.py +464 -0
- teradataml/opensource/{sklearn/constants.py → _constants.py} +21 -14
- teradataml/opensource/_lightgbm.py +949 -0
- teradataml/opensource/_sklearn.py +1008 -0
- teradataml/opensource/{sklearn/_wrapper_utils.py → _wrapper_utils.py} +5 -6
- teradataml/options/__init__.py +54 -38
- teradataml/options/configure.py +131 -27
- teradataml/options/display.py +13 -2
- teradataml/plot/axis.py +47 -8
- teradataml/plot/figure.py +33 -0
- teradataml/plot/plot.py +63 -13
- teradataml/scriptmgmt/UserEnv.py +5 -5
- teradataml/scriptmgmt/lls_utils.py +130 -40
- teradataml/store/__init__.py +12 -0
- teradataml/store/feature_store/__init__.py +0 -0
- teradataml/store/feature_store/constants.py +291 -0
- teradataml/store/feature_store/feature_store.py +2318 -0
- teradataml/store/feature_store/models.py +1505 -0
- teradataml/table_operators/Apply.py +32 -18
- teradataml/table_operators/Script.py +3 -1
- teradataml/table_operators/TableOperator.py +3 -1
- teradataml/table_operators/query_generator.py +3 -0
- teradataml/table_operators/table_operator_query_generator.py +3 -1
- teradataml/table_operators/table_operator_util.py +37 -38
- teradataml/table_operators/templates/dataframe_register.template +69 -0
- teradataml/utils/dtypes.py +51 -2
- teradataml/utils/internal_buffer.py +18 -0
- teradataml/utils/validators.py +99 -8
- {teradataml-20.0.0.2.dist-info → teradataml-20.0.0.4.dist-info}/METADATA +321 -5
- {teradataml-20.0.0.2.dist-info → teradataml-20.0.0.4.dist-info}/RECORD +121 -94
- teradataml/libaed_0_1.dylib +0 -0
- teradataml/libaed_0_1.so +0 -0
- teradataml/opensource/sklearn/__init__.py +0 -1
- teradataml/opensource/sklearn/_class.py +0 -255
- teradataml/opensource/sklearn/_sklearn_wrapper.py +0 -1800
- {teradataml-20.0.0.2.dist-info → teradataml-20.0.0.4.dist-info}/WHEEL +0 -0
- {teradataml-20.0.0.2.dist-info → teradataml-20.0.0.4.dist-info}/top_level.txt +0 -0
- {teradataml-20.0.0.2.dist-info → teradataml-20.0.0.4.dist-info}/zip-safe +0 -0
teradataml/dbutils/dbutils.py
CHANGED
@@ -9,35 +9,45 @@ teradataml db utilities
 ----------
 A teradataml database utility functions provide interface to Teradata Vantage common tasks such as drop_table, drop_view, create_table etc.
 """
-import concurrent.futures
+import concurrent.futures
+import json
+import os
+import re
+import shutil
+import tempfile
 from datetime import datetime
+
 import pandas as pd
+from sqlalchemy import (CheckConstraint, Column, ForeignKeyConstraint,
+                        MetaData, PrimaryKeyConstraint, Table,
+                        UniqueConstraint)
 from sqlalchemy.sql.functions import Function
-from …
-from …
-from …
-from …
+from teradatasql import OperationalError
+from teradatasqlalchemy.dialect import TDCreateTablePost as post
+from teradatasqlalchemy.dialect import dialect as td_dialect
+from teradatasqlalchemy.dialect import preparer
+
+import teradataml.dataframe as tdmldf
+from teradataml.common.constants import (SessionParamsPythonNames,
+                                         SessionParamsSQL, SQLConstants,
+                                         TableOperatorConstants,
+                                         TeradataTableKindConstants)
 from teradataml.common.exceptions import TeradataMlException
-from teradataml.common.…
+from teradataml.common.messagecodes import MessageCodes
+from teradataml.common.messages import Messages
 from teradataml.common.sqlbundle import SQLBundle
-from teradataml.common.…
-from teradataml.…
-import teradataml.dataframe as tdmldf
+from teradataml.common.utils import UtilFuncs
+from teradataml.context import context as tdmlctx
 from teradataml.options.configure import configure
-from teradataml.utils.utils import execute_sql
-from teradataml.utils.validators import _Validators
-from teradataml.utils.internal_buffer import _InternalBuffer
-from teradatasql import OperationalError
-from teradatasqlalchemy.dialect import preparer, dialect as td_dialect
-from teradatasqlalchemy.dialect import TDCreateTablePost as post
 from teradataml.telemetry_utils.queryband import collect_queryband
-from sqlalchemy import Table, Column, MetaData, CheckConstraint, \
-    PrimaryKeyConstraint, ForeignKeyConstraint, UniqueConstraint
 from teradataml.utils.internal_buffer import _InternalBuffer
+from teradataml.utils.utils import execute_sql
+from teradataml.utils.validators import _Validators
 
 
 @collect_queryband(queryband='DrpTbl')
-def db_drop_table(table_name, schema_name=None):
+def db_drop_table(table_name, schema_name=None, suppress_error=False,
+                  datalake_name=None, purge=None):
     """
     DESCRIPTION:
         Drops the table from the given schema.
@@ -55,6 +65,28 @@ def db_drop_table(table_name, schema_name=None):
             Default Value: None
             Types: str
 
+        suppress_error:
+            Optional Argument
+            Specifies whether to raise error or not.
+            Default Value: False
+            Types: str
+
+        datalake_name:
+            Optional Argument
+            Specifies name of the datalake to drop table from.
+            Note:
+                "schema_name" must be provided while using this argument.
+            Default Value: None
+            Types: str
+
+        purge:
+            Optional Argument
+            Specifies whether to use purge clause or not while dropping datalake table.
+            It is only applicable when "datalake_name" argument is used. When "datalake_name" is specified,
+            but "purge" is not specified, data is purged by default.
+            Default Value: None
+            Types: bool
+
     RETURNS:
         True - if the operation is successful.
 
@@ -64,33 +96,56 @@ def db_drop_table(table_name, schema_name=None):
     EXAMPLES:
         >>> load_example_data("dataframe", "admissions_train")
 
-        # Drop table in current database
+        # Example 1: Drop table in current database.
         >>> db_drop_table(table_name = 'admissions_train')
 
-        # Drop table from the given schema
+        # Example 2: Drop table from the given schema.
         >>> db_drop_table(table_name = 'admissions_train', schema_name = 'alice')
+
+        #Example 3: Drop a table from datalake and purge the data.
+        >>> db_drop_table(table_name = 'datalake_table', schema_name = 'datalake_db',
+        ...               datalake_name='datalake', purge=True)
+
     """
     # Argument validations
     awu_matrix = []
     awu_matrix.append(["schema_name", schema_name, True, (str), True])
     awu_matrix.append(["table_name", table_name, False, (str), True])
-
+    awu_matrix.append(["datalake_name", datalake_name, True, (str), True])
+    awu_matrix.append(["purge", purge, True, (bool, type(None)), True])
    # Validate argument types
    _Validators._validate_function_arguments(awu_matrix)
 
+    # Process datalake related arguments.
+    purge_clause = None
+    if datalake_name is not None:
+        if schema_name is None:
+            err_ = Messages.get_message(MessageCodes.DEPENDENT_ARG_MISSING, "schema_name",
+                                        "datalake_name")
+            raise TeradataMlException(err_, MessageCodes.DEPENDENT_ARG_MISSING)
+
+        if purge is False:
+            purge_clause = "NO PURGE"
+        else:
+            purge_clause = "PURGE ALL"
+
    # Joining view and schema names in the format "schema_name"."view_name"
-    table_name = _get_quoted_object_name(schema_name, table_name)
+    table_name = _get_quoted_object_name(schema_name, table_name, datalake_name)
 
    try:
-        return UtilFuncs._drop_table(table_name)
-    except TeradataMlException:
-        …
-        …
-        …
+        return UtilFuncs._drop_table(table_name, purge_clause=purge_clause)
+    except (TeradataMlException, OperationalError):
+        if suppress_error:
+            pass
+        else:
+            raise
    except Exception as err:
-        …
-        …
-        …
+        if suppress_error:
+            pass
+        else:
+            raise TeradataMlException(Messages.get_message(MessageCodes.DROP_FAILED, "table",
+                                                           table_name),
+                                      MessageCodes.DROP_FAILED) from err
 
 
 @collect_queryband(queryband='DrpVw')
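The new suppress_error flag turns drop failures (both TeradataMlException and the driver's OperationalError) into silent no-ops, which suits idempotent cleanup. A minimal sketch of that usage, with hypothetical staging table names:

    # Hypothetical cleanup at the start of a load script: the staging tables
    # may or may not exist yet, so DROP failures are swallowed instead of raised.
    from teradataml import db_drop_table

    for staging_table in ("stg_orders", "stg_customers"):
        db_drop_table(table_name=staging_table, suppress_error=True)

Note the purge default for datalake tables in the hunk above: omitting purge while passing datalake_name generates PURGE ALL, so pass purge=False explicitly to keep the data files.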
@@ -152,7 +207,7 @@ def db_drop_view(view_name, schema_name=None):
 
 
 @collect_queryband(queryband='LstTbls')
-def db_list_tables(schema_name=None, object_name=None, object_type='all'):
+def db_list_tables(schema_name=None, object_name=None, object_type='all', datalake_name=None):
     """
     DESCRIPTION:
         Lists the Vantage objects(table/view) names for the specified schema name.
@@ -169,10 +224,12 @@ def db_list_tables(schema_name=None, object_name=None, object_type='all'):
            Optional Argument.
            Specifies a table/view name or pattern to be used for filtering them from the database.
            Pattern may contain '%' or '_' as pattern matching characters.
-            …
-            …
-            …
-            …
+            - '%' represents any string of zero or more arbitrary characters. Any string of characters is acceptable as
+              a replacement for the percent.
+            - '_' represents exactly one arbitrary character. Any single character is acceptable in the position in
+              which the underscore character appears.
+            Note:
+                * If '%' is specified in 'object_name', then the '_' character is not evaluated for an arbitrary character.
            Default Value: None
            Types: str
            Example:
@@ -191,6 +248,14 @@ def db_list_tables(schema_name=None, object_name=None, object_type='all'):
            Default Value: 'all'
            Types: str
 
+        datalake_name:
+            Optional Argument.
+            Specifies the name of datalake to list tables from.
+            Note:
+                "schema_name" must be provided while using this argument.
+            Default Value: None
+            Types: str
+
    RETURNS:
        Pandas DataFrame
 
@@ -199,38 +264,40 @@ def db_list_tables(schema_name=None, object_name=None, object_type='all'):
        OperationalError - If any errors are raised from Vantage.
 
    EXAMPLES:
-        # Example 1
+        # Example 1: List all object types in the default schema
        >>> load_example_data("dataframe", "admissions_train")
        >>> db_list_tables()
 
-        # Example 2
+        # Example 2: List all the views in the default schema
        >>> execute_sql("create view temporary_view as (select 1 as dummy_col1, 2 as dummy_col2);")
        >>> db_list_tables(None , None, 'view')
 
-        # Example 3
-        # …
+        # Example 3: List all the object types in the default schema whose names begin with 'abc' followed by any number
+        # of characters in the end.
        >>> execute_sql("create view abcd123 as (select 1 as dummy_col1, 2 as dummy_col2);")
-        >>> db_list_tables(None, '…
+        >>> db_list_tables(None, 'abc%', None)
 
-        # Example 4
-        # …
+        # Example 4: List all the tables in the default schema whose names begin with 'adm' followed by any number of
+        # characters and ends with 'train'.
        >>> load_example_data("dataframe", "admissions_train")
-        >>> db_list_tables(None, '…
+        >>> db_list_tables(None, 'adm%train', 'table')
 
-        # Example 5
+        # Example 5: List all the views in the default schema whose names begin with any character but ends with 'abc'
        >>> execute_sql("create view view_abc as (select 1 as dummy_col1, 2 as dummy_col2);")
        >>> db_list_tables(None, '%abc', 'view')
 
-        # Example 6
+        # Example 6: List all the volatile tables in the default schema whose names begin with 'abc' and ends with any
        # arbitrary character and has a length of 4
        >>> execute_sql("CREATE volatile TABLE abcd(col0 int, col1 float) NO PRIMARY INDEX;")
        >>> db_list_tables(None, 'abc_', 'volatile')
 
-        # Example 7
+        # Example 7: List all the temporary objects created by teradataml in the default schema whose names begins and
        # ends with any number of arbitrary characters but contains 'filter' in between.
        >>> db_list_tables(None, '%filter%', 'temp')
-    """
 
+        # Example 8: List all the tables in datalake's database.
+        >>> db_list_tables(schema_name='datalake_db_name', datalake_name='datalake_name')
+    """
    if tdmlctx.get_connection() is None:
        raise TeradataMlException(Messages.get_message(MessageCodes.INVALID_CONTEXT_CONNECTION),
                                  MessageCodes.INVALID_CONTEXT_CONNECTION)
@@ -245,12 +312,18 @@ def db_list_tables(schema_name=None, object_name=None, object_type='all'):
                              TeradataTableKindConstants.VOLATILE.value,
                              TeradataTableKindConstants.TEMP.value]
    awu_matrix.append(["object_type", object_type, True, (str), True, permitted_object_types])
-
+    awu_matrix.append(["datalake_name", datalake_name, True, (str), True])
    # Validate argument types
    _Validators._validate_function_arguments(awu_matrix)
 
+    # 'schema_name' must be provided while using 'datalake_name'.
+    _Validators._validate_dependent_argument(dependent_arg='datalake_name',
+                                             dependent_arg_value=datalake_name,
+                                             independent_arg='schema_name',
+                                             independent_arg_value=schema_name)
+
    try:
-        return _get_select_table_kind(schema_name, object_name, object_type)
+        return _get_select_table_kind(schema_name, object_name, object_type, datalake_name)
    except TeradataMlException:
        raise
    except OperationalError:
@@ -260,21 +333,49 @@ def db_list_tables(schema_name=None, object_name=None, object_type='all'):
                                  MessageCodes.LIST_DB_TABLES_FAILED) from err
 
 
-def _get_select_table_kind(schema_name, table_name, table_kind):
+def _convert_sql_search_string_to_regex(sql_str):
+    """Internal function to convert SQL string matching patterns to python regex."""
+    if sql_str:
+        # sql_str[1:-1] Removes single quotes from sql_str.
+        sql_str = sql_str[1:-1]
+
+        # If '%' is specified in 'sql_str',
+        # then the '_' character is not evaluated for an arbitrary character.
+        if '%' in sql_str:
+            # Replace % with .* if not preceded by a backslash.
+            sql_str = re.sub(r'(?<!\\)%', r'.*', sql_str, flags=re.IGNORECASE)
+            # Remove the escape character for the replacements.
+            sql_str = sql_str.replace(r'\%', '%')
+        else:
+            # Replace _ with . if not preceded by a backslash.
+            sql_str = re.sub(r'(?<!\\)_', r'.', sql_str, flags=re.IGNORECASE)
+            # Remove the escape character for the replacements.
+            sql_str = sql_str.replace(r'\_', '_')
+
+        # Add boundaries if the string doesn't start or end with '.*' i.e. SQL '%'.
+        if not sql_str.startswith('.*'):
+            sql_str = '^' + sql_str  # Anchor to the start of the string.
+        if not sql_str.endswith('.*'):
+            sql_str = sql_str + '$'  # Anchor to the end of the string.
+    return sql_str
+
+
+def _get_select_table_kind(schema_name, table_name, table_kind, datalake_name):
    """
-    Get the list of the table names from the specified schema name.
+    Get the list of the table names from the specified schema name and datalake.
 
    PARAMETERS:
        schema_name - The Name of schema in the database. The default value is the current database name.
        table_name - The pattern to be used to filtering the table names from the database.
-                     The table name argument can contain '%' as pattern matching …
-                     will return all table names starting with any …
+                     The table name argument can contain '%' as pattern matching character.For example '%abc'
+                     will return all table names starting with any characters and ending with abc.
        table_kind - The table kind to apply the filter. The valid values are 'all','table','view','volatile','temp'.
                     all - list the all the table kinds.
                     table - list only tables.
                     view - list only views.
                     volatile - list only volatile temp.
                     temp - list all teradata ml temporary objects created in the specified database.
+        datalake_name - The name of datalake to search schema in.
    RETURNS:
        Panda's DataFrame - if the operation is successful.
 
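To make the conversion rules concrete, here is a standalone re-implementation for illustration (the helper name sql_like_to_regex is mine, not the package's): the function receives the pattern still wrapped in single quotes, strips them, rewrites unescaped SQL wildcards into regex, and anchors whichever ends are not open-ended.

    import re

    def sql_like_to_regex(sql_str):
        # Same conversion as _convert_sql_search_string_to_regex, assuming the
        # input arrives quoted, e.g. "'abc%'".
        sql_str = sql_str[1:-1]                            # strip the quotes
        if '%' in sql_str:
            sql_str = re.sub(r'(?<!\\)%', r'.*', sql_str)  # unescaped '%' -> '.*'
            sql_str = sql_str.replace(r'\%', '%')          # '\%' -> literal '%'
        else:
            sql_str = re.sub(r'(?<!\\)_', r'.', sql_str)   # unescaped '_' -> '.'
            sql_str = sql_str.replace(r'\_', '_')          # '\_' -> literal '_'
        if not sql_str.startswith('.*'):
            sql_str = '^' + sql_str                        # anchor the start
        if not sql_str.endswith('.*'):
            sql_str = sql_str + '$'                        # anchor the end
        return sql_str

    assert sql_like_to_regex("'abc%'") == '^abc.*'
    assert sql_like_to_regex("'%filter%'") == '.*filter.*'
    assert sql_like_to_regex("'abc_'") == '^abc.$'

One consequence of the '%'-first branch: in a pattern such as 'a_c%', the underscore is kept as a literal character, which matches the Note added to the db_list_tables docstring above.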
@@ -289,60 +390,106 @@ def _get_select_table_kind(schema_name, table_name, table_kind):
        object_name_str = "'{0}'".format(table_name)
    object_table_kind = None
 
-    # …
-    …
-    …
-    …
-    # …
-    …
-    …
-    …
-    …
-    …
-    …
-    …
-    …
-    # 'V' - stands for View
-    if (table_kind == TeradataTableKindConstants.TABLE.value):
-        object_table_kind = "'{0}','{1}','{2}'".format('O', 'Q', 'T')
-    elif (table_kind == TeradataTableKindConstants.VIEW.value):
-        object_table_kind = "'{0}'".format('V')
-    elif (table_kind == TeradataTableKindConstants.TEMP.value):
-        if table_name is None:
-            object_name_str = "'{0}'".format(TeradataTableKindConstants.ML_PATTERN.value)
-        else:
-            object_name_str = "'{0}','{1}'".format(table_name,
-                                                   TeradataTableKindConstants.ML_PATTERN.value)
+    # Tablekind:
+    # 'O' - stands for Table with no primary index and no partitioning
+    # 'Q' - stands for Queue table
+    # 'T' - stands for a Table with a primary index or primary AMP index, partitioning, or both.
+    #       Or a partitioned table with NoPI
+    # 'V' - stands for View
+    if (table_kind == TeradataTableKindConstants.TABLE.value):
+        object_table_kind = ['O', 'Q', 'T']
+    elif (table_kind == TeradataTableKindConstants.VIEW.value):
+        object_table_kind = ['V']
+    elif (table_kind == TeradataTableKindConstants.TEMP.value):
+        if table_name is None:
+            object_name_str = "'{0}'".format(TeradataTableKindConstants.ML_PATTERN.value)
        else:
-            …
-            …
-            …
-            …
-            …
-            …
-            …
+            object_name_str = "'{0}','{1}'".format(table_name,
+                                                   TeradataTableKindConstants.ML_PATTERN.value)
+    else:
+        object_table_kind = ['O', 'Q', 'T', 'V']
+
+    if datalake_name is None:
+        # Check the schema name.
+        if schema_name is None:
+            schema_name = tdmlctx._get_current_databasename()
+
+        # Create an empty dataframe with desired column name.
+        pddf = pd.DataFrame(columns=[TeradataTableKindConstants.REGULAR_TABLE_NAME.value])
+
+        # Check the table kind.
+        if table_kind != TeradataTableKindConstants.VOLATILE.value:
+            if object_table_kind is not None:
+                object_table_kind = ', '.join([f"'{value}'" for value in object_table_kind])
+            query = SQLBundle._build_select_table_kind(schema_name, object_name_str, object_table_kind)
+            pddf = pd.read_sql(query, tdmlctx.td_connection.connection)
+
+        # Check if all table kind or volatile table kind is requested.
+        # If so,add volatile tables to the pddf.
+        if table_kind == TeradataTableKindConstants.ALL.value or \
+                table_kind == TeradataTableKindConstants.VOLATILE.value:
+            # Create list of volatile tables.
            try:
-                # Add volatile tables to all dataframe.
                vtquery = SQLBundle._build_help_volatile_table()
                vtdf = pd.read_sql(vtquery, tdmlctx.td_connection.connection)
                if not vtdf.empty:
+                    # Volatile table query returns different column names.
+                    # So, rename its column names to match with normal
+                    # 'SELECT TABLENAME FROM DBC.TABLESV' query results.
                    columns_dict = {TeradataTableKindConstants.VOLATILE_TABLE_NAME.value:
                                    TeradataTableKindConstants.REGULAR_TABLE_NAME.value}
                    vtdf.rename(columns=columns_dict, inplace=True)
+                    # Volatile table names might contain leading whitespaces. Remove those.
+                    vtdf[TeradataTableKindConstants.REGULAR_TABLE_NAME.value] = vtdf[TeradataTableKindConstants.REGULAR_TABLE_NAME.value].str.strip()
+                    # Filter volatile tables using table name pattern.
+                    if object_name_str and (object_name_str := _convert_sql_search_string_to_regex(object_name_str)):
+                        name_filter = vtdf[TeradataTableKindConstants.REGULAR_TABLE_NAME.value].str.strip().str.match(
+                            object_name_str,
+                            na=False,
+                            flags=re.IGNORECASE)
+                        vtdf = vtdf[name_filter]
+                    # Concat existing list with volatile tables list.
                    frames = [pddf, vtdf[[TeradataTableKindConstants.REGULAR_TABLE_NAME.value]]]
                    pddf = pd.concat(frames)
                    pddf.reset_index(drop=True, inplace=True)
            except Exception as err:
-                # No …
+                # No volatile tables exist.
                pass
-        if (table_kind == TeradataTableKindConstants.VOLATILE.value):
-            columns_dict = {TeradataTableKindConstants.VOLATILE_TABLE_NAME.value:
-                            TeradataTableKindConstants.REGULAR_TABLE_NAME.value}
-            pddf.rename(columns=columns_dict, inplace=True)
-            return pddf[[TeradataTableKindConstants.REGULAR_TABLE_NAME.value]]
        else:
            return pddf
-
+    else:
+        # TODO: when OTF team enables VSD support for datalake tables
+        # with epic: https://teradata-pe.atlassian.net/browse/OTF-454,
+        # this can be changed to use VSD_tablesV table which is
+        # similar to DBC.TABLESV.
+        # For datalake tables' information we need to use help database and
+        # then apply filter for table kind and table substring.
+        # We can't use select from DBC.TABLESV.
+        sqlbundle = SQLBundle()
+        help_db_sql = sqlbundle._get_sql_query(SQLConstants.SQL_HELP_DATABASE)
+        pddf = pd.read_sql(help_db_sql.format(_get_quoted_object_name(schema_name=datalake_name,
+                                                                      object_name=schema_name)),
+                           tdmlctx.td_connection.connection)
+
+        if object_name_str:
+            object_name_str = _convert_sql_search_string_to_regex(object_name_str)
+            if object_name_str:
+                name_filter = pddf['Table/View/Macro Name'].str.strip().str.match(object_name_str, na=False,
+                                                                                  flags=re.IGNORECASE)
+                pddf = pddf[name_filter]
+
+        if object_table_kind is not None:
+            object_filter = pddf['Kind'].isin(object_table_kind)
+            pddf = pddf[object_filter]
+
+        columns_dict = {'Table/View/Macro Name':
+                        TeradataTableKindConstants.REGULAR_TABLE_NAME.value}
+        pddf.rename(columns=columns_dict, inplace=True)
+
+        # Return only filtered columns.
+        if not pddf.empty:
+            return pddf[[TeradataTableKindConstants.REGULAR_TABLE_NAME.value]]
+        else:
            return pd.DataFrame()
 
 
@@ -390,7 +537,7 @@ def _execute_transaction(queries):
            for query in queries:
                cur.execute(query)
 
-            # Try committing the …
+            # Try committing the transaction
            con.commit()
        except Exception:
            # Let's first rollback
@@ -402,6 +549,73 @@ def _execute_transaction(queries):
            cur.execute(auto_commit_on)
 
 
+def db_transaction(func):
+    """
+    DESCRIPTION:
+        Function to execute another function in a transaction.
+
+    PARAMETERS:
+        func:
+            Required Argument.
+            Specifies the function to be executed in a single transaction.
+            Types: function
+
+    RETURNS:
+        The object returned by "func".
+
+    RAISES:
+        TeradataMlException, OperationalError
+
+    EXAMPLES:
+        # Example: Declare a function to delete all the records from two tables
+        #          and execute the function in a transaction.
+        >>> @db_transaction
+        ... def insert_data(table1, table2):
+        ...     execute_sql("delete from {}".format(table1))
+        ...     execute_sql("delete from {}".format(table2))
+        ...     return True
+        >>> # Executing the above function in a transaction.
+        >>> insert_data("sales", "admissions_train")
+        True
+        >>>
+    """
+
+    def execute_transaction(*args, **kwargs):
+        auto_commit_off = "{fn teradata_nativesql}{fn teradata_autocommit_off}"
+        auto_commit_on = "{fn teradata_nativesql}{fn teradata_autocommit_on}"
+        con = None
+        cur = None
+
+        result = None
+        try:
+            con = tdmlctx.td_connection
+            if con is None:
+                raise TeradataMlException(Messages.get_message(MessageCodes.CONNECTION_FAILURE),
+                                          MessageCodes.CONNECTION_FAILURE)
+            con = con.connection
+            cur = con.cursor()
+            # Set auto_commit to OFF.
+            cur.execute(auto_commit_off)
+
+            # Execute function.
+            result = func(*args, **kwargs)
+
+            # Try committing the transaction.
+            con.commit()
+        except Exception:
+            # Let's first rollback.
+            con.rollback()
+            # Now, let's raise the error as is.
+            raise
+        finally:
+            # Finally, we must set auto_commit to ON.
+            cur.execute(auto_commit_on)
+
+        return result
+
+    return execute_transaction
+
+
 def _execute_stored_procedure(function_call, fetchWarnings=True, expect_none_result=False):
    """
    DESCRIPTION:
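The decorator's value shows when one statement inside the wrapped function fails: autocommit is off for the whole call, so the rollback() in the except branch undoes statements that already ran. A hedged sketch, using the same bare execute_sql as the docstring example and hypothetical table names:

    # If the second delete fails (say the table does not exist), the first
    # delete is rolled back as well, leaving "sales" untouched.
    @db_transaction
    def clear_tables():
        execute_sql("delete from sales")
        execute_sql("delete from no_such_table")  # raises -> rollback

    try:
        clear_tables()
    except Exception:
        pass  # "sales" still has all of its rows.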
@@ -499,7 +713,7 @@ def _get_function_call_as_string(sqlcFuncObj):
    return str(sqlcFuncObj.compile(**kw))
 
 
-def _get_quoted_object_name(schema_name, object_name):
+def _get_quoted_object_name(schema_name, object_name, datalake=None):
    """
    DESCRIPTION:
        This function quotes and joins schema name to the object name which can either be table or a view.
@@ -508,12 +722,18 @@ def _get_quoted_object_name(schema_name, object_name):
        schema_name
            Required Argument.
            Specifies the schema name.
-            …
+            Type: str
 
        object_name
            Required Argument.
            Specifies the object name either table or view.
-            …
+            Type: str
+
+        datalake
+            Optional Argument.
+            Specifies the datalake name.
+            Default value: None
+            Type: str
 
    RAISES:
        None
@@ -535,6 +755,8 @@ def _get_quoted_object_name(schema_name, object_name):
        schema_name = tdp.quote(tdmlctx._get_current_databasename())
 
    quoted_object_name = "{0}.{1}".format(schema_name, tdp.quote(object_name))
+    if datalake is not None:
+        quoted_object_name = "{}.{}".format(tdp.quote(datalake), quoted_object_name)
    return quoted_object_name
 
 
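With the new datalake argument the helper now emits a three-part dotted name. Conceptually (the names below are illustrative, and actual quoting is delegated to the teradatasqlalchemy preparer, which quotes identifiers as needed):

    _get_quoted_object_name("sales_db", "orders")
    # -> sales_db.orders
    _get_quoted_object_name("sales_db", "orders", "my_lake")
    # -> my_lake.sales_db.orders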
@@ -635,7 +857,6 @@ def view_log(log_type="script", num_lines=1000, query_id=None, log_dir=None):
    # Validate num_lines is a positive integer.
    _Validators._validate_positive_int(num_lines, "num_lines")
 
-
    # Query for viewing last n lines of script log.
    view_log_query = TableOperatorConstants.SCRIPT_LOG_QUERY.value \
        .format(num_lines, configure.default_varchar_size)
@@ -656,8 +877,9 @@ def view_log(log_type="script", num_lines=1000, query_id=None, log_dir=None):
            err_msg = 'Please provide directory path instead of file path.'.format(
                log_dir)
            raise TeradataMlException(err_msg, MessageCodes.INPUT_FILE_NOT_FOUND)
-        from teradataml.scriptmgmt.UserEnv import _get_auth_token, …
-        …
+        from teradataml.scriptmgmt.UserEnv import (_get_auth_token,
+                                                   _get_ues_url,
+                                                   _process_ues_response)
        ues_url = _get_ues_url(logs=True, query_id=query_id)
        response = UtilFuncs._http_request(ues_url, headers=_get_auth_token())
        resp = _process_ues_response(api_name="view_log", response=response)
@@ -721,9 +943,10 @@ def _fetch_url_and_save(url, file_path):
 def _check_if_python_packages_installed():
    """
    DESCRIPTION:
-        Function to set global …
-        …
-        …
+        Function to set the following global variables based on whether the Vantage node
+        has Python and add-on packages including pip3 installed.
+        - 'python_packages_installed' to True or False
+        - 'python_version_vantage' to the version of Python installed on Vantage.
 
    PARAMETERS:
        None.
@@ -737,14 +960,21 @@ def _check_if_python_packages_installed():
    EXAMPLES:
        _check_if_python_packages_installed()
    """
+    if tdmlctx.python_packages_installed:
+        # Skip check if Python and add-on packages are already installed and checked.
+        return
+
    # Check if Python interpreter and add-ons packages are installed or not.
    try:
        query = TableOperatorConstants.CHECK_PYTHON_INSTALLED.value.format(configure.indb_install_location)
-        UtilFuncs._execute_query(query=query)
+        opt = UtilFuncs._execute_query(query=query)
+
+        python_version = opt[0][0].split(" -- ")[1].split(" ")[1].strip()
 
        # If query execution is successful, then Python and add-on packages are
        # present.
        tdmlctx.python_packages_installed = True
+        tdmlctx.python_version_vantage = python_version
    except Exception as err:
        # Raise Exception if the error message does not contain
        # "bash: pip3: command not found".
@@ -855,6 +1085,203 @@ def db_python_package_details(names=None):
    return ret_val
 
 
+def _db_python_package_version_diff(packages=None, only_diff=True):
+    """
+    DESCRIPTION:
+        Internal function to get the pandas dataframe containing the difference in the Python
+        packages installed on Vantage and the packages mentioned in the argument "packages".
+        Note:
+            * Using this function is valid only when Python interpreter and add-on packages
+              are installed on the Vantage node.
+            * This function also checks for differences in Python packages versions given
+              part of package name as string.
+            * Returns pandas dataframe of only differences when the argument `only_diff` is set to
+              True. Otherwise, returns all the packages.
+
+    PARAMETERS:
+        packages:
+            Required Argument.
+            Specifies the name(s) of the Python package(s) for which the difference
+            in the versions is to be fetched from Vantage.
+            Note:
+                * If this argument is None, all the packages installed on Vantage are considered.
+                * If any package is present in Vantage but not in the current environment, then None
+                  is shown as the version of the package in the current environment.
+            Types: str or list of str
+
+        only_diff:
+            Optional Argument.
+            Specifies whether to return only the differences in the versions of the packages
+            installed on Vantage and the packages mentioned in the argument "packages".
+            Default Value: True
+
+    RETURNS:
+        pandas DataFrame
+
+    RAISES:
+        TeradataMlException.
+
+    EXAMPLES:
+        # Note:
+        #     These examples will work only when the Python packages are installed on Vantage.
+
+        # Example 1: Get the difference in the versions of Python packages 'dill' and 'matplotlib'
+        #            installed on Vantage.
+        >>> _db_python_package_version_diff(["dill", "matplotlib"])
+           package vantage  local
+        0     dill   0.3.6  0.3.7
+
+        # Example 2: Get the difference in the versions of Python packages 'dill' and 'matplotlib'
+        #            installed on Vantage and 'only_diff' argument set to False.
+        >>> _db_python_package_version_diff(["dill", "matplotlib"], only_diff=False)
+                     package vantage  local
+        0  matplotlib-inline   0.1.6  0.1.6
+        1               dill   0.3.6  0.3.7
+        2         matplotlib   3.6.2  3.6.2
+    """
+    # Check if Python interpreter and add-on packages are installed or not.
+    _check_if_python_packages_installed()
+
+    # Raise error if Python and add-on packages are not installed.
+    if not tdmlctx.python_packages_installed:
+        raise TeradataMlException(Messages.get_message(MessageCodes.PYTHON_NOT_INSTALLED),
+                                  MessageCodes.PYTHON_NOT_INSTALLED)
+
+    # Installed packages dictionary.
+    db_pkg_df = db_python_package_details(packages)
+    if db_pkg_df is None:
+        return None
+
+    pkgs_dict = {row.package: row.version for row in db_pkg_df.itertuples()}
+
+    from importlib.metadata import PackageNotFoundError, version
+    diff_list = []
+
+    for pkg in pkgs_dict.keys():
+        vantage_version = pkgs_dict.get(pkg)
+        try:
+            local_version = version(pkg)
+        except PackageNotFoundError:
+            # If package is not found in the current environment, then the local version is set to None.
+            local_version = None
+        except Exception as e:
+            # Any other exception is raised.
+            raise
+
+        if only_diff:
+            if vantage_version != local_version:
+                # Add to list only when the versions are different.
+                diff_list.append([pkg, vantage_version, local_version])
+        else:
+            # Add to list all the packages and versions irrespective of the differences.
+            diff_list.append([pkg, vantage_version, local_version])
+
+    return pd.DataFrame(diff_list, columns=["package", "vantage", "local"])
+
+
+@collect_queryband(queryband='PythonDiff')
+def db_python_version_diff():
+    """
+    DESCRIPTION:
+        Function to get the difference of the Python intepreter major version installed on Vantage
+        and the Python version used in the current environment.
+
+        Note:
+            * Using this function is valid only when Python interpreter and add-on packages
+              are installed on the Vantage node.
+
+    RETURNS:
+        Empty dictionary when Python major version is same on Vantage and the current environment.
+        Otherwise, returns a dictionary with the following keys:
+            - 'vantage_version': Python major version installed on Vantage.
+            - 'local_version': Python major version used in the current environment.
+
+    RAISES:
+        TeradataMlException.
+
+    EXAMPLES:
+        # Note:
+        #     These examples will work only when the Python packages are installed on Vantage.
+
+        # Example 1: Get the difference in the Python version installed on Vantage and the current environment.
+        >>> db_python_version_diff()
+        {"vantage_version": "3.7", "local_version": "3.8"}
+    """
+    # Check if Python interpretor and add-on packages are installed or not.
+    _check_if_python_packages_installed()
+
+    # Raise error if Python and add-on packages are not installed.
+    if not tdmlctx.python_packages_installed:
+        raise TeradataMlException(Messages.get_message(MessageCodes.PYTHON_NOT_INSTALLED),
+                                  MessageCodes.PYTHON_NOT_INSTALLED)
+
+    # Get major version of python installed on Vantage and the current environment.
+    python_local = tdmlctx.python_version_local.rsplit(".", 1)[0]
+    python_vantage = tdmlctx.python_version_vantage.rsplit(".", 1)[0]
+
+    if python_local != python_vantage:
+        return {"vantage_version": python_vantage, "local_version": python_local}
+
+    return {}
+
+
+@collect_queryband(queryband='PkgDiff')
+def db_python_package_version_diff(packages=None):
+    """
+    DESCRIPTION:
+        Function to get the difference of the Python packages installed on Vantage and
+        in the current environment mentioned in the argument "packages".
+
+        Notes:
+            * Using this function is valid only when Python interpreter and add-on packages
+              are installed on the Vantage node.
+            * This function also checks for differences in Python packages versions given
+              part of package name as string.
+
+    PARAMETERS:
+        packages:
+            Optional Argument.
+            Specifies the name(s) of the Python package(s) for which the difference
+            in the versions is to be fetched from Vantage.
+            Notes:
+                * If this argument is None, all the packages installed on Vantage are considered.
+                * If any package is present in Vantage but not in the current environment, then None
+                  is shown as the version of the package in the current environment.
+            Types: str or list of str
+
+    RETURNS:
+        pandas DataFrame
+
+    RAISES:
+        TeradataMlException.
+
+    EXAMPLES:
+        # Note:
+        #     These examples will work only when the Python packages are installed on Vantage.
+
+        # Example 1: Get the difference in the versions of Python package 'dill' installed on Vantage.
+        >>> db_python_package_version_diff("dill")
+          package vantage   local
+        0    dill  0.10.0  0.11.2
+
+        # Example 2: Get the difference in the versions of all Python packages installed on Vantage.
+        >>> db_python_package_version_diff()
+                  package vantage   local
+        0    scikit-learn   1.3.3  0.24.2
+        1            dill  0.10.0  0.11.2
+        ...
+        532         attrs  18.2.0  17.0.0
+
+    """
+    # Validate arguments.
+    __arg_info_matrix = []
+    __arg_info_matrix.append(["packages", packages, True, (str, list), True])
+
+    _Validators._validate_function_arguments(arg_list=__arg_info_matrix)
+
+    return _db_python_package_version_diff(packages=packages)
+
+
 def _create_table(table_name,
                  columns,
                  primary_index=None,
@@ -983,7 +1410,8 @@ def _create_table(table_name,
        else:
            pti = pti.no_primary_index()
 
-        con_form=[]
+        con_form = []
+        foreign_constraints = []
        for c_name, parameters in kwargs.items():
            _Validators._validate_function_arguments([["constraint_type", c_name, True, str,
                                                       True, SQLConstants.CONSTRAINT.value]])
@@ -992,9 +1420,21 @@ def _create_table(table_name,
                [con_form.append("{}('{}')".format("CheckConstraint", col)) for col in parameters]
            if c_name in 'foreign_key_constraint':
                parameters = parameters if isinstance(parameters[0], tuple) else [tuple(parameters)]
-                …
-                …
-                …
+                # Every element in parameter is 3 elements.
+                # 1st element and 2nd element also a list. 3rd element is name of ForeignKey.
+                for fk_columns, fk_ref_columns, fk_name in parameters:
+                    fk_ref_column_objs = []
+
+                    # fk_ref_columns is in this format - table_name.column_name .
+                    # There is no provision for schema name here.
+                    # sqlalchemy is not accepting this notation here - schema_name.table_name.column_name
+                    # So, create Column Object and bind schema name and table name to it.
+                    for fk_ref_column in fk_ref_columns:
+                        ref_column_table, ref_column = fk_ref_column.split(".")
+                        t = Table(ref_column_table, MetaData(), Column(ref_column), schema=schema_name)
+                        fk_ref_column_objs.append(getattr(t, "c")[ref_column])
+                    foreign_constraints.append(ForeignKeyConstraint(fk_columns, fk_ref_column_objs, fk_name))
+
            if c_name in ['primary_key_constraint', 'unique_key_constraint']:
                c_name = "UniqueConstraint" if c_name in 'unique_key_constraint' else 'PrimaryKeyConstraint'
                parameters = UtilFuncs._as_list(parameters)
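The loop above works around a sqlalchemy limitation the comments describe: string column references in ForeignKeyConstraint only carry table.column, with no slot for a schema. A self-contained sketch of the same trick, with hypothetical table and column names:

    from sqlalchemy import Column, ForeignKeyConstraint, Integer, MetaData, Table

    # Bind the referenced table to an explicit schema, so the generated DDL is
    # schema-qualified even though "orders.order_id" as a string could not be.
    orders = Table("orders", MetaData(), Column("order_id", Integer), schema="alice")

    items = Table(
        "order_items", MetaData(),
        Column("order_id", Integer),
        # Pass Column objects (orders.c.order_id) instead of a
        # "schema.table.column" string, which sqlalchemy rejects.
        ForeignKeyConstraint(["order_id"], [orders.c.order_id], "fk_items_orders"),
        schema="alice",
    )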
@@ -1007,7 +1447,9 @@ def _create_table(table_name,
                    " columns.items()),{} teradatasql_post_create=pti,prefixes=prefix," \
                    "schema=schema_name)".format("" if con_form is None else ",".join(con_form))
 
-        table=eval(table_str)
+        table = eval(table_str)
+        for foreign_constraint in foreign_constraints:
+            table.append_constraint(foreign_constraint)
        table.create(bind=tdmlctx.get_context())
 
    except Exception as err:
@@ -1015,6 +1457,372 @@ def _create_table(table_name,
|
|
|
1015
1457
|
raise TeradataMlException(Messages.get_message(msg_code, "create table", str(err)), msg_code)
|
|
1016
1458
|
|
|
1017
1459
|
|
|
1460
|
+
def _create_database(schema_name, size='10e6', spool_size=None,
|
|
1461
|
+
datalake=None, **kwargs):
|
|
1462
|
+
"""
|
|
1463
|
+
DESCRIPTION:
|
|
1464
|
+
Internal function to create a database with the specified name and size.
|
|
1465
|
+
|
|
1466
|
+
PARAMETERS:
|
|
1467
|
+
schema_name:
|
|
1468
|
+
Required Argument.
|
|
1469
|
+
Specifies the name of the database to create.
|
|
1470
|
+
Types: str
|
|
1471
|
+
|
|
1472
|
+
size:
|
|
1473
|
+
Optional Argument.
|
|
1474
|
+
Specifies the number of bytes to allocate to new database.
|
|
1475
|
+
Note:
|
|
1476
|
+
Exponential notation can also be used.
|
|
1477
|
+
Types: str or int
|
|
1478
|
+
|
|
1479
|
+
spool_size:
|
|
1480
|
+
Optional Argument.
|
|
1481
|
+
Specifies the number of bytes to allocate to new database
|
|
1482
|
+
for spool space.
|
|
1483
|
+
Note:
|
|
1484
|
+
Exponential notation can also be used.
|
|
1485
|
+
Types: str or int
|
|
1486
|
+
|
|
1487
|
+
datalake:
|
|
1488
|
+
Optional Argument.
|
|
1489
|
+
Specifies the name of datalake to create database in.
|
|
1490
|
+
Types: str
|
|
1491
|
+
|
|
1492
|
+
kwargs:
|
|
1493
|
+
Optional Argument.
|
|
1494
|
+
Specifies keyword arguments which are used in DBPROPERTIES
|
|
1495
|
+
clause as key-value pair while creating datalake database.
|
|
1496
|
+
|
|
1497
|
+
RETURNS:
|
|
1498
|
+
bool
|
|
1499
|
+
|
|
1500
|
+
RAISES:
|
|
1501
|
+
TeradataMlException.
|
|
1502
|
+
|
|
1503
|
+
EXAMPLES:
|
|
1504
|
+
>>> from teradataml.dbutils.dbutils import _create_database
|
|
1505
|
+
# Example 1: Create database.
|
|
1506
|
+
>>> _create_database("db_name1", "10e5")
|
|
1507
|
+
|
|
1508
|
+
# Example 2: Create database in datalake.
|
|
1509
|
+
>>> _create_database("otf_db_1", datalake="datalake_iceberg_glue")
|
|
1510
|
+
|
|
1511
|
+
# Example 3: Create database in datalake having DBPROPERTIES.
|
|
1512
|
+
>>> _create_database("otf_db", datalake="datalake_iceberg_glue",
|
|
1513
|
+
... owner='tdml_user', other_property='some_value',
|
|
1514
|
+
... other_property2=20, comment='Created by tdml_user')
|
|
1515
|
+
"""
|
|
1516
|
+
if datalake:
|
|
1517
|
+
db_properties = []
|
|
1518
|
+
for key, val in kwargs.items():
|
|
1519
|
+
db_properties.append("'{}'='{}'".format(key, val))
|
|
1520
|
+
|
|
1521
|
+
sql = "CREATE DATABASE {}.{}{};".format(datalake, schema_name,
|
|
1522
|
+
' DBPROPERTIES({})'.format(','.join(db_properties))
|
|
1523
|
+
if db_properties else '')
|
|
1524
|
+
|
|
1525
|
+
else:
|
|
1526
|
+
sql = "CREATE DATABASE {} FROM {} AS PERM = {}".format(schema_name, tdmlctx._get_database_username(), size)
|
|
1527
|
+
|
|
1528
|
+
# If user pass spool size, create it with specified space.
|
|
1529
|
+
if spool_size:
|
|
1530
|
+
sql = "{} , SPOOL = {}".format(sql, spool_size)
|
|
1531
|
+
|
|
1532
|
+
execute_sql(sql)
|
|
1533
|
+
return True
|
|
1534
|
+
|
|
1535
|
+
|
|
1536
|
+
def _update_data(update_columns_values, table_name, schema_name, datalake_name=None, update_conditions=None):
|
|
1537
|
+
"""
|
|
1538
|
+
DESCRIPTION:
|
|
1539
|
+
Internal function to update the data in a table.
|
|
1540
|
+
|
|
1541
|
+
PARAMETERS:
|
|
1542
|
+
update_columns_values:
|
|
1543
|
+
Required Argument.
|
|
1544
|
+
Specifies the columns and it's values to update.
|
|
1545
|
+
Types: dict
|
|
1546
|
+
|
|
1547
|
+
table_name:
|
|
1548
|
+
Required Argument.
|
|
1549
|
+
Specifies the name of the table to update.
|
|
1550
|
+
Types: str
|
|
1551
|
+
|
|
1552
|
+
schema_name:
|
|
1553
|
+
Required Argument.
|
|
1554
|
+
Specifies the name of the database to update the data in the
|
|
1555
|
+
table "table_name".
|
|
1556
|
+
Types: str
|
|
1557
|
+
|
|
1558
|
+
datalake_name:
|
|
1559
|
+
Optional Argument.
|
|
1560
|
+
Specifies the name of the datalake to look for "schema_name".
|
|
1561
|
+
Types: str
|
|
1562
|
+
|
|
1563
|
+
update_conditions:
|
|
1564
|
+
Optional Argument.
|
|
1565
|
+
Specifies the key columns and it's values which is used as condition
|
|
1566
|
+
for updating the records.
|
|
1567
|
+
Types: dict
|
|
1568
|
+
|
|
1569
|
+
RETURNS:
|
|
1570
|
+
bool
|
|
1571
|
+
|
|
1572
|
+
RAISES:
|
|
1573
|
+
TeradataMlException.
|
|
1574
|
+
|
|
1575
|
+
EXAMPLES:
|
|
1576
|
+
>>> from teradataml.dbutils.dbutils import _update_data
|
|
1577
|
+
>>> _update_data("db_name1", "tbl", update_conditions={"column1": "value1"})
|
|
1578
|
+
"""
|
|
1579
|
+
# Prepare the update clause.
|
|
1580
|
+
update_clause = ", ".join(("{} = ?".format(col) for col in update_columns_values))
|
|
1581
|
+
update_values = tuple((_value for _value in update_columns_values.values()))
|
|
1582
|
+
|
|
1583
|
+
# If key_columns_values is passed, then prepare the SQL with where clause.
|
|
1584
|
+
# Else, simply update every thing.
|
|
1585
|
+
qualified_table_name = _get_quoted_object_name(schema_name, table_name, datalake_name)
|
|
1586
|
+
|
|
1587
|
+
get_str_ = lambda val: "'{}'".format(val) if isinstance(val, str) else val
|
|
1588
|
+
if update_conditions:
|
|
1589
|
+
|
|
1590
|
+
# Prepare where clause.
|
|
1591
|
+
where_ = []
|
|
1592
|
+
for column, col_value in update_conditions.items():
|
|
1593
|
+
if isinstance(col_value, list):
|
|
1594
|
+
col_value = ", ".join(get_str_(val) for val in col_value)
|
|
1595
|
+
col_value = "({})".format(col_value)
|
|
1596
|
+
where_.append("{} IN {}".format(column, col_value))
|
|
1597
|
+
else:
|
|
1598
|
+
where_.append("{} = {}".format(column, col_value))
|
|
1599
|
+
|
|
1600
|
+
where_clause = " AND ".join(where_)
|
|
1601
|
+
|
|
1602
|
+
sql = f"""UPDATE {qualified_table_name} SET {update_clause}
|
|
1603
|
+
WHERE {where_clause}
|
|
1604
|
+
"""
|
|
1605
|
+
|
|
1606
|
+
execute_sql(sql, (*update_values,))
|
|
1607
|
+
|
|
1608
|
+
else:
|
|
1609
|
+
sql = f"""UPDATE {qualified_table_name} SET {update_clause}"""
|
|
1610
|
+
|
|
1611
|
+
execute_sql(sql, update_values)
|
|
1612
|
+
return True
|
|
1613
|
+
|
|
1614
|
+
|
|
1615
|
+
def _insert_data(table_name, values, columns=None, schema_name=None, datalake_name=None):
|
|
1616
|
+
"""
|
|
1617
|
+
DESCRIPTION:
|
|
1618
|
+
Internal function to insert the data in a table.
|
|
1619
|
+
|
|
1620
|
+
PARAMETERS:
|
|
1621
|
+
table_name:
|
|
1622
|
+
Required Argument.
|
|
1623
|
+
Specifies the name of the table to insert.
|
|
1624
|
+
Types: str
|
|
1625
|
+
|
|
1626
|
+
values:
|
|
1627
|
+
Required Argument.
|
|
1628
|
+
Specifies the values to insert.
|
|
1629
|
+
Types: tuple or list of tuple
|
|
1630
|
+
|
|
1631
|
+
columns:
|
|
1632
|
+
Optional Argument.
|
|
1633
|
+
Specifies the name of columns to be involved in insert.
|
|
1634
|
+
Types: list
|
|
1635
|
+
|
|
1636
|
+
schema_name:
|
|
1637
|
+
Optional Argument.
|
|
1638
|
+
Specifies the name of the database to insert the data in the
|
|
1639
|
+
table "table_name".
|
|
1640
|
+
Types: str
|
|
1641
|
+
|
|
1642
|
+
datalake_name:
|
|
1643
|
+
Optional Argument.
|
|
1644
|
+
Specifies the name of the datalake to look for "schema_name".
|
|
1645
|
+
Types: str
|
|
1646
|
+
|
|
1647
|
+
RETURNS:
|
|
1648
|
+
bool
|
|
1649
|
+
|
|
1650
|
+
RAISES:
|
|
1651
|
+
TeradataMlException.
|
|
1652
|
+
|
|
1653
|
+
EXAMPLES:
|
|
1654
|
+
>>> from teradataml.dbutils.dbutils import _insert_data
|
|
1655
|
+
>>> _insert_data("tbl", (1, 2, 3))
|
|
1656
|
+
"""
|
|
1657
|
+
+    # Prepare the qualified table name.
+    qualified_table_name = _get_quoted_object_name(schema_name, table_name, datalake_name)
+
+    values = UtilFuncs._as_list(values)
+
+    # Prepare columns clause.
+    if columns:
+        # Prepare question marks.
+        _q_marks = ["?"] * len(columns)
+        columns = "({})".format(", ".join(columns))
+    else:
+        columns = ""
+        _q_marks = ["?"] * (len(values[0]))
+
+    sql = "insert into {} {} values ({});".format(qualified_table_name, columns, ", ".join(_q_marks))
+    execute_sql(sql, values)
+
+    return True
+
+
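The insert path builds a positional-placeholder statement and hands the row tuples to execute_sql. A minimal sketch of the statement shape (illustrative names; with a plain DBAPI cursor the rows would typically go through executemany):

    # Illustrative only: shape of the INSERT built by _insert_data above.
    columns = ["id", "name"]
    rows = [(1, "a"), (2, "b")]
    sql = "insert into {} {} values ({});".format(
        "db.tbl", "({})".format(", ".join(columns)), ", ".join(["?"] * len(columns)))
    print(sql)  # insert into db.tbl (id, name) values (?, ?);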
+def _upsert_data(update_columns_values,
+                 insert_columns_values,
+                 upsert_conditions,
+                 table_name,
+                 schema_name,
+                 datalake_name=None):
+    """
+    DESCRIPTION:
+        Internal function to either insert or update the data in a table.
+
+    PARAMETERS:
+        update_columns_values:
+            Required Argument.
+            Specifies the columns and their values to update.
+            Types: dict
+
+        insert_columns_values:
+            Required Argument.
+            Specifies the columns and their values to insert.
+            Types: dict
+
+        upsert_conditions:
+            Required Argument.
+            Specifies the key columns and their values, used as the condition
+            for updating the records.
+            Types: dict
+
+        table_name:
+            Required Argument.
+            Specifies the name of the table to upsert the data into.
+            Types: str
+
+        schema_name:
+            Required Argument.
+            Specifies the name of the database to update the data in the
+            table "table_name".
+            Types: str
+
+        datalake_name:
+            Optional Argument.
+            Specifies the name of the datalake to look for "schema_name".
+            Note:
+                "schema_name" must be provided while using this argument.
+            Types: str
+
+    RETURNS:
+        bool
+
+    RAISES:
+        TeradataMlException.
+
+    EXAMPLES:
+        >>> from teradataml.dbutils.dbutils import _upsert_data
+        >>> _upsert_data(update_columns_values={"column1": "value1"},
+        ...              insert_columns_values={"column1": "value2"},
+        ...              upsert_conditions={"key1": "val1"},
+        ...              table_name="tbl",
+        ...              schema_name="db_name1")
+    """
+    # If user passes datalake name, then append the same to schema name.
+    qualified_table_name = _get_quoted_object_name(schema_name, table_name, datalake_name)
+
+    # Prepare the update clause.
+    update_clause = ", ".join(("{} = ?".format(col) for col in update_columns_values))
+    update_values = tuple((_value for _value in update_columns_values.values()))
+
+    # Prepare the where clause and its values.
+    where_clause = " AND ".join(("{} = ?".format(col) for col in upsert_conditions))
+    where_values = tuple((_value for _value in upsert_conditions.values()))
+
+    # Prepare the insert clause and its values.
+    insert_values_clause = ", ".join(("?" for _ in range(len(insert_columns_values))))
+    insert_clause = "({}) values ({})".format(", ".join(insert_columns_values), insert_values_clause)
+    insert_values = tuple((_value for _value in insert_columns_values.values()))
+
+    sql = f"""UPDATE {qualified_table_name} SET {update_clause}
+              WHERE {where_clause}
+              ELSE INSERT {qualified_table_name} {insert_clause}
+           """
+    execute_sql(sql, (*update_values, *where_values, *insert_values))
+
+    return True
+
+
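Teradata's atomic upsert is a single UPDATE ... ELSE INSERT statement, so the bind parameters must follow placeholder order: SET values, then WHERE values, then INSERT values. A minimal sketch of the statement and parameter tuple (illustrative names; no connection needed):

    # Illustrative only: shape of the atomic upsert built by _upsert_data above.
    update_cols = {"status": "done"}
    keys = {"job_id": 7}
    insert_cols = {"job_id": 7, "status": "done"}
    sql = ("UPDATE db.tbl SET {} WHERE {} "
           "ELSE INSERT db.tbl ({}) values ({})").format(
        ", ".join("{} = ?".format(c) for c in update_cols),
        " AND ".join("{} = ?".format(c) for c in keys),
        ", ".join(insert_cols),
        ", ".join("?" for _ in insert_cols))
    params = (*update_cols.values(), *keys.values(), *insert_cols.values())
    print(sql)     # UPDATE db.tbl SET status = ? WHERE job_id = ? ELSE INSERT db.tbl (job_id, status) values (?, ?)
    print(params)  # ('done', 7, 7, 'done')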
+def _delete_data(table_name, schema_name=None, datalake_name=None, delete_conditions=None):
+    """
+    DESCRIPTION:
+        Internal function to delete the data in a table.
+
+    PARAMETERS:
+        table_name:
+            Required Argument.
+            Specifies the name of the table to delete the data from.
+            Types: str
+
+        schema_name:
+            Optional Argument.
+            Specifies the name of the database to delete the data in the
+            table "table_name".
+            Types: str
+
+        datalake_name:
+            Optional Argument.
+            Specifies the name of the datalake to look for "schema_name".
+            Types: str
+
+        delete_conditions:
+            Optional Argument.
+            Specifies the ColumnExpression or dictionary containing key-value
+            pairs to use for removing the data.
+            Types: ColumnExpression, dict
+
+    RETURNS:
+        int, the number of records that were deleted.
+
+    RAISES:
+        TeradataMlException.
+
+    EXAMPLES:
+        >>> from teradataml.dbutils.dbutils import _delete_data
+        >>> _delete_data("tbl", "db_name1", delete_conditions={"column1": "value1"})
+    """
+    qualified_table_name = _get_quoted_object_name(schema_name, table_name, datalake_name)
+    sqlbundle = SQLBundle()
+
+    sql = sqlbundle._get_sql_query(SQLConstants.SQL_DELETE_ALL_ROWS).format(qualified_table_name)
+
+    # If conditions exist, then prepare the where clause.
+    if delete_conditions:
+        from teradataml.dataframe.sql import _SQLColumnExpression
+        if isinstance(delete_conditions, _SQLColumnExpression):
+            where_clause = delete_conditions.compile()
+        elif isinstance(delete_conditions, dict):
+            get_str_ = lambda val: "'{}'".format(val) if isinstance(val, str) else val
+            where_ = []
+            for column, col_value in delete_conditions.items():
+                if isinstance(col_value, list):
+                    col_value = ", ".join(str(get_str_(val)) for val in col_value)
+                    col_value = "({})".format(col_value)
+                    where_.append("{} IN {}".format(column, col_value))
+                else:
+                    where_.append("{} = {}".format(column, get_str_(col_value)))
+            where_clause = " AND ".join(where_)
+
+        sql = sqlbundle._get_sql_query(SQLConstants.SQL_DELETE_SPECIFIC_ROW).format(qualified_table_name, where_clause)
+
+    res = execute_sql(sql)
+    return res.rowcount
+
+
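Both condition styles accepted by _delete_data end up as a WHERE clause: a dict becomes equality and IN predicates, while a ColumnExpression is compiled to SQL directly. A hedged usage sketch, assuming an established teradataml connection and an existing table:

    # Illustrative only; assumes an established teradataml connection.
    from teradataml.dbutils.dbutils import _delete_data

    # Dict conditions compile to: WHERE status = 'stale' AND job_id IN (1, 2)
    deleted = _delete_data("tbl", "db_name1",
                           delete_conditions={"status": "stale", "job_id": [1, 2]})
    print(deleted)  # number of rows removed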
 @collect_queryband(queryband='LstKwrds')
 def list_td_reserved_keywords(key=None, raise_error=False):
     """
@@ -1079,6 +1887,7 @@ def list_td_reserved_keywords(key=None, raise_error=False):
     """
 
     from teradataml.dataframe.dataframe import DataFrame, in_schema
+
     # Get the reserved keywords from the table
     reserved_keys = DataFrame(in_schema("SYSLIB", "SQLRestrictedWords"))
 
@@ -1096,10 +1905,10 @@ def list_td_reserved_keywords(key=None, raise_error=False):
     # Check if key contains Teradata reserved keyword or not.
     res_key = (k.upper() for k in key if k.upper() in reservered_words)
     res_key = list(res_key)
-    if len(res_key)>0:
+    if len(res_key) > 0:
         if raise_error:
             raise TeradataMlException(Messages.get_message(MessageCodes.RESERVED_KEYWORD, res_key),
-                                      MessageCodes.RESERVED_KEYWORD)
+                                      MessageCodes.RESERVED_KEYWORD)
         return True
     return False
 
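Per the hunks above, the check is a membership test against SYSLIB.SQLRestrictedWords. A hedged usage sketch, assuming a connected Vantage session (behavior for key=None is defined outside these hunks):

    # Illustrative only; assumes create_context(...) has been called.
    from teradataml.dbutils.dbutils import list_td_reserved_keywords

    list_td_reserved_keywords(["account"])                  # True: ACCOUNT is reserved
    list_td_reserved_keywords(["mycol"], raise_error=True)  # False, and no error raised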
@@ -1189,6 +1998,7 @@ def _execute_query_and_generate_pandas_df(query, index=None, **kwargs):
 
     return pandas_df
 
+
 class _TDSessionParams:
     """
     A successful connection through teradataml establishes a session with Vantage.
@@ -1196,6 +2006,7 @@ class _TDSessionParams:
     for parameter 'Session Time Zone'.
     This is an internal utility to store all session related parameters.
     """
+
     def __init__(self, data):
         """
         Constructor to store columns and rows of session params.
@@ -1222,6 +2033,7 @@ class _TDSessionParams:
             return self.__session_params[parameter]
         raise AttributeError("'TDSessionParams' object has no attribute '{}'".format(parameter))
 
+
 def set_session_param(name, value):
     """
     DESCRIPTION:
@@ -1397,15 +2209,16 @@ def set_session_param(name, value):
             [param[0] for param in result.description],
             [value for value in next(result)]
         ))
-        _InternalBuffer.add(session_params
+        _InternalBuffer.add(session_params=_TDSessionParams(data))
         # Store function name of 'DEBUG_FUNCTION' used.
-        _InternalBuffer.add(function_name
+        _InternalBuffer.add(function_name=value[0] if name.upper() == 'DEBUG_FUNCTION' else '')
 
     # Set the session parameter.
     execute_sql(getattr(SessionParamsSQL, name.upper()).format(*value))
 
     return True
 
+
 def unset_session_param(name):
     """
     DESCRIPTION:
@@ -1449,7 +2262,7 @@ def unset_session_param(name):
     # unset_values stores params which are not available in _InternalBuffer; to unset, create a dictionary
     # with the param as key and its unset value as value.
     unset_values = {"CHARACTER_SET_UNICODE": "OFF", "DEBUG_FUNCTION": [_InternalBuffer.get('function_name'), "OFF"],
-                    "ISOLATED_LOADING":"NO", "FUNCTION_TRACE":"SET SESSION FUNCTION TRACE OFF",
+                    "ISOLATED_LOADING": "NO", "FUNCTION_TRACE": "SET SESSION FUNCTION TRACE OFF",
                     "JSON_IGNORE_ERRORS": "OFF", "QUERY_BAND": ["", "SESSION"]}
 
     # If 'name' is in unset_values, unset the params.
@@ -1463,11 +2276,132 @@ def unset_session_param(name):
         return True
 
     previous_value = "{}".format(session_params[getattr(SessionParamsPythonNames, name.upper())]) \
-        if name.upper() != 'TIMEZONE' else "'{}'".format(
-        session_params[getattr(SessionParamsPythonNames, name.upper())])
+        if name.upper() != 'TIMEZONE' else "'{}'".format(
+        session_params[getattr(SessionParamsPythonNames, name.upper())])
+
     if name.upper() == "ACCOUNT":
         previous_value = [previous_value, 'SESSION']
     set_session_param(name, previous_value)
 
     return True
 
+
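The buffered session_params and function_name entries from set_session_param are what unset_session_param reads back when restoring a value. A hedged sketch of the public pair, assuming an established connection and that 'timezone' is among the supported parameter names:

    # Illustrative only; assumes an established teradataml connection.
    from teradataml import set_session_param, unset_session_param

    set_session_param("timezone", "GMT")  # issues SET SESSION TIME ZONE 'GMT'
    unset_session_param("timezone")       # restores the previously buffered zone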
+class _Authorize:
+    """ Parent class to either grant or revoke access on table(s). """
+    _property = None
+
+    def __init__(self, objects):
+        """
+        DESCRIPTION:
+            Constructor for creating an _Authorize object.
+
+        PARAMETERS:
+            objects:
+                Required Argument.
+                Specifies the name(s) of the database objects to be authorized.
+                Types: str OR list of str
+
+        RETURNS:
+            Object of _Authorize.
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            >>> auth = _Authorize('vfs_v1')
+        """
+        # Store the objects here. Then use them wherever required.
+        self._objects = UtilFuncs._as_list(objects)
+        self._access_method = self.__class__.__name__.upper()
+
+    def read(self, user):
+        """
+        DESCRIPTION:
+            Authorize the read access.
+            Note:
+                One must have admin access to give read access to another "user".
+
+        PARAMETERS:
+            user:
+                Required Argument.
+                Specifies the name of the user to have read only access.
+                Types: str
+
+        RETURNS:
+            bool
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            >>> Grant('repo').read('BoB')
+        """
+        for obj in self._objects:
+            sql = "{} SELECT ON {} {} {}".format(self._access_method, obj, self._property, user)
+            execute_sql(sql)
+
+        return True
+
+    def write(self, user):
+        """
+        DESCRIPTION:
+            Authorize the write access.
+            Note:
+                One must have admin access to give write access to another "user".
+
+        PARAMETERS:
+            user:
+                Required Argument.
+                Specifies the name of the user to have write only access.
+                Types: str
+
+        RETURNS:
+            bool
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            >>> Grant('repo').write('BoB')
+        """
+        for access_type in ["INSERT", "UPDATE", "DELETE"]:
+            for obj in self._objects:
+                sql = "{} {} ON {} {} {}".format(self._access_method, access_type, obj, self._property, user)
+                execute_sql(sql)
+
+        return True
+
+    def read_write(self, user):
+        """
+        DESCRIPTION:
+            Authorize the read and write access.
+            Note:
+                One must have admin access to give read and write access to another "user".
+
+        PARAMETERS:
+            user:
+                Required Argument.
+                Specifies the name of the user to have read and write access.
+                Types: str
+
+        RETURNS:
+            bool
+
+        RAISES:
+            None
+
+        EXAMPLES:
+            >>> Grant('repo').read_write('BoB')
+        """
+        self.read(user)
+        return self.write(user)
+
+
+class Grant(_Authorize):
+    """ Class to grant access to tables."""
+    _property = "TO"
+
+
+class Revoke(_Authorize):
+    """ Class to revoke access from tables."""
+    _property = "FROM"