teradataml 20.0.0.3__py3-none-any.whl → 20.0.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- teradataml/LICENSE-3RD-PARTY.pdf +0 -0
- teradataml/README.md +193 -1
- teradataml/__init__.py +2 -1
- teradataml/_version.py +2 -2
- teradataml/analytics/analytic_function_executor.py +25 -18
- teradataml/analytics/byom/__init__.py +1 -1
- teradataml/analytics/json_parser/analytic_functions_argument.py +4 -0
- teradataml/analytics/sqle/__init__.py +20 -2
- teradataml/analytics/utils.py +15 -1
- teradataml/analytics/valib.py +18 -4
- teradataml/automl/__init__.py +341 -112
- teradataml/automl/autodataprep/__init__.py +471 -0
- teradataml/automl/data_preparation.py +84 -42
- teradataml/automl/data_transformation.py +69 -33
- teradataml/automl/feature_engineering.py +76 -9
- teradataml/automl/feature_exploration.py +639 -25
- teradataml/automl/model_training.py +35 -14
- teradataml/clients/auth_client.py +2 -2
- teradataml/common/__init__.py +1 -2
- teradataml/common/constants.py +122 -63
- teradataml/common/messagecodes.py +14 -3
- teradataml/common/messages.py +8 -4
- teradataml/common/sqlbundle.py +40 -10
- teradataml/common/utils.py +366 -74
- teradataml/common/warnings.py +11 -0
- teradataml/context/context.py +348 -86
- teradataml/data/amazon_reviews_25.csv +26 -0
- teradataml/data/apriori_example.json +22 -0
- teradataml/data/byom_example.json +11 -0
- teradataml/data/docs/byom/docs/DataRobotPredict.py +2 -2
- teradataml/data/docs/byom/docs/DataikuPredict.py +40 -1
- teradataml/data/docs/byom/docs/H2OPredict.py +2 -2
- teradataml/data/docs/byom/docs/ONNXEmbeddings.py +242 -0
- teradataml/data/docs/byom/docs/ONNXPredict.py +2 -2
- teradataml/data/docs/byom/docs/PMMLPredict.py +2 -2
- teradataml/data/docs/sqle/docs_17_20/Apriori.py +138 -0
- teradataml/data/docs/sqle/docs_17_20/NERExtractor.py +121 -0
- teradataml/data/docs/sqle/docs_17_20/NGramSplitter.py +3 -3
- teradataml/data/docs/sqle/docs_17_20/SMOTE.py +212 -0
- teradataml/data/docs/sqle/docs_17_20/Shap.py +28 -6
- teradataml/data/docs/sqle/docs_17_20/TextMorph.py +119 -0
- teradataml/data/docs/sqle/docs_17_20/TextParser.py +54 -3
- teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/DFFT.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFT2.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFTConv.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DWT2D.py +4 -1
- teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +4 -4
- teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +6 -6
- teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +4 -4
- teradataml/data/docs/uaf/docs_17_20/MultivarRegr.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/PACF.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/PowerTransform.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/Resample.py +5 -5
- teradataml/data/docs/uaf/docs_17_20/SAX.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/SimpleExp.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/Smoothma.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/UNDIFF.py +1 -1
- teradataml/data/hnsw_alter_data.csv +5 -0
- teradataml/data/hnsw_data.csv +10 -0
- teradataml/data/jsons/byom/h2opredict.json +1 -1
- teradataml/data/jsons/byom/onnxembeddings.json +266 -0
- teradataml/data/jsons/sqle/17.20/NGramSplitter.json +6 -6
- teradataml/data/jsons/sqle/17.20/TD_Apriori.json +181 -0
- teradataml/data/jsons/sqle/17.20/TD_NERExtractor.json +145 -0
- teradataml/data/jsons/sqle/17.20/TD_SMOTE.json +267 -0
- teradataml/data/jsons/sqle/17.20/TD_Shap.json +0 -1
- teradataml/data/jsons/sqle/17.20/TD_TextMorph.json +134 -0
- teradataml/data/jsons/sqle/17.20/TD_TextParser.json +114 -9
- teradataml/data/jsons/sqle/20.00/AI_AnalyzeSentiment.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_AskLLM.json +420 -0
- teradataml/data/jsons/sqle/20.00/AI_DetectLanguage.json +343 -0
- teradataml/data/jsons/sqle/20.00/AI_ExtractKeyPhrases.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_MaskPII.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizeEntities.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizePIIEntities.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_TextClassifier.json +359 -0
- teradataml/data/jsons/sqle/20.00/AI_TextEmbeddings.json +360 -0
- teradataml/data/jsons/sqle/20.00/AI_TextSummarize.json +343 -0
- teradataml/data/jsons/sqle/20.00/AI_TextTranslate.json +343 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSW.json +296 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWPredict.json +206 -0
- teradataml/data/jsons/sqle/20.00/TD_HNSWSummary.json +32 -0
- teradataml/data/jsons/sqle/20.00/TD_KMeans.json +2 -2
- teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +3 -3
- teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +6 -6
- teradataml/data/ner_dict.csv +8 -0
- teradataml/data/ner_input_eng.csv +7 -0
- teradataml/data/ner_rule.csv +5 -0
- teradataml/data/pos_input.csv +40 -0
- teradataml/data/tdnerextractor_example.json +14 -0
- teradataml/data/teradataml_example.json +21 -0
- teradataml/data/textmorph_example.json +5 -0
- teradataml/data/to_num_data.csv +4 -0
- teradataml/data/tochar_data.csv +5 -0
- teradataml/data/trans_dense.csv +16 -0
- teradataml/data/trans_sparse.csv +55 -0
- teradataml/data/vectordistance_example.json +1 -1
- teradataml/dataframe/copy_to.py +45 -29
- teradataml/dataframe/data_transfer.py +72 -46
- teradataml/dataframe/dataframe.py +642 -166
- teradataml/dataframe/dataframe_utils.py +167 -22
- teradataml/dataframe/functions.py +135 -20
- teradataml/dataframe/setop.py +11 -6
- teradataml/dataframe/sql.py +330 -78
- teradataml/dbutils/dbutils.py +556 -140
- teradataml/dbutils/filemgr.py +14 -10
- teradataml/hyperparameter_tuner/optimizer.py +12 -1
- teradataml/lib/aed_0_1.dll +0 -0
- teradataml/opensource/{sklearn/_sklearn_wrapper.py → _base.py} +168 -1013
- teradataml/opensource/_class.py +141 -17
- teradataml/opensource/{constants.py → _constants.py} +7 -3
- teradataml/opensource/_lightgbm.py +52 -53
- teradataml/opensource/_sklearn.py +1008 -0
- teradataml/opensource/_wrapper_utils.py +5 -5
- teradataml/options/__init__.py +47 -15
- teradataml/options/configure.py +103 -26
- teradataml/options/display.py +13 -2
- teradataml/plot/axis.py +47 -8
- teradataml/plot/figure.py +33 -0
- teradataml/plot/plot.py +63 -13
- teradataml/scriptmgmt/UserEnv.py +307 -40
- teradataml/scriptmgmt/lls_utils.py +428 -145
- teradataml/store/__init__.py +2 -3
- teradataml/store/feature_store/feature_store.py +102 -7
- teradataml/table_operators/Apply.py +48 -19
- teradataml/table_operators/Script.py +23 -2
- teradataml/table_operators/TableOperator.py +3 -1
- teradataml/table_operators/table_operator_util.py +58 -9
- teradataml/utils/dtypes.py +49 -1
- teradataml/utils/internal_buffer.py +38 -0
- teradataml/utils/validators.py +377 -62
- {teradataml-20.0.0.3.dist-info → teradataml-20.0.0.5.dist-info}/METADATA +200 -4
- {teradataml-20.0.0.3.dist-info → teradataml-20.0.0.5.dist-info}/RECORD +146 -112
- teradataml/data/SQL_Fundamentals.pdf +0 -0
- teradataml/libaed_0_1.dylib +0 -0
- teradataml/libaed_0_1.so +0 -0
- teradataml/opensource/sklearn/__init__.py +0 -0
- teradataml/store/vector_store/__init__.py +0 -1586
- {teradataml-20.0.0.3.dist-info → teradataml-20.0.0.5.dist-info}/WHEEL +0 -0
- {teradataml-20.0.0.3.dist-info → teradataml-20.0.0.5.dist-info}/top_level.txt +0 -0
- {teradataml-20.0.0.3.dist-info → teradataml-20.0.0.5.dist-info}/zip-safe +0 -0
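Before reading the per-file changes below, it can help to confirm which of the two builds is actually installed in a given environment. This is a minimal sketch using only the Python standard library; it assumes the wheel has already been installed under the distribution name `teradataml`.

```python
from importlib.metadata import version

# Prints the installed build, e.g. "20.0.0.3" or "20.0.0.5".
print(version("teradataml"))
```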
teradataml/data/pos_input.csv ADDED

@@ -0,0 +1,40 @@
+ "id","word","pos"
+ 1,"roger","NN"
+ 2,"federer","NN"
+ 3,"born","VBN"
+ 4,"on","IN"
+ 5,"8","CD"
+ 6,"august","NN"
+ 7,"1981","CD"
+ 8,",","O"
+ 9,"is","VBZ"
+ 10,"a","DT"
+ 11,"greatest","JJS"
+ 12,"tennis","NN"
+ 13,"player","NN"
+ 14,",","O"
+ 15,"who","WP"
+ 16,"has","VBZ"
+ 17,"been","VBN"
+ 18,"continuously","RB"
+ 19,"ranked","VBN"
+ 20,"inside","IN"
+ 21,"the","DT"
+ 22,"top","JJ"
+ 23,"10","CD"
+ 24,"since","IN"
+ 25,"october","JJ"
+ 26,"2002","CD"
+ 27,"and","CC"
+ 28,"has","VBZ"
+ 29,"won","VBN"
+ 30,"wimbledon","NN"
+ 31,",","O"
+ 32,"usopen","JJ"
+ 33,",","O"
+ 34,"australian","JJ"
+ 35,"and","CC"
+ 36,"frenchopen","JJ"
+ 37,"titles","NNS"
+ 38,"mutiple","JJ"
+ 39,"times","NNS"
teradataml/data/teradataml_example.json CHANGED

@@ -1356,6 +1356,10 @@
 "format_col": "VARCHAR(50)",
 "timezone_col": "VARCHAR(50)"
 },
+ "to_num_data":{
+ "price": "VARCHAR(20)",
+ "col_format": "VARCHAR(20)"
+ },
 "interval_data":{
 "id": "INTEGER",
 "int_col": "BIGINT",

@@ -1368,5 +1372,22 @@
 "id": "INTEGER",
 "urls": "VARCHAR(60)",
 "part": "VARCHAR(20)"
+ },
+ "hnsw_data": {
+ "id": "INTEGER",
+ "array_col": "Vector"
+ },
+ "hnsw_alter_data": {
+ "id": "INTEGER",
+ "array_col": "Vector"
+ },
+ "tochar_data": {
+ "id": "INTEGER",
+ "int_col": "INTEGER",
+ "float_col": "FLOAT",
+ "date_col": "DATE",
+ "int_format": "VARCHAR(20)",
+ "float_format": "VARCHAR(20)",
+ "date_format": "VARCHAR(20)"
 }
 }
teradataml/data/trans_dense.csv ADDED

@@ -0,0 +1,16 @@
+ "location","tranid","period","storeid","region","item","sku","category"
+ "MiddleEast",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "MiddleEast",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "AsiaPacific",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "LatinAmerica",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"
teradataml/data/trans_sparse.csv ADDED

@@ -0,0 +1,55 @@
+ "location","tranid","period","storeid","region","item","sku","category"
+ "MiddleEast",999,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",999,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",999,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",999,"19990715",1,"west","flour",4,"baking"
+ "MiddleEast",999,"19990715",1,"west","spinach",4,"produce"
+ "MiddleEast",1000,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1000,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",1000,"19990715",1,"west","flour",4,"baking"
+ "MiddleEast",1000,"19990715",1,"west","spinach",2,"produce"
+ "MiddleEast",1001,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","spinach",3,"produce"
+ "MiddleEast",1500,"20100715",3,"west","butter",2,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","eggs",3,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","flour",4,"baking"
+ "AsiaPacific",999,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",999,"19990715",1,"west","flour",4,"baking"
+ "AsiaPacific",999,"19990715",1,"west","spinach",4,"produce"
+ "AsiaPacific",1000,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1000,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",1000,"19990715",1,"west","flour",4,"baking"
+ "AsiaPacific",1000,"19990715",1,"west","spinach",2,"produce"
+ "AsiaPacific",1001,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","spinach",3,"produce"
+ "AsiaPacific",1500,"20100715",3,"west","butter",2,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","eggs",3,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","flour",4,"baking"
+ "LatinAmerica",999,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",999,"19990715",1,"west","flour",4,"baking"
+ "LatinAmerica",999,"19990715",1,"west","spinach",4,"produce"
+ "LatinAmerica",1000,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1000,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",1000,"19990715",1,"west","flour",4,"baking"
+ "LatinAmerica",1000,"19990715",1,"west","spinach",2,"produce"
+ "LatinAmerica",1001,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","spinach",3,"produce"
+ "LatinAmerica",1500,"20100715",3,"west","butter",2,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","eggs",3,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","flour",4,"baking"
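The hunks above add new sample-data files under `teradataml/data` and register the corresponding datasets in the bundled example-table definitions. A minimal sketch for previewing one of the new CSVs from an installed 20.0.0.5 wheel is shown here, assuming pandas is available in the environment; the `teradataml.__path__[0]` pattern mirrors the read_csv docstring example later in this diff.

```python
from pathlib import Path

import pandas as pd
import teradataml

# The sample transaction data ships inside the installed package.
csv_path = Path(teradataml.__path__[0]) / "data" / "trans_dense.csv"

# Preview the new market-basket style rows added in 20.0.0.5.
print(pd.read_csv(csv_path).head())
```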
teradataml/dataframe/copy_to.py CHANGED

@@ -297,10 +297,10 @@ def copy_to_sql(df, table_name,
 >>> from teradatasqlalchemy.types import *

 >>> df = {'emp_name': ['A1', 'A2', 'A3', 'A4'],
-
-
-
-
+ ... 'emp_sage': [100, 200, 300, 400],
+ ... 'emp_id': [133, 144, 155, 177],
+ ... 'marks': [99.99, 97.32, 94.67, 91.00]
+ ... }

 >>> pandas_df = pd.DataFrame(df)

@@ -313,24 +313,35 @@ def copy_to_sql(df, table_name,

 c) Save a Pandas DataFrame by specifying additional parameters:
 >>> copy_to_sql(df = pandas_df, table_name = 'my_table_2', schema_name = 'alice',
-
-
-
-
+ ... index = True, index_label = 'my_index_label', temporary = False,
+ ... primary_index = ['emp_id'], if_exists = 'append',
+ ... types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
+ ... 'emp_id': BIGINT, 'marks': DECIMAL})

 d) Saving with additional parameters as a SET table
 >>> copy_to_sql(df = pandas_df, table_name = 'my_table_3', schema_name = 'alice',
-
-
-
-
-
+ ... index = True, index_label = 'my_index_label', temporary = False,
+ ... primary_index = ['emp_id'], if_exists = 'append',
+ ... types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
+ ... 'emp_id': BIGINT, 'marks': DECIMAL},
+ ... set_table=True)

 e) Saving levels in index of type MultiIndex
 >>> pandas_df = pandas_df.set_index(['emp_id', 'emp_name'])
 >>> copy_to_sql(df = pandas_df, table_name = 'my_table_4', schema_name = 'alice',
-
-
+ ... index = True, index_label = ['index1', 'index2'], temporary = False,
+ ... primary_index = ['index1'], if_exists = 'replace')
+
+ f) Save a Pandas DataFrame with VECTOR datatype:
+ >>> import pandas as pd
+ >>> VECTOR_data = {
+ ... 'id': [10, 11, 12, 13],
+ ... 'array_col': ['1,1', '2,2', '3,3', '4,4']
+ ... }
+ >>> df = pd.DataFrame(VECTOR_data)
+
+ >>> from teradatasqlalchemy import VECTOR
+ >>> copy_to_sql(df=df, table_name='my_vector_table', types={'array_col': VECTOR})

 2. Saving a teradataml DataFrame:

@@ -358,13 +369,13 @@ def copy_to_sql(df, table_name,

 d) Save a teradataml DataFrame by using copy_to_sql with additional parameters:
 >>> copy_to_sql(df = df2, table_name = 'my_tdml_table_3', schema_name = 'alice',
-
-
+ ... temporary = False, primary_index = None, if_exists = 'append',
+ ... types = {'masters': VARCHAR, 'gpa':INTEGER})

 e) Saving as a SET table
 >>> copy_to_sql(df = df2, table_name = 'my_tdml_set_table', schema_name = 'alice',
-
-
+ ... temporary = False, primary_index = ['gpa'], if_exists = 'append',
+ ... types = {'masters': VARCHAR, 'gpa':INTEGER}, set_table = True)

 3. Saving a teradataml DataFrame as a PTI table:

@@ -377,19 +388,19 @@ def copy_to_sql(df, table_name,

 a) Using copy_to_sql
 >>> copy_to_sql(df3, "test_copyto_pti",
-
-
+ ... timecode_column='clicktime',
+ ... columns_list='event')

 b) Alternatively, using DataFrame.to_sql
 >>> df3.to_sql(table_name = "test_copyto_pti_1",
-
-
+ ... timecode_column='clicktime',
+ ... columns_list='event')

 c) Saving as a SET table
 >>> copy_to_sql(df3, "test_copyto_pti_2",
-
-
-
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... set_table=True)

 """
 # Deriving global connection using get_connection().

@@ -487,6 +498,11 @@ def copy_to_sql(df, table_name,
 table_type=TeradataConstants.TERADATA_TABLE,
 quote=False)

+ # If configure.temp_object_type="VT", _generate_temp_table_name() retruns the
+ # table name in fully qualified format. Because of this , test cases started
+ # failing with Blank name in quotation mark. Hence, extracted only the table name.
+ table_name = UtilFuncs._extract_table_name(table_name)
+
 # Let's create the SQLAlchemy table object to recreate the table
 if not table_exists or if_exists.lower() == 'replace':
 if not is_pti:

@@ -1459,9 +1475,9 @@ def _extract_column_info(df, types = None, index = False, index_label = None):
 # If the datatype is not specified then check if the datatype is datetime64 and timezone is present then map it to
 # TIMESTAMP(timezone=True) else map it according to default value.
 col_types = [types.get(col_name) if types and col_name in types else
- TIMESTAMP(timezone=True) if pt.is_datetime64_ns_dtype(df.dtypes[key])
+ TIMESTAMP(timezone=True) if pt.is_datetime64_ns_dtype(df.dtypes.iloc[key])
 and (df[col_name].dt.tz is not None)
- else _get_sqlalchemy_mapping_types(str(df.dtypes[key]))
+ else _get_sqlalchemy_mapping_types(str(df.dtypes.iloc[key]))
 for key, col_name in enumerate(list(df.columns))]

 ind_names = []

@@ -1469,7 +1485,7 @@ def _extract_column_info(df, types = None, index = False, index_label = None):
 if index:
 ind_names, ind_types = _get_index_labels(df, index_label)
 ind_types = [types.get(ind_name) if types and ind_name in types
- else TIMESTAMP(timezone=True) if pt.is_datetime64_ns_dtype(df.dtypes[key])
+ else TIMESTAMP(timezone=True) if pt.is_datetime64_ns_dtype(df.dtypes.iloc[key])
 and (df[ind_name].dt.tz is not None)
 else _get_sqlalchemy_mapping_types(str(ind_types[key]))
 for key, ind_name in enumerate(ind_names)]
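The two `_extract_column_info` hunks above replace `df.dtypes[key]` with `df.dtypes.iloc[key]`. `df.dtypes` is a Series indexed by column labels, and recent pandas releases deprecate treating an integer key on a label-indexed Series as a position, so positional access has to go through `.iloc`. The sketch below only illustrates that pandas behaviour; it is not teradataml code.

```python
import pandas as pd

df = pd.DataFrame({"emp_name": ["A1"], "marks": [99.99]})

# df.dtypes is indexed by column names, not positions.
print(df.dtypes.iloc[0])    # positional lookup: dtype of the first column
print(df.dtypes["marks"])   # label lookup: dtype of the 'marks' column

# df.dtypes[0] relied on the old positional fallback, which warns or fails
# on newer pandas; switching to .iloc avoids that.
```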
teradataml/dataframe/data_transfer.py CHANGED

@@ -328,6 +328,7 @@ def fastexport(df, export_to="pandas", index_column=None,
 # using fastexport datatransfer protocol.
 # "require" is always True, because with this function user requires
 # fastexport.
+
 return dt_obj._fastexport_get_pandas_df(require=True, **kwargs)

 # Convert teradataml DataFrame to CSV file.

@@ -689,77 +690,77 @@ def read_csv(filepath,
 # while doing so catch all errors and warnings as well as store those in the table.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv',
-
-
+ ... table_name='my_first_table1', types=types,
+ ... save_errors=True, catch_errors_warnings=True)

 # Example 3: Load the data from CSV file into a table using fastload CSV protocol.
 # If table exists, then replace the same. Catch all errors and warnings as well as
 # store those in the table.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... save_errors=True, catch_errors_warnings=True)

 # Example 4: Load the data from CSV file into a table using fastload CSV protocol.
 # If table exists in specified schema, then append the same. Catch all
 # errors and warnings as well as store those in the table.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... types=types, if_exists='fail',
+ ... save_errors=True, catch_errors_warnings=True)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... save_errors=True, catch_errors_warnings=True)

 # Example 5: Load the data from CSV file into a SET table using fastload CSV protocol.
 # Catch all errors and warnings as well as store those in the table.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv',
-
-
-
-
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... set_table=True, primary_index='id',
+ ... save_errors=True, catch_errors_warnings=True)

 # Example 6: Load the data from CSV file into a temporary table without fastloadCSV protocol.
 # If table exists, then append to the same.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... temporary=True)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... temporary=True)

 # Example 7: Load the data from CSV file with DATE and TIMESTAMP columns into
 # a table without Fastload protocol. If table exists in specified
 # schema, then append to the table.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT,
- admission_date=DATE, admission_time=TIMESTAMP)
+ ... admission_date=DATE, admission_time=TIMESTAMP)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... types=types, if_exists='fail',
+ ... use_fastload=False)
 >>> read_csv(filepath='test_file.csv',
-
-
-
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... use_fastload=False)

 # Example 8: Load the data from CSV file with TIMESTAMP columns into
 # a PTI table. If specified table exists then append to the table,
 # otherwise creates new table.
 >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
-
+ ... event=VARCHAR, clicktime=TIMESTAMP)
 >>> read_csv(filepath='test_file.csv',
-
-
-
-
-
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... use_fastload=False)

 # Example 9: Load the data from CSV file with TIMESTAMP columns into
 # a SET PTI table. If specified table exists then append to the table,

@@ -767,11 +768,11 @@ def read_csv(filepath,
 >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
 event=VARCHAR, clicktime=TIMESTAMP)
 >>> read_csv(filepath='test_file.csv',
-
-
-
-
-
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... set_table=True)

 # Example 10: Load the data from CSV file with TIMESTAMP columns into
 # a temporary PTI table. If specified table exists then append to the table,

@@ -779,11 +780,11 @@ def read_csv(filepath,
 >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
 event=VARCHAR, clicktime=TIMESTAMP)
 >>> read_csv(filepath='test_file.csv',
-
-
-
-
-
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... temporary=True)

 # Example 11: Load the data from CSV file into Vantage table by opening specified
 # number of Teradata data transfer sesions.

@@ -795,8 +796,24 @@ def read_csv(filepath,
 # through primary_index argument.
 >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
 >>> read_csv(filepath='test_file.csv', table_name='my_first_table_with_primary_index',
-
+ ... types=types, primary_index = ['fname'])
+
+ # Example 13: Load the data from CSV file into VECTOR datatype in Vantage table.
+ >>> from teradatasqlalchemy import VECTOR
+ >>> from pathlib import Path
+ >>> types = OrderedDict(id=BIGINT, array_col=VECTOR)
+
+ # Get the absolute path of the teradataml module
+ >>> import teradataml
+ >>> base_path = Path(teradataml.__path__[0])

+ # Append the relative path to the CSV file
+ >>> csv_path = os.path.join(base_path, "data", "hnsw_alter_data.csv")
+
+ >>> read_csv(filepath=csv_path,
+ ... table_name='my_first_table_with_vector',
+ ... types=types,
+ ... use_fastload=False)
 """
 # Deriving global connection using context.get_context()
 con = get_context()

@@ -2553,7 +2570,6 @@ class _DataTransferUtils():
 _create_staging_table_and_load_csv_data(column_info={"id": INTEGER}, primary_index = ['id'])

 """
- stag_table_name = ""
 stage_table_created = False
 try:
 # Generate the temporary table.

@@ -2562,6 +2578,11 @@ class _DataTransferUtils():
 quote=False,
 table_type=TeradataConstants.TERADATA_TABLE)

+ # If configure.temp_object_type="VT", _generate_temp_table_name() retruns the
+ # table name in fully qualified format. Because of this , test cases started
+ # failing with Blank name in quotation mark. Hence, extracted only the table name.
+ stag_table_name = UtilFuncs._extract_table_name(stag_table_name)
+
 # Information about uniqueness of primary index and
 # SET/MULTISET property of existing table is not available,
 # so over-assuming to be False.

@@ -2707,6 +2728,11 @@ class _DataTransferUtils():
 quote=False,
 table_type=TeradataConstants.TERADATA_TABLE)

+ # If configure.temp_object_type="VT", _generate_temp_table_name() retruns the
+ # table name in fully qualified format. Because of this , test cases started
+ # failing with Blank name in quotation mark. Hence, extracted only the table name.
+ stag_table_name = UtilFuncs._extract_table_name(stag_table_name)
+
 # Get the teradataml dataframe from staging table using read_csv()
 read_csv_output = read_csv(filepath=self.df, table_name=stag_table_name,
 types=self.types, sep=self.sep,