teradataml-20.0.0.4-py3-none-any.whl → teradataml-20.0.0.5-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of teradataml has been flagged as potentially problematic by the registry.

Files changed (107)
  1. teradataml/LICENSE-3RD-PARTY.pdf +0 -0
  2. teradataml/README.md +86 -13
  3. teradataml/__init__.py +2 -1
  4. teradataml/_version.py +2 -2
  5. teradataml/analytics/analytic_function_executor.py +7 -12
  6. teradataml/analytics/json_parser/analytic_functions_argument.py +4 -0
  7. teradataml/analytics/sqle/__init__.py +16 -1
  8. teradataml/analytics/utils.py +15 -1
  9. teradataml/automl/__init__.py +290 -106
  10. teradataml/automl/autodataprep/__init__.py +471 -0
  11. teradataml/automl/data_preparation.py +29 -10
  12. teradataml/automl/data_transformation.py +11 -0
  13. teradataml/automl/feature_engineering.py +64 -4
  14. teradataml/automl/feature_exploration.py +639 -25
  15. teradataml/automl/model_training.py +1 -1
  16. teradataml/clients/auth_client.py +2 -2
  17. teradataml/common/constants.py +61 -26
  18. teradataml/common/messagecodes.py +2 -1
  19. teradataml/common/messages.py +5 -4
  20. teradataml/common/utils.py +255 -37
  21. teradataml/context/context.py +225 -87
  22. teradataml/data/apriori_example.json +22 -0
  23. teradataml/data/docs/sqle/docs_17_20/Apriori.py +138 -0
  24. teradataml/data/docs/sqle/docs_17_20/NERExtractor.py +121 -0
  25. teradataml/data/docs/sqle/docs_17_20/NGramSplitter.py +3 -3
  26. teradataml/data/docs/sqle/docs_17_20/SMOTE.py +212 -0
  27. teradataml/data/docs/sqle/docs_17_20/TextMorph.py +119 -0
  28. teradataml/data/docs/sqle/docs_17_20/TextParser.py +54 -3
  29. teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -1
  30. teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +2 -2
  31. teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +2 -2
  32. teradataml/data/docs/uaf/docs_17_20/DFFT.py +1 -1
  33. teradataml/data/docs/uaf/docs_17_20/DFFT2.py +1 -1
  34. teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +1 -1
  35. teradataml/data/docs/uaf/docs_17_20/DFFTConv.py +1 -1
  36. teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +4 -4
  37. teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +2 -2
  38. teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +2 -2
  39. teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +6 -6
  40. teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
  41. teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +1 -1
  42. teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +4 -4
  43. teradataml/data/docs/uaf/docs_17_20/MultivarRegr.py +1 -1
  44. teradataml/data/docs/uaf/docs_17_20/PACF.py +1 -1
  45. teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
  46. teradataml/data/docs/uaf/docs_17_20/PowerTransform.py +3 -3
  47. teradataml/data/docs/uaf/docs_17_20/Resample.py +5 -5
  48. teradataml/data/docs/uaf/docs_17_20/SAX.py +3 -3
  49. teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
  50. teradataml/data/docs/uaf/docs_17_20/SimpleExp.py +1 -1
  51. teradataml/data/docs/uaf/docs_17_20/Smoothma.py +3 -3
  52. teradataml/data/docs/uaf/docs_17_20/UNDIFF.py +1 -1
  53. teradataml/data/jsons/sqle/17.20/NGramSplitter.json +6 -6
  54. teradataml/data/jsons/sqle/17.20/TD_Apriori.json +181 -0
  55. teradataml/data/jsons/sqle/17.20/TD_NERExtractor.json +145 -0
  56. teradataml/data/jsons/sqle/17.20/TD_SMOTE.json +267 -0
  57. teradataml/data/jsons/sqle/17.20/TD_TextMorph.json +134 -0
  58. teradataml/data/jsons/sqle/17.20/TD_TextParser.json +114 -9
  59. teradataml/data/jsons/sqle/20.00/AI_AnalyzeSentiment.json +328 -0
  60. teradataml/data/jsons/sqle/20.00/AI_AskLLM.json +420 -0
  61. teradataml/data/jsons/sqle/20.00/AI_DetectLanguage.json +343 -0
  62. teradataml/data/jsons/sqle/20.00/AI_ExtractKeyPhrases.json +328 -0
  63. teradataml/data/jsons/sqle/20.00/AI_MaskPII.json +328 -0
  64. teradataml/data/jsons/sqle/20.00/AI_RecognizeEntities.json +328 -0
  65. teradataml/data/jsons/sqle/20.00/AI_RecognizePIIEntities.json +328 -0
  66. teradataml/data/jsons/sqle/20.00/AI_TextClassifier.json +359 -0
  67. teradataml/data/jsons/sqle/20.00/AI_TextEmbeddings.json +360 -0
  68. teradataml/data/jsons/sqle/20.00/AI_TextSummarize.json +343 -0
  69. teradataml/data/jsons/sqle/20.00/AI_TextTranslate.json +343 -0
  70. teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +2 -2
  71. teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +1 -1
  72. teradataml/data/ner_dict.csv +8 -0
  73. teradataml/data/ner_input_eng.csv +7 -0
  74. teradataml/data/ner_rule.csv +5 -0
  75. teradataml/data/pos_input.csv +40 -0
  76. teradataml/data/tdnerextractor_example.json +14 -0
  77. teradataml/data/teradataml_example.json +13 -0
  78. teradataml/data/textmorph_example.json +5 -0
  79. teradataml/data/to_num_data.csv +4 -0
  80. teradataml/data/tochar_data.csv +5 -0
  81. teradataml/data/trans_dense.csv +16 -0
  82. teradataml/data/trans_sparse.csv +55 -0
  83. teradataml/dataframe/copy_to.py +37 -26
  84. teradataml/dataframe/data_transfer.py +61 -45
  85. teradataml/dataframe/dataframe.py +130 -50
  86. teradataml/dataframe/dataframe_utils.py +15 -2
  87. teradataml/dataframe/functions.py +109 -9
  88. teradataml/dataframe/sql.py +328 -76
  89. teradataml/dbutils/dbutils.py +33 -13
  90. teradataml/dbutils/filemgr.py +14 -10
  91. teradataml/lib/aed_0_1.dll +0 -0
  92. teradataml/opensource/_base.py +6 -157
  93. teradataml/options/configure.py +4 -5
  94. teradataml/scriptmgmt/UserEnv.py +305 -38
  95. teradataml/scriptmgmt/lls_utils.py +376 -130
  96. teradataml/store/__init__.py +1 -1
  97. teradataml/table_operators/Apply.py +16 -1
  98. teradataml/table_operators/Script.py +20 -1
  99. teradataml/table_operators/table_operator_util.py +58 -9
  100. teradataml/utils/dtypes.py +2 -1
  101. teradataml/utils/internal_buffer.py +22 -2
  102. teradataml/utils/validators.py +313 -57
  103. {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/METADATA +89 -14
  104. {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/RECORD +107 -77
  105. {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/WHEEL +0 -0
  106. {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/top_level.txt +0 -0
  107. {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/zip-safe +0 -0
teradataml/data/jsons/sqle/20.00/TD_SMOTE.json
@@ -168,10 +168,10 @@
  },
  {
  "isOutputColumn": false,
- "allowNaN": false,
+ "defaultValue": 5,
  "name": "OversamplingFactor",
  "alternateNames": [],
- "isRequired": true,
+ "isRequired": false,
  "rDescription": "specifies the factor for oversampling the minority class.",
  "description": "specifies the factor for oversampling the minority class.",
  "datatype": "DOUBLE",
teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json
@@ -163,7 +163,7 @@
  {
  "defaultValue": 10,
  "lowerBound": 1,
- "upperBound": 100,
+ "upperBound": 1024,
  "lowerBoundType": "INCLUSIVE",
  "upperBoundType": "INCLUSIVE",
  "allowNaN": false,
teradataml/data/ner_dict.csv (new file)
@@ -0,0 +1,8 @@
+ "type_ner","dict"
+ "location","Arkansas"
+ "location","Dublin"
+ "MISC","average maturity"
+ "location","Ohio"
+ "month","June"
+ "Last Name","Gross"
+ "digit regex","[0-9]+"

teradataml/data/ner_input_eng.csv (new file)
@@ -0,0 +1,7 @@
+ "id","txt"
+ 1,"At end of August, the Janus Unconstrained fund held only 45 debt issues with 70 percent of its assets in U.S. government debt."
+ 2,"One Treasury issue due June 2016 alone was worth 43 percent of the fund's total assets."
+ 3,"Most of the bonds have short durations, with the average maturity of just over three years, indicating a generally defensive posture."
+ 4,"For Bill Gross, quitting Pimco's $222 billion Total Return Fund to take over a $13 million fund at Janus Capital is like resigning the U.S. presidency to become city manager of Ashtabula, Ohio, population 18,800."
+ 5,"Gross stunned the investing world on Friday with his abrupt departure from Pimco, the $2 trillion asset manager he co-founded in 1971 and where he had run the Total Return Fund, the world's biggest bond fund, for more than 27 years."
+ 6,"[0-9]+"

teradataml/data/ner_rule.csv (new file)
@@ -0,0 +1,5 @@
+ "type_ner","regex"
+ "email","[\w\-]([\.\w])+[\w]+@([\w\-]+\.)+[a-zA-Z]{2,4}"
+ "Money","\s\$[0-9]+\s"
+ "Digits","\s[0-9]+\s"
+ "Name","[A-Z][a-z]+\s+[A-Z][a-z]+"

teradataml/data/pos_input.csv (new file)
@@ -0,0 +1,40 @@
+ "id","word","pos"
+ 1,"roger","NN"
+ 2,"federer","NN"
+ 3,"born","VBN"
+ 4,"on","IN"
+ 5,"8","CD"
+ 6,"august","NN"
+ 7,"1981","CD"
+ 8,",","O"
+ 9,"is","VBZ"
+ 10,"a","DT"
+ 11,"greatest","JJS"
+ 12,"tennis","NN"
+ 13,"player","NN"
+ 14,",","O"
+ 15,"who","WP"
+ 16,"has","VBZ"
+ 17,"been","VBN"
+ 18,"continuously","RB"
+ 19,"ranked","VBN"
+ 20,"inside","IN"
+ 21,"the","DT"
+ 22,"top","JJ"
+ 23,"10","CD"
+ 24,"since","IN"
+ 25,"october","JJ"
+ 26,"2002","CD"
+ 27,"and","CC"
+ 28,"has","VBZ"
+ 29,"won","VBN"
+ 30,"wimbledon","NN"
+ 31,",","O"
+ 32,"usopen","JJ"
+ 33,",","O"
+ 34,"australian","JJ"
+ 35,"and","CC"
+ 36,"frenchopen","JJ"
+ 37,"titles","NNS"
+ 38,"mutiple","JJ"
+ 39,"times","NNS"

teradataml/data/tdnerextractor_example.json (new file)
@@ -0,0 +1,14 @@
+ {
+ "ner_input_eng": {
+ "id": "integer",
+ "txt": "varchar(500)"
+ },
+ "ner_rule": {
+ "type_ner": "varchar(500)",
+ "regex": "varchar(500)"
+ },
+ "ner_dict": {
+ "type_ner": "varchar(500)",
+ "dict": "varchar(500)"
+ }
+ }
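
The three CSV files and the tdnerextractor_example.json entries above supply the example data for the new NERExtractor function (files 24 and 55 in the list). A hedged sketch of loading and using them is shown below; load_example_data is the standard teradataml loader and the example key follows the JSON file name, but the NERExtractor keyword names are assumptions drawn from the data layout, not the documented interface — see help(NERExtractor).

# Hedged sketch: NERExtractor argument names are assumptions.
>>> from teradataml import DataFrame, NERExtractor, load_example_data
>>> load_example_data("tdnerextractor", ["ner_input_eng", "ner_rule", "ner_dict"])
>>> texts = DataFrame("ner_input_eng")     # id, txt
>>> rules = DataFrame("ner_rule")          # type_ner, regex
>>> dictionary = DataFrame("ner_dict")     # type_ner, dict
>>> out = NERExtractor(data=texts, rules_data=rules, dict_data=dictionary,
...                    text_column="txt", accumulate="id")
>>> out.result
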
teradataml/data/teradataml_example.json
@@ -1356,6 +1356,10 @@
  "format_col": "VARCHAR(50)",
  "timezone_col": "VARCHAR(50)"
  },
+ "to_num_data":{
+ "price": "VARCHAR(20)",
+ "col_format": "VARCHAR(20)"
+ },
  "interval_data":{
  "id": "INTEGER",
  "int_col": "BIGINT",
@@ -1376,5 +1380,14 @@
  "hnsw_alter_data": {
  "id": "INTEGER",
  "array_col": "Vector"
+ },
+ "tochar_data": {
+ "id": "INTEGER",
+ "int_col": "INTEGER",
+ "float_col": "FLOAT",
+ "date_col": "DATE",
+ "int_format": "VARCHAR(20)",
+ "float_format": "VARCHAR(20)",
+ "date_format": "VARCHAR(20)"
  }
  }
teradataml/data/textmorph_example.json
@@ -2,5 +2,10 @@
  "words_input": {
  "id": "integer",
  "word": "varchar(30)"
+ },
+ "pos_input": {
+ "id": "integer",
+ "word": "varchar(100)",
+ "pos_tag": "varchar(100)"
  }
  }
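
pos_input, registered in textmorph_example.json above, pairs words with part-of-speech tags for the new TextMorph function (files 27 and 57). A hedged sketch follows; the TextMorph keyword names are assumptions based on the column layout rather than the documented interface — see help(TextMorph).

# Hedged sketch: TextMorph argument names are assumptions.
>>> from teradataml import DataFrame, TextMorph, load_example_data
>>> load_example_data("textmorph", "pos_input")
>>> pos_df = DataFrame("pos_input")        # id, word, pos_tag
>>> out = TextMorph(data=pos_df, word_column="word", pos_column="pos_tag",
...                 accumulate="id")
>>> out.result
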
teradataml/data/to_num_data.csv (new file)
@@ -0,0 +1,4 @@
+ price,col_format
+ "78.12","99.99"
+ "USD123","C999"
+ "$1234","$9999"

teradataml/data/tochar_data.csv (new file)
@@ -0,0 +1,5 @@
+ id,int_col,float_col,date_col,int_format,float_format,date_format
+ 0,1234,234.56,03/09/17,"9,999","999D9","MM-DD"
+ 1,456,234.56,03/09/17,"$999","9.9EEEE","CCAD"
+ 2,789,123.46,03/09/17,"0999","9999.9","DAY"
+ 3,1314,123.46,03/09/17,"XXXX","TM9","DY"
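
The to_num_data and tochar_data tables above carry value/format column pairs that mirror Teradata's TO_NUMBER and TO_CHAR SQL functions. This diff does not show whether 20.0.0.5 adds dedicated column methods for them, so the sketch below uses the generic DataFrame.assign() route with SQLAlchemy func expressions, which existing teradataml versions already accept; treat it as an assumption-laden illustration only.

# Hedged sketch: exercises TO_NUMBER via assign() + sqlalchemy.func, not any
# new 20.0.0.5-specific column method (none is shown in this hunk).
>>> from sqlalchemy import func
>>> from teradataml import DataFrame, load_example_data
>>> load_example_data("teradataml", "to_num_data")
>>> df = DataFrame("to_num_data")          # price VARCHAR(20), col_format VARCHAR(20)
>>> df.assign(price_num=func.to_number(df.price.expression,
...                                    df.col_format.expression))
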
teradataml/data/trans_dense.csv (new file)
@@ -0,0 +1,16 @@
+ "location","tranid","period","storeid","region","item","sku","category"
+ "MiddleEast",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "MiddleEast",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "AsiaPacific",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","milk,butter,eggs,flour,spinach",1,"dairy"
+ "LatinAmerica",1000,"20100715",1,"west","milk,eggs,flour,spinach",1,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","milk,butter,eggs",1,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","milk,butter,spinach",1,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","butter,eggs,flour",2,"dairy"

teradataml/data/trans_sparse.csv (new file)
@@ -0,0 +1,55 @@
+ "location","tranid","period","storeid","region","item","sku","category"
+ "MiddleEast",999,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",999,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",999,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",999,"19990715",1,"west","flour",4,"baking"
+ "MiddleEast",999,"19990715",1,"west","spinach",4,"produce"
+ "MiddleEast",1000,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1000,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",1000,"19990715",1,"west","flour",4,"baking"
+ "MiddleEast",1000,"19990715",1,"west","spinach",2,"produce"
+ "MiddleEast",1001,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",1001,"20100715",1,"west","eggs",3,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","milk",1,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","butter",2,"dairy"
+ "MiddleEast",1002,"20100715",1,"west","spinach",3,"produce"
+ "MiddleEast",1500,"20100715",3,"west","butter",2,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","eggs",3,"dairy"
+ "MiddleEast",1500,"20100715",3,"west","flour",4,"baking"
+ "AsiaPacific",999,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",999,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",999,"19990715",1,"west","flour",4,"baking"
+ "AsiaPacific",999,"19990715",1,"west","spinach",4,"produce"
+ "AsiaPacific",1000,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1000,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",1000,"19990715",1,"west","flour",4,"baking"
+ "AsiaPacific",1000,"19990715",1,"west","spinach",2,"produce"
+ "AsiaPacific",1001,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",1001,"20100715",1,"west","eggs",3,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","milk",1,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","butter",2,"dairy"
+ "AsiaPacific",1002,"20100715",1,"west","spinach",3,"produce"
+ "AsiaPacific",1500,"20100715",3,"west","butter",2,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","eggs",3,"dairy"
+ "AsiaPacific",1500,"20100715",3,"west","flour",4,"baking"
+ "LatinAmerica",999,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",999,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",999,"19990715",1,"west","flour",4,"baking"
+ "LatinAmerica",999,"19990715",1,"west","spinach",4,"produce"
+ "LatinAmerica",1000,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1000,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",1000,"19990715",1,"west","flour",4,"baking"
+ "LatinAmerica",1000,"19990715",1,"west","spinach",2,"produce"
+ "LatinAmerica",1001,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",1001,"20100715",1,"west","eggs",3,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","milk",1,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","butter",2,"dairy"
+ "LatinAmerica",1002,"20100715",1,"west","spinach",3,"produce"
+ "LatinAmerica",1500,"20100715",3,"west","butter",2,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","eggs",3,"dairy"
+ "LatinAmerica",1500,"20100715",3,"west","flour",4,"baking"
teradataml/dataframe/copy_to.py
@@ -297,10 +297,10 @@ def copy_to_sql(df, table_name,
  >>> from teradatasqlalchemy.types import *

  >>> df = {'emp_name': ['A1', 'A2', 'A3', 'A4'],
- 'emp_sage': [100, 200, 300, 400],
- 'emp_id': [133, 144, 155, 177],
- 'marks': [99.99, 97.32, 94.67, 91.00]
- }
+ ... 'emp_sage': [100, 200, 300, 400],
+ ... 'emp_id': [133, 144, 155, 177],
+ ... 'marks': [99.99, 97.32, 94.67, 91.00]
+ ... }

  >>> pandas_df = pd.DataFrame(df)

@@ -313,24 +313,35 @@ def copy_to_sql(df, table_name,

  c) Save a Pandas DataFrame by specifying additional parameters:
  >>> copy_to_sql(df = pandas_df, table_name = 'my_table_2', schema_name = 'alice',
- index = True, index_label = 'my_index_label', temporary = False,
- primary_index = ['emp_id'], if_exists = 'append',
- types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
- 'emp_id': BIGINT, 'marks': DECIMAL})
+ ... index = True, index_label = 'my_index_label', temporary = False,
+ ... primary_index = ['emp_id'], if_exists = 'append',
+ ... types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
+ ... 'emp_id': BIGINT, 'marks': DECIMAL})

  d) Saving with additional parameters as a SET table
  >>> copy_to_sql(df = pandas_df, table_name = 'my_table_3', schema_name = 'alice',
- index = True, index_label = 'my_index_label', temporary = False,
- primary_index = ['emp_id'], if_exists = 'append',
- types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
- 'emp_id': BIGINT, 'marks': DECIMAL},
- set_table=True)
+ ... index = True, index_label = 'my_index_label', temporary = False,
+ ... primary_index = ['emp_id'], if_exists = 'append',
+ ... types = {'emp_name': VARCHAR, 'emp_sage':INTEGER,
+ ... 'emp_id': BIGINT, 'marks': DECIMAL},
+ ... set_table=True)

  e) Saving levels in index of type MultiIndex
  >>> pandas_df = pandas_df.set_index(['emp_id', 'emp_name'])
  >>> copy_to_sql(df = pandas_df, table_name = 'my_table_4', schema_name = 'alice',
- index = True, index_label = ['index1', 'index2'], temporary = False,
- primary_index = ['index1'], if_exists = 'replace')
+ ... index = True, index_label = ['index1', 'index2'], temporary = False,
+ ... primary_index = ['index1'], if_exists = 'replace')
+
+ f) Save a Pandas DataFrame with VECTOR datatype:
+ >>> import pandas as pd
+ >>> VECTOR_data = {
+ ... 'id': [10, 11, 12, 13],
+ ... 'array_col': ['1,1', '2,2', '3,3', '4,4']
+ ... }
+ >>> df = pd.DataFrame(VECTOR_data)
+
+ >>> from teradatasqlalchemy import VECTOR
+ >>> copy_to_sql(df=df, table_name='my_vector_table', types={'array_col': VECTOR})

  2. Saving a teradataml DataFrame:

@@ -358,13 +369,13 @@ def copy_to_sql(df, table_name,

  d) Save a teradataml DataFrame by using copy_to_sql with additional parameters:
  >>> copy_to_sql(df = df2, table_name = 'my_tdml_table_3', schema_name = 'alice',
- temporary = False, primary_index = None, if_exists = 'append',
- types = {'masters': VARCHAR, 'gpa':INTEGER})
+ ... temporary = False, primary_index = None, if_exists = 'append',
+ ... types = {'masters': VARCHAR, 'gpa':INTEGER})

  e) Saving as a SET table
  >>> copy_to_sql(df = df2, table_name = 'my_tdml_set_table', schema_name = 'alice',
- temporary = False, primary_index = ['gpa'], if_exists = 'append',
- types = {'masters': VARCHAR, 'gpa':INTEGER}, set_table = True)
+ ... temporary = False, primary_index = ['gpa'], if_exists = 'append',
+ ... types = {'masters': VARCHAR, 'gpa':INTEGER}, set_table = True)

  3. Saving a teradataml DataFrame as a PTI table:

@@ -377,19 +388,19 @@ def copy_to_sql(df, table_name,

  a) Using copy_to_sql
  >>> copy_to_sql(df3, "test_copyto_pti",
- timecode_column='clicktime',
- columns_list='event')
+ ... timecode_column='clicktime',
+ ... columns_list='event')

  b) Alternatively, using DataFrame.to_sql
  >>> df3.to_sql(table_name = "test_copyto_pti_1",
- timecode_column='clicktime',
- columns_list='event')
+ ... timecode_column='clicktime',
+ ... columns_list='event')

  c) Saving as a SET table
  >>> copy_to_sql(df3, "test_copyto_pti_2",
- timecode_column='clicktime',
- columns_list='event',
- set_table=True)
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... set_table=True)

  """
  # Deriving global connection using get_connection().
teradataml/dataframe/data_transfer.py
@@ -690,77 +690,77 @@ def read_csv(filepath,
  # while doing so catch all errors and warnings as well as store those in the table.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table1', types=types,
- save_errors=True, catch_errors_warnings=True)
+ ... table_name='my_first_table1', types=types,
+ ... save_errors=True, catch_errors_warnings=True)

  # Example 3: Load the data from CSV file into a table using fastload CSV protocol.
  # If table exists, then replace the same. Catch all errors and warnings as well as
  # store those in the table.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- types=types, if_exists='replace',
- save_errors=True, catch_errors_warnings=True)
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... save_errors=True, catch_errors_warnings=True)

  # Example 4: Load the data from CSV file into a table using fastload CSV protocol.
  # If table exists in specified schema, then append the same. Catch all
  # errors and warnings as well as store those in the table.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- types=types, if_exists='fail',
- save_errors=True, catch_errors_warnings=True)
+ ... table_name='my_first_table',
+ ... types=types, if_exists='fail',
+ ... save_errors=True, catch_errors_warnings=True)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- if_exists='append',
- save_errors=True, catch_errors_warnings=True)
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... save_errors=True, catch_errors_warnings=True)

  # Example 5: Load the data from CSV file into a SET table using fastload CSV protocol.
  # Catch all errors and warnings as well as store those in the table.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- types=types, if_exists='replace',
- set_table=True, primary_index='id',
- save_errors=True, catch_errors_warnings=True)
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... set_table=True, primary_index='id',
+ ... save_errors=True, catch_errors_warnings=True)

  # Example 6: Load the data from CSV file into a temporary table without fastloadCSV protocol.
  # If table exists, then append to the same.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- types=types, if_exists='replace',
- temporary=True)
+ ... table_name='my_first_table',
+ ... types=types, if_exists='replace',
+ ... temporary=True)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- if_exists='append',
- temporary=True)
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... temporary=True)

  # Example 7: Load the data from CSV file with DATE and TIMESTAMP columns into
  # a table without Fastload protocol. If table exists in specified
  # schema, then append to the table.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT,
- admission_date=DATE, admission_time=TIMESTAMP)
+ ... admission_date=DATE, admission_time=TIMESTAMP)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- types=types, if_exists='fail',
- use_fastload=False)
+ ... table_name='my_first_table',
+ ... types=types, if_exists='fail',
+ ... use_fastload=False)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_table',
- if_exists='append',
- use_fastload=False)
+ ... table_name='my_first_table',
+ ... if_exists='append',
+ ... use_fastload=False)

  # Example 8: Load the data from CSV file with TIMESTAMP columns into
  # a PTI table. If specified table exists then append to the table,
  # otherwise creates new table.
  >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
- event=VARCHAR, clicktime=TIMESTAMP)
+ ... event=VARCHAR, clicktime=TIMESTAMP)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_read_csv_pti_table',
- types=types, if_exists='append',
- timecode_column='clicktime',
- columns_list='event',
- use_fastload=False)
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... use_fastload=False)

  # Example 9: Load the data from CSV file with TIMESTAMP columns into
  # a SET PTI table. If specified table exists then append to the table,
@@ -768,11 +768,11 @@ def read_csv(filepath,
  >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
  event=VARCHAR, clicktime=TIMESTAMP)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_read_csv_pti_table',
- types=types, if_exists='append',
- timecode_column='clicktime',
- columns_list='event',
- set_table=True)
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... set_table=True)

  # Example 10: Load the data from CSV file with TIMESTAMP columns into
  # a temporary PTI table. If specified table exists then append to the table,
@@ -780,11 +780,11 @@ def read_csv(filepath,
  >>> types = OrderedDict(partition_id=INTEGER, adid=INTEGER, productid=INTEGER,
  event=VARCHAR, clicktime=TIMESTAMP)
  >>> read_csv(filepath='test_file.csv',
- table_name='my_first_read_csv_pti_table',
- types=types, if_exists='append',
- timecode_column='clicktime',
- columns_list='event',
- temporary=True)
+ ... table_name='my_first_read_csv_pti_table',
+ ... types=types, if_exists='append',
+ ... timecode_column='clicktime',
+ ... columns_list='event',
+ ... temporary=True)

  # Example 11: Load the data from CSV file into Vantage table by opening specified
  # number of Teradata data transfer sesions.
@@ -796,8 +796,24 @@ def read_csv(filepath,
  # through primary_index argument.
  >>> types = OrderedDict(id=BIGINT, fname=VARCHAR, lname=VARCHAR, marks=FLOAT)
  >>> read_csv(filepath='test_file.csv', table_name='my_first_table_with_primary_index',
- types=types, primary_index = ['fname'])
+ ... types=types, primary_index = ['fname'])
+
+ # Example 13: Load the data from CSV file into VECTOR datatype in Vantage table.
+ >>> from teradatasqlalchemy import VECTOR
+ >>> from pathlib import Path
+ >>> types = OrderedDict(id=BIGINT, array_col=VECTOR)
+
+ # Get the absolute path of the teradataml module
+ >>> import teradataml
+ >>> base_path = Path(teradataml.__path__[0])
+
+ # Append the relative path to the CSV file
+ >>> csv_path = os.path.join(base_path, "data", "hnsw_alter_data.csv")

+ >>> read_csv(filepath=csv_path,
+ ... table_name='my_first_table_with_vector',
+ ... types=types,
+ ... use_fastload=False)
  """
  # Deriving global connection using context.get_context()
  con = get_context()
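
Example 13 in the new read_csv docstring above calls os.path.join but only imports Path, so the snippet assumes os is already in scope. A self-contained variant of the same flow is sketched below, with that import added and all other names taken directly from the docstring.

# Self-contained version of docstring Example 13 (only change: explicit `import os`).
>>> import os
>>> from pathlib import Path
>>> from collections import OrderedDict
>>> import teradataml
>>> from teradataml import read_csv
>>> from teradatasqlalchemy import BIGINT, VECTOR
>>> types = OrderedDict(id=BIGINT, array_col=VECTOR)
>>> base_path = Path(teradataml.__path__[0])
>>> csv_path = os.path.join(base_path, "data", "hnsw_alter_data.csv")
>>> read_csv(filepath=csv_path,
...          table_name='my_first_table_with_vector',
...          types=types,
...          use_fastload=False)
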