teradataml 20.0.0.1__py3-none-any.whl → 20.0.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of teradataml might be problematic. Click here for more details.

Files changed (240) hide show
  1. teradataml/LICENSE-3RD-PARTY.pdf +0 -0
  2. teradataml/LICENSE.pdf +0 -0
  3. teradataml/README.md +306 -0
  4. teradataml/__init__.py +10 -3
  5. teradataml/_version.py +1 -1
  6. teradataml/analytics/__init__.py +3 -2
  7. teradataml/analytics/analytic_function_executor.py +299 -16
  8. teradataml/analytics/analytic_query_generator.py +92 -0
  9. teradataml/analytics/byom/__init__.py +3 -2
  10. teradataml/analytics/json_parser/metadata.py +13 -3
  11. teradataml/analytics/json_parser/utils.py +13 -6
  12. teradataml/analytics/meta_class.py +40 -1
  13. teradataml/analytics/sqle/DecisionTreePredict.py +1 -1
  14. teradataml/analytics/sqle/__init__.py +11 -2
  15. teradataml/analytics/table_operator/__init__.py +4 -3
  16. teradataml/analytics/uaf/__init__.py +21 -2
  17. teradataml/analytics/utils.py +66 -1
  18. teradataml/analytics/valib.py +1 -1
  19. teradataml/automl/__init__.py +1502 -323
  20. teradataml/automl/custom_json_utils.py +139 -61
  21. teradataml/automl/data_preparation.py +247 -307
  22. teradataml/automl/data_transformation.py +32 -12
  23. teradataml/automl/feature_engineering.py +325 -86
  24. teradataml/automl/model_evaluation.py +44 -35
  25. teradataml/automl/model_training.py +122 -153
  26. teradataml/catalog/byom.py +8 -8
  27. teradataml/clients/pkce_client.py +1 -1
  28. teradataml/common/__init__.py +2 -1
  29. teradataml/common/constants.py +72 -0
  30. teradataml/common/deprecations.py +13 -7
  31. teradataml/common/garbagecollector.py +152 -120
  32. teradataml/common/messagecodes.py +11 -2
  33. teradataml/common/messages.py +4 -1
  34. teradataml/common/sqlbundle.py +26 -4
  35. teradataml/common/utils.py +225 -14
  36. teradataml/common/wrapper_utils.py +1 -1
  37. teradataml/context/context.py +82 -2
  38. teradataml/data/SQL_Fundamentals.pdf +0 -0
  39. teradataml/data/complaints_test_tokenized.csv +353 -0
  40. teradataml/data/complaints_tokens_model.csv +348 -0
  41. teradataml/data/covid_confirm_sd.csv +83 -0
  42. teradataml/data/dataframe_example.json +27 -1
  43. teradataml/data/docs/sqle/docs_17_20/CFilter.py +132 -0
  44. teradataml/data/docs/sqle/docs_17_20/NaiveBayes.py +162 -0
  45. teradataml/data/docs/sqle/docs_17_20/OutlierFilterFit.py +2 -0
  46. teradataml/data/docs/sqle/docs_17_20/Pivoting.py +279 -0
  47. teradataml/data/docs/sqle/docs_17_20/Shap.py +203 -0
  48. teradataml/data/docs/sqle/docs_17_20/TDNaiveBayesPredict.py +189 -0
  49. teradataml/data/docs/sqle/docs_17_20/TFIDF.py +142 -0
  50. teradataml/data/docs/sqle/docs_17_20/TextParser.py +3 -3
  51. teradataml/data/docs/sqle/docs_17_20/Unpivoting.py +216 -0
  52. teradataml/data/docs/tableoperator/docs_17_20/Image2Matrix.py +118 -0
  53. teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -10
  54. teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +1 -1
  55. teradataml/data/docs/uaf/docs_17_20/ArimaForecast.py +35 -5
  56. teradataml/data/docs/uaf/docs_17_20/ArimaValidate.py +3 -1
  57. teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +293 -0
  58. teradataml/data/docs/uaf/docs_17_20/AutoArima.py +354 -0
  59. teradataml/data/docs/uaf/docs_17_20/BreuschGodfrey.py +3 -2
  60. teradataml/data/docs/uaf/docs_17_20/BreuschPaganGodfrey.py +1 -1
  61. teradataml/data/docs/uaf/docs_17_20/Convolve.py +13 -10
  62. teradataml/data/docs/uaf/docs_17_20/Convolve2.py +4 -1
  63. teradataml/data/docs/uaf/docs_17_20/CopyArt.py +145 -0
  64. teradataml/data/docs/uaf/docs_17_20/CumulPeriodogram.py +5 -4
  65. teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +4 -4
  66. teradataml/data/docs/uaf/docs_17_20/DWT.py +235 -0
  67. teradataml/data/docs/uaf/docs_17_20/DWT2D.py +214 -0
  68. teradataml/data/docs/uaf/docs_17_20/DickeyFuller.py +18 -21
  69. teradataml/data/docs/uaf/docs_17_20/DurbinWatson.py +1 -1
  70. teradataml/data/docs/uaf/docs_17_20/ExtractResults.py +1 -1
  71. teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +160 -0
  72. teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +1 -1
  73. teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +9 -31
  74. teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +4 -2
  75. teradataml/data/docs/uaf/docs_17_20/IDFFT2.py +1 -8
  76. teradataml/data/docs/uaf/docs_17_20/IDWT.py +236 -0
  77. teradataml/data/docs/uaf/docs_17_20/IDWT2D.py +226 -0
  78. teradataml/data/docs/uaf/docs_17_20/IQR.py +134 -0
  79. teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
  80. teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +2 -2
  81. teradataml/data/docs/uaf/docs_17_20/MAMean.py +3 -3
  82. teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +297 -0
  83. teradataml/data/docs/uaf/docs_17_20/MatrixMultiply.py +15 -6
  84. teradataml/data/docs/uaf/docs_17_20/PACF.py +0 -1
  85. teradataml/data/docs/uaf/docs_17_20/Portman.py +2 -2
  86. teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
  87. teradataml/data/docs/uaf/docs_17_20/Resample.py +9 -1
  88. teradataml/data/docs/uaf/docs_17_20/SAX.py +246 -0
  89. teradataml/data/docs/uaf/docs_17_20/SeasonalNormalize.py +17 -10
  90. teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
  91. teradataml/data/docs/uaf/docs_17_20/WhitesGeneral.py +3 -1
  92. teradataml/data/docs/uaf/docs_17_20/WindowDFFT.py +368 -0
  93. teradataml/data/dwt2d_dataTable.csv +65 -0
  94. teradataml/data/dwt_dataTable.csv +8 -0
  95. teradataml/data/dwt_filterTable.csv +3 -0
  96. teradataml/data/finance_data4.csv +13 -0
  97. teradataml/data/grocery_transaction.csv +19 -0
  98. teradataml/data/idwt2d_dataTable.csv +5 -0
  99. teradataml/data/idwt_dataTable.csv +8 -0
  100. teradataml/data/idwt_filterTable.csv +3 -0
  101. teradataml/data/interval_data.csv +5 -0
  102. teradataml/data/jsons/paired_functions.json +14 -0
  103. teradataml/data/jsons/sqle/17.20/TD_CFilter.json +118 -0
  104. teradataml/data/jsons/sqle/17.20/TD_NaiveBayes.json +193 -0
  105. teradataml/data/jsons/sqle/17.20/TD_NaiveBayesPredict.json +212 -0
  106. teradataml/data/jsons/sqle/17.20/TD_OneClassSVM.json +9 -9
  107. teradataml/data/jsons/sqle/17.20/TD_Pivoting.json +280 -0
  108. teradataml/data/jsons/sqle/17.20/TD_Shap.json +222 -0
  109. teradataml/data/jsons/sqle/17.20/TD_TFIDF.json +162 -0
  110. teradataml/data/jsons/sqle/17.20/TD_TextParser.json +1 -1
  111. teradataml/data/jsons/sqle/17.20/TD_Unpivoting.json +235 -0
  112. teradataml/data/jsons/sqle/20.00/TD_KMeans.json +250 -0
  113. teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +266 -0
  114. teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +278 -0
  115. teradataml/data/jsons/storedprocedure/17.20/TD_COPYART.json +71 -0
  116. teradataml/data/jsons/storedprocedure/17.20/TD_FILTERFACTORY1D.json +150 -0
  117. teradataml/data/jsons/tableoperator/17.20/IMAGE2MATRIX.json +53 -0
  118. teradataml/data/jsons/uaf/17.20/TD_ACF.json +1 -18
  119. teradataml/data/jsons/uaf/17.20/TD_ARIMAESTIMATE.json +3 -16
  120. teradataml/data/jsons/uaf/17.20/TD_ARIMAFORECAST.json +0 -3
  121. teradataml/data/jsons/uaf/17.20/TD_ARIMAVALIDATE.json +5 -3
  122. teradataml/data/jsons/uaf/17.20/TD_ARIMAXESTIMATE.json +362 -0
  123. teradataml/data/jsons/uaf/17.20/TD_AUTOARIMA.json +469 -0
  124. teradataml/data/jsons/uaf/17.20/TD_BINARYMATRIXOP.json +0 -3
  125. teradataml/data/jsons/uaf/17.20/TD_BINARYSERIESOP.json +0 -2
  126. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_GODFREY.json +2 -1
  127. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_PAGAN_GODFREY.json +2 -5
  128. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE.json +3 -6
  129. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE2.json +1 -3
  130. teradataml/data/jsons/uaf/17.20/TD_CUMUL_PERIODOGRAM.json +0 -5
  131. teradataml/data/jsons/uaf/17.20/TD_DFFT.json +1 -4
  132. teradataml/data/jsons/uaf/17.20/TD_DFFT2.json +2 -7
  133. teradataml/data/jsons/uaf/17.20/TD_DFFT2CONV.json +1 -2
  134. teradataml/data/jsons/uaf/17.20/TD_DFFTCONV.json +0 -2
  135. teradataml/data/jsons/uaf/17.20/TD_DICKEY_FULLER.json +10 -19
  136. teradataml/data/jsons/uaf/17.20/TD_DTW.json +3 -6
  137. teradataml/data/jsons/uaf/17.20/TD_DWT.json +173 -0
  138. teradataml/data/jsons/uaf/17.20/TD_DWT2D.json +160 -0
  139. teradataml/data/jsons/uaf/17.20/TD_FITMETRICS.json +1 -1
  140. teradataml/data/jsons/uaf/17.20/TD_GOLDFELD_QUANDT.json +16 -30
  141. teradataml/data/jsons/uaf/17.20/{TD_HOLT_WINTERS_FORECAST.json → TD_HOLT_WINTERS_FORECASTER.json} +1 -2
  142. teradataml/data/jsons/uaf/17.20/TD_IDFFT2.json +1 -15
  143. teradataml/data/jsons/uaf/17.20/TD_IDWT.json +162 -0
  144. teradataml/data/jsons/uaf/17.20/TD_IDWT2D.json +149 -0
  145. teradataml/data/jsons/uaf/17.20/TD_IQR.json +117 -0
  146. teradataml/data/jsons/uaf/17.20/TD_LINEAR_REGR.json +1 -1
  147. teradataml/data/jsons/uaf/17.20/TD_LINESPEC.json +1 -1
  148. teradataml/data/jsons/uaf/17.20/TD_MAMEAN.json +1 -3
  149. teradataml/data/jsons/uaf/17.20/TD_MATRIX2IMAGE.json +209 -0
  150. teradataml/data/jsons/uaf/17.20/TD_PACF.json +2 -2
  151. teradataml/data/jsons/uaf/17.20/TD_POWERSPEC.json +5 -5
  152. teradataml/data/jsons/uaf/17.20/TD_RESAMPLE.json +48 -28
  153. teradataml/data/jsons/uaf/17.20/TD_SAX.json +210 -0
  154. teradataml/data/jsons/uaf/17.20/TD_SEASONALNORMALIZE.json +12 -6
  155. teradataml/data/jsons/uaf/17.20/TD_SIMPLEEXP.json +0 -1
  156. teradataml/data/jsons/uaf/17.20/TD_TRACKINGOP.json +8 -8
  157. teradataml/data/jsons/uaf/17.20/TD_UNDIFF.json +1 -1
  158. teradataml/data/jsons/uaf/17.20/TD_UNNORMALIZE.json +1 -1
  159. teradataml/data/jsons/uaf/17.20/TD_WINDOWDFFT.json +410 -0
  160. teradataml/data/load_example_data.py +8 -2
  161. teradataml/data/medical_readings.csv +101 -0
  162. teradataml/data/naivebayestextclassifier_example.json +1 -1
  163. teradataml/data/naivebayestextclassifierpredict_example.json +11 -0
  164. teradataml/data/patient_profile.csv +101 -0
  165. teradataml/data/peppers.png +0 -0
  166. teradataml/data/real_values.csv +14 -0
  167. teradataml/data/sax_example.json +8 -0
  168. teradataml/data/scripts/deploy_script.py +1 -1
  169. teradataml/data/scripts/lightgbm/dataset.template +157 -0
  170. teradataml/data/scripts/lightgbm/lightgbm_class_functions.template +247 -0
  171. teradataml/data/scripts/lightgbm/lightgbm_function.template +216 -0
  172. teradataml/data/scripts/lightgbm/lightgbm_sklearn.template +159 -0
  173. teradataml/data/scripts/sklearn/sklearn_fit.py +194 -160
  174. teradataml/data/scripts/sklearn/sklearn_fit_predict.py +136 -115
  175. teradataml/data/scripts/sklearn/sklearn_function.template +34 -16
  176. teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +155 -137
  177. teradataml/data/scripts/sklearn/sklearn_neighbors.py +1 -1
  178. teradataml/data/scripts/sklearn/sklearn_score.py +12 -3
  179. teradataml/data/scripts/sklearn/sklearn_transform.py +162 -24
  180. teradataml/data/star_pivot.csv +8 -0
  181. teradataml/data/target_udt_data.csv +8 -0
  182. teradataml/data/templates/open_source_ml.json +3 -1
  183. teradataml/data/teradataml_example.json +20 -1
  184. teradataml/data/timestamp_data.csv +4 -0
  185. teradataml/data/titanic_dataset_unpivoted.csv +19 -0
  186. teradataml/data/uaf_example.json +55 -1
  187. teradataml/data/unpivot_example.json +15 -0
  188. teradataml/data/url_data.csv +9 -0
  189. teradataml/data/vectordistance_example.json +4 -0
  190. teradataml/data/windowdfft.csv +16 -0
  191. teradataml/dataframe/copy_to.py +1 -1
  192. teradataml/dataframe/data_transfer.py +5 -3
  193. teradataml/dataframe/dataframe.py +1002 -201
  194. teradataml/dataframe/fastload.py +3 -3
  195. teradataml/dataframe/functions.py +867 -0
  196. teradataml/dataframe/row.py +160 -0
  197. teradataml/dataframe/setop.py +2 -2
  198. teradataml/dataframe/sql.py +840 -33
  199. teradataml/dataframe/window.py +1 -1
  200. teradataml/dbutils/dbutils.py +878 -34
  201. teradataml/dbutils/filemgr.py +48 -1
  202. teradataml/geospatial/geodataframe.py +1 -1
  203. teradataml/geospatial/geodataframecolumn.py +1 -1
  204. teradataml/hyperparameter_tuner/optimizer.py +13 -13
  205. teradataml/lib/aed_0_1.dll +0 -0
  206. teradataml/opensource/__init__.py +1 -1
  207. teradataml/opensource/{sklearn/_class.py → _class.py} +102 -17
  208. teradataml/opensource/_lightgbm.py +950 -0
  209. teradataml/opensource/{sklearn/_wrapper_utils.py → _wrapper_utils.py} +1 -2
  210. teradataml/opensource/{sklearn/constants.py → constants.py} +13 -10
  211. teradataml/opensource/sklearn/__init__.py +0 -1
  212. teradataml/opensource/sklearn/_sklearn_wrapper.py +1019 -574
  213. teradataml/options/__init__.py +9 -23
  214. teradataml/options/configure.py +42 -4
  215. teradataml/options/display.py +2 -2
  216. teradataml/plot/axis.py +4 -4
  217. teradataml/scriptmgmt/UserEnv.py +13 -9
  218. teradataml/scriptmgmt/lls_utils.py +77 -23
  219. teradataml/store/__init__.py +13 -0
  220. teradataml/store/feature_store/__init__.py +0 -0
  221. teradataml/store/feature_store/constants.py +291 -0
  222. teradataml/store/feature_store/feature_store.py +2223 -0
  223. teradataml/store/feature_store/models.py +1505 -0
  224. teradataml/store/vector_store/__init__.py +1586 -0
  225. teradataml/table_operators/Script.py +2 -2
  226. teradataml/table_operators/TableOperator.py +106 -20
  227. teradataml/table_operators/query_generator.py +3 -0
  228. teradataml/table_operators/table_operator_query_generator.py +3 -1
  229. teradataml/table_operators/table_operator_util.py +102 -56
  230. teradataml/table_operators/templates/dataframe_register.template +69 -0
  231. teradataml/table_operators/templates/dataframe_udf.template +63 -0
  232. teradataml/telemetry_utils/__init__.py +0 -0
  233. teradataml/telemetry_utils/queryband.py +52 -0
  234. teradataml/utils/dtypes.py +4 -2
  235. teradataml/utils/validators.py +34 -2
  236. {teradataml-20.0.0.1.dist-info → teradataml-20.0.0.3.dist-info}/METADATA +311 -3
  237. {teradataml-20.0.0.1.dist-info → teradataml-20.0.0.3.dist-info}/RECORD +240 -157
  238. {teradataml-20.0.0.1.dist-info → teradataml-20.0.0.3.dist-info}/WHEEL +0 -0
  239. {teradataml-20.0.0.1.dist-info → teradataml-20.0.0.3.dist-info}/top_level.txt +0 -0
  240. {teradataml-20.0.0.1.dist-info → teradataml-20.0.0.3.dist-info}/zip-safe +0 -0
@@ -0,0 +1,266 @@
1
+ {
2
+ "json_schema_major_version": "1",
3
+ "json_schema_minor_version": "2",
4
+ "json_content_version": "1",
5
+ "function_name": "TD_SMOTE",
6
+ "function_version": "1.0",
7
+ "function_type": "fastpath",
8
+ "function_category": "Feature Engineering Transform Functions",
9
+ "function_alias_name": "TD_SMOTE",
10
+ "function_r_name": "aa.td_smote",
11
+ "ref_function_r_name": "aa.td_smote",
12
+ "short_description": "This function generates data by oversampling a minority class.",
13
+ "long_description": "This function generates data by oversampling a minority class using smote, adasyn, borderline-2 or smote-nc algorithms.",
14
+ "input_tables": [
15
+ {
16
+ "requiredInputKind": [
17
+ "PartitionByAny"
18
+ ],
19
+ "isOrdered": false,
20
+ "partitionByOne": false,
21
+ "name": "InputTable",
22
+ "alternateNames": [],
23
+ "isRequired": true,
24
+ "rDescription": "Specifies the table containing the input data.",
25
+ "description": "Specifies the table containing the input data.",
26
+ "datatype": "TABLE_ALIAS",
27
+ "allowsLists": false,
28
+ "rName": "data",
29
+ "useInR": true,
30
+ "rOrderNum": 1
31
+ },
32
+ {
33
+ "requiredInputKind": [
34
+ "Dimension"
35
+ ],
36
+
37
+ "isOrdered": false,
38
+ "partitionByOne": false,
39
+ "name": "EncodingsTable",
40
+ "alternateNames": [],
41
+ "isRequired": false,
42
+ "rDescription": "Specifies the table created with TD_OrdinalEncodingFit output, using the categorical input columns as TargetColumns. Used and required only with smotenc.",
43
+ "description": "Specifies the table created with TD_OrdinalEncodingFit output, using the categorical input columns as TargetColumns. Used and required only with smotenc.",
44
+ "datatype": "TABLE_ALIAS",
45
+ "allowsLists": false,
46
+ "rName": "encoding.data",
47
+ "useInR": true,
48
+ "rOrderNum": 2
49
+ }
50
+ ],
51
+ "argument_clauses": [
52
+ {
53
+ "targetTable": [
54
+ "InputTable"
55
+ ],
56
+
57
+ "checkDuplicate": true,
58
+ "allowedTypes": [],
59
+ "allowedTypeGroups": [
60
+ "INTEGER"
61
+ ],
62
+
63
+ "matchLengthOfArgument": "",
64
+ "allowPadding": false,
65
+ "name": "IDColumn",
66
+ "alternateNames": [],
67
+ "isRequired": true,
68
+ "rDescription": "specifies the name of the column that uniquely identifies a data sample in the input table.",
69
+ "description": "specifies the name of the column that uniquely identifies a data sample in the input table.",
70
+ "datatype": "COLUMNS",
71
+ "allowsLists": false,
72
+ "rName": "id.column",
73
+ "useInR": true,
74
+ "rOrderNum": 3
75
+ },
76
+ {
77
+ "targetTable": [
78
+ "InputTable"
79
+ ],
80
+ "checkDuplicate": true,
81
+ "allowedTypes": [],
82
+ "allowedTypeGroups": [
83
+ "NUMERIC"
84
+ ],
85
+
86
+ "matchLengthOfArgument": "",
87
+ "allowPadding": false,
88
+ "name": "ResponseColumn",
89
+ "alternateNames": [],
90
+ "isRequired": false,
91
+ "rDescription": "specifies the name of the input table column that contains the numeric value to be used as the response value for a sample.",
92
+ "description": "specifies the name of the input table column that contains the numeric value to be used as the response value for a sample.",
93
+ "datatype": "COLUMNS",
94
+ "allowsLists": false,
95
+ "rName": "response.column",
96
+ "useInR": true,
97
+ "rOrderNum": 4
98
+ },
99
+ {
100
+ "targetTable": [
101
+ "InputTable"
102
+ ],
103
+ "checkDuplicate": true,
104
+ "allowedTypes": [],
105
+ "allowedTypeGroups": [
106
+ "NUMERIC"
107
+ ],
108
+ "matchLengthOfArgument": "",
109
+ "allowPadding": false,
110
+ "name": "InputColumns",
111
+ "alternateNames": [],
112
+ "isRequired": true,
113
+ "rDescription": "specifies the name of the input table columns that the function uses for oversampling.",
114
+ "description": "specifies the name of the input table columns that the function uses for oversampling.",
115
+ "datatype": "COLUMNS",
116
+ "allowsLists": true,
117
+ "rName": "input.columns",
118
+ "useInR": true,
119
+ "rOrderNum": 5
120
+ },
121
+ {
122
+ "targetTable": [
123
+ "InputTable"
124
+ ],
125
+ "checkDuplicate": true,
126
+ "allowedTypes": [],
127
+ "allowedTypeGroups": [
128
+ "STRING"
129
+ ],
130
+ "matchLengthOfArgument": "",
131
+ "allowPadding": false,
132
+ "name": "CategoricalInputColumns",
133
+ "alternateNames": [],
134
+ "isRequired": false,
135
+ "rDescription": "specifies the name of the categorical columns in the input table that the function uses for oversampling with smotenc.",
136
+ "description": "specifies the name of the categorical columns in the input table that the function uses for oversampling with smotenc.",
137
+ "datatype": "COLUMNS",
138
+ "allowsLists": true,
139
+ "rName": "categorical.columns",
140
+ "useInR": true,
141
+ "rOrderNum": 6
142
+ },
143
+ {
144
+ "isOutputColumn": false,
145
+ "name": "MedianStandardDeviation",
146
+ "alternateNames": [],
147
+ "isRequired": false,
148
+ "rDescription": "specifies the median of the standard deviations computed over the numerical input columns. Required only with smotenc.",
149
+ "description": "specifies the median of the standard deviations computed over the numerical input columns. Required only with smotenc.",
150
+ "datatype": "DOUBLE",
151
+ "allowsLists": false,
152
+ "rName": "median.standard.deviation",
153
+ "useInR": true,
154
+ "rOrderNum": 7
155
+ },
156
+ {
157
+ "isOutputColumn": false,
158
+ "name": "MinorityClass",
159
+ "alternateNames": [],
160
+ "isRequired": true,
161
+ "rDescription": "specifies the minority class for which synthetic samples need to be generated. The label for minority class under response column must be numeric integer.",
162
+ "description": "specifies the minority class for which synthetic samples need to be generated. The label for minority class under response column must be numeric integer.",
163
+ "datatype": "STRING",
164
+ "allowsLists": false,
165
+ "rName": "minority.class",
166
+ "useInR": true,
167
+ "rOrderNum": 8
168
+ },
169
+ {
170
+ "isOutputColumn": false,
171
+ "allowNaN": false,
172
+ "name": "OversamplingFactor",
173
+ "alternateNames": [],
174
+ "isRequired": true,
175
+ "rDescription": "specifies the factor for oversampling the minority class.",
176
+ "description": "specifies the factor for oversampling the minority class.",
177
+ "datatype": "DOUBLE",
178
+ "allowsLists": false,
179
+ "rName": "oversampling.factor",
180
+ "useInR": true,
181
+ "rOrderNum": 9
182
+ },
183
+ {
184
+ "permittedValues": ["smote", "adasyn", "borderline","smotenc"],
185
+ "isOutputColumn": false,
186
+ "defaultValue": "smote",
187
+ "name": "SamplingStrategy",
188
+ "alternateNames": [],
189
+ "isRequired": false,
190
+ "rDescription": "specifies the oversampling algorithm to be used to create synthetic samples.",
191
+ "description": "specifies the oversampling algorithm to be used to create synthetic samples.",
192
+ "datatype": "STRING",
193
+ "allowsLists": false,
194
+ "rName": "sampling.strategy",
195
+ "useInR": true,
196
+ "rOrderNum": 10
197
+ },
198
+ {
199
+ "defaultValue": true,
200
+ "isOutputColumn": false,
201
+ "name": "FillSampleID",
202
+ "isRequired": false,
203
+ "rDescription": "A boolean flag which specifies whether the function should write out the id of the observation used to generate the corresponding new synthetic observations.",
204
+ "description": "A boolean flag which specifies whether the function should write out the id of the observation used to generate the corresponding new synthetic observations.",
205
+ "datatype": "BOOLEAN",
206
+ "allowsLists": false,
207
+ "rName": "fill.sampleid",
208
+ "useInR": true,
209
+ "rOrderNum": 11
210
+ },
211
+ {
212
+ "permittedValues": ["sample", "neighbor", "null"],
213
+ "isOutputColumn": false,
214
+ "defaultValue": "sample",
215
+ "name": "ValueForNonInputColumns",
216
+ "alternateNames": [],
217
+ "isRequired": false,
218
+ "rDescription": "Specifies the value to put in a sample column for columns not specified as input columns.",
219
+ "description": "Specifies the value to put in a sample column for columns not specified as input columns.",
220
+ "datatype": "STRING",
221
+ "allowsLists": false,
222
+ "rName": "noninput.columns.value",
223
+ "useInR": true,
224
+ "rOrderNum": 12
225
+ },
226
+ {
227
+ "defaultValue": 5,
228
+ "lowerBound": 2,
229
+ "upperBound": 100,
230
+ "lowerBoundType": "INCLUSIVE",
231
+ "upperBoundType": "INCLUSIVE",
232
+ "allowNaN": false,
233
+ "isOutputColumn": false,
234
+ "matchLengthOfArgument": "",
235
+ "allowPadding": false,
236
+ "name": "NumberOfNeighbors",
237
+ "alternateNames": [],
238
+ "isRequired": false,
239
+ "rDescription": "Specifies the number of nearest neighbors for choosing the sample to be used in oversampling.",
240
+ "description": "Specifies the number of nearest neighbors for choosing the sample to be used in oversampling.",
241
+ "datatype": "INTEGER",
242
+ "allowsLists": false,
243
+ "rName": "n.neighbors",
244
+ "useInR": true,
245
+ "rOrderNum": 13
246
+ },
247
+ {
248
+ "lowerBound": 0,
249
+ "upperBound": 186006,
250
+ "lowerBoundType": "INCLUSIVE",
251
+ "upperBoundType": "INCLUSIVE",
252
+ "allowNaN": false,
253
+ "name": "Seed",
254
+ "alternateNames": [],
255
+ "isRequired": false,
256
+ "rDescription": "Specify the random seed the algorithm uses for repeatable results. The function uses the seed for random interpolation and to generate the synthetic sample.",
257
+ "description": "Specify the random seed the algorithm uses for repeatable results. The function uses the seed for random interpolation and to generate the synthetic sample.",
258
+ "datatype": "INTEGER",
259
+ "allowsLists": false,
260
+ "rName": "seed",
261
+ "useInR": true,
262
+ "rOrderNum": 14
263
+ }
264
+ ]
265
+ }
266
+
@@ -0,0 +1,278 @@
1
+ {
2
+ "json_schema_major_version": "1",
3
+ "json_schema_minor_version": "1",
4
+ "json_content_version": "1",
5
+ "function_name": "TD_VectorDistance",
6
+ "function_version": "1.0",
7
+ "function_type": "fastpath",
8
+ "function_category": "Model Training",
9
+ "function_alias_name": "TD_VectorDistance",
10
+ "function_r_name": "aa.td_vectordistance",
11
+ "short_description": "fastpath function which takes a table of target vectors and a table of reference vectors (optional) and returns a table that contains the distance between the target-reference pair.",
12
+ "long_description": "fastpath function which takes a table of target vectors and a table of reference vectors (optional) and returns a table that contains the distance between the target-reference pair.",
13
+ "input_tables": [
14
+ {
15
+ "requiredInputKind": [
16
+ "PartitionByAny"
17
+ ],
18
+ "isOrdered": false,
19
+ "partitionByOne": false,
20
+ "name": "TargetTable",
21
+ "alternateNames": [],
22
+ "isRequired": true,
23
+ "rDescription": "The relation that contains target table vectors.",
24
+ "description": "The relation that contains target table vectors.",
25
+ "datatype": "TABLE_ALIAS",
26
+ "allowsLists": false,
27
+ "rName": "target.table",
28
+ "useInR": true,
29
+ "rOrderNum": 1
30
+ },
31
+ {
32
+ "requiredInputKind": [
33
+ "Dimension"
34
+ ],
35
+ "isOrdered": false,
36
+ "partitionByOne": false,
37
+ "name": "ReferenceTable",
38
+ "alternateNames": [],
39
+ "isRequired": false,
40
+ "rDescription": "The relation that contains reference table vectors.",
41
+ "description": "The relation that contains reference table vectors.",
42
+ "datatype": "TABLE_ALIAS",
43
+ "allowsLists": false,
44
+ "rName": "reference.table",
45
+ "useInR": true,
46
+ "rOrderNum": 2
47
+ }
48
+ ],
49
+ "argument_clauses": [
50
+ {
51
+ "targetTable": [
52
+ "TargetTable"
53
+ ],
54
+ "checkDuplicate": true,
55
+ "allowedTypes": [],
56
+ "allowedTypeGroups": [
57
+ "INTEGER"
58
+ ],
59
+ "requiredLength": 1,
60
+ "matchLengthOfArgument": "",
61
+ "allowPadding": false,
62
+ "name": "TargetIDColumn",
63
+ "alternateNames": [],
64
+ "isRequired": true,
65
+ "rDescription": "Specifies the name of the target table column that contains identifiers of the target table vectors.",
66
+ "description": "Specifies the name of the target table column that contains identifiers of the target table vectors.",
67
+ "datatype": "COLUMNS",
68
+ "allowsLists": false,
69
+ "rName": "target.id.column",
70
+ "useInR": true,
71
+ "rOrderNum": 3
72
+ },
73
+ {
74
+ "targetTable": [
75
+ "TargetTable"
76
+ ],
77
+ "checkDuplicate": true,
78
+ "allowedTypes": [],
79
+ "allowedTypeGroups": [
80
+ "NUMERIC","AIVECTOR","BYTE","VARBYTE"
81
+ ],
82
+ "matchLengthOfArgument": "",
83
+ "allowPadding": false,
84
+ "name": "TargetFeatureColumns",
85
+ "alternateNames": [],
86
+ "isRequired": true,
87
+ "rDescription": "Specifies the names of the target table columns that contain features of the target table vectors.",
88
+ "description": "Specifies the names of the target table columns that contain features of the target table vectors.",
89
+ "datatype": "COLUMNS",
90
+ "allowsLists": true,
91
+ "rName": "target.feature.columns",
92
+ "useInR": true,
93
+ "rOrderNum": 4
94
+ },
95
+ {
96
+ "targetTable": [
97
+ "ReferenceTable"
98
+ ],
99
+ "checkDuplicate": true,
100
+ "allowedTypes": [],
101
+ "allowedTypeGroups": [
102
+ "INTEGER"
103
+ ],
104
+ "requiredLength": 1,
105
+ "matchLengthOfArgument": "",
106
+ "allowPadding": false,
107
+ "name": "RefIDColumn",
108
+ "alternateNames": [],
109
+ "isRequired": false,
110
+ "rDescription": "Specifies the name of the reference table column that contains identifiers of the reference table vectors.",
111
+ "description": "Specifies the name of the reference table column that contains identifiers of the reference table vectors.",
112
+ "datatype": "COLUMNS",
113
+ "allowsLists": false,
114
+ "rName": "ref.id.column",
115
+ "useInR": true,
116
+ "rOrderNum": 5
117
+ },
118
+ {
119
+ "targetTable": [
120
+ "ReferenceTable"
121
+ ],
122
+ "checkDuplicate": true,
123
+ "allowedTypes": [],
124
+ "allowedTypeGroups": [
125
+ "NUMERIC","AIVECTOR","BYTE","VARBYTE"
126
+ ],
127
+ "matchLengthOfArgument": "",
128
+ "allowPadding": false,
129
+ "name": "RefFeatureColumns",
130
+ "alternateNames": [],
131
+ "isRequired": false,
132
+ "rDescription": "Specifies the names of the reference table columns that contain features of the reference table vectors.",
133
+ "description": "Specifies the names of the reference table columns that contain features of the reference table vectors.",
134
+ "datatype": "COLUMNS",
135
+ "allowsLists": true,
136
+ "rName": "ref.feature.columns",
137
+ "useInR": true,
138
+ "rOrderNum": 6
139
+ },
140
+ {
141
+ "permittedValues": [
142
+ "COSINE",
143
+ "EUCLIDEAN",
144
+ "MANHATTAN",
145
+ "DOTPRODUCT",
146
+ "MINKOWSKI"
147
+ ],
148
+ "defaultValue": "COSINE",
149
+ "isOutputColumn": false,
150
+ "matchLengthOfArgument": "",
151
+ "allowPadding": false,
152
+ "name": "DistanceMeasure",
153
+ "alternateNames": [],
154
+ "isRequired": false,
155
+ "rDescription": "Specifies the distance measures that the function uses. The default value is 'cosine'.",
156
+ "description": "Specifies the distance measures that the function uses. The default value is 'cosine'.",
157
+ "datatype": "STRING",
158
+ "allowsLists": true,
159
+ "rName": "distance.measure",
160
+ "useInR": true,
161
+ "rOrderNum": 7
162
+ },
163
+ {
164
+ "defaultValue": 10,
165
+ "lowerBound": 1,
166
+ "upperBound": 100,
167
+ "lowerBoundType": "INCLUSIVE",
168
+ "upperBoundType": "INCLUSIVE",
169
+ "allowNaN": false,
170
+ "isOutputColumn": false,
171
+ "matchLengthOfArgument": "",
172
+ "allowPadding": false,
173
+ "name": "TopK",
174
+ "alternateNames": [],
175
+ "isRequired": false,
176
+ "rDescription": "Specifies, for each target vector and for each measure, the maximum number of closest reference vectors to include in the output table.",
177
+ "description": "Specifies, for each target vector and for each measure, the maximum number of closest reference vectors to include in the output table.",
178
+ "datatype": "INTEGER",
179
+ "allowsLists": false,
180
+ "rName": "topk",
181
+ "useInR": true,
182
+ "rOrderNum": 8
183
+ },
184
+ {
185
+ "defaultValue": 2,
186
+ "lowerBound": 1,
187
+ "upperBound": 2147483647,
188
+ "lowerBoundType": "INCLUSIVE",
189
+ "upperBoundType": "INCLUSIVE",
190
+ "allowNaN": false,
191
+ "isOutputColumn": false,
192
+ "matchLengthOfArgument": "",
193
+ "allowPadding": false,
194
+ "name": "PValue",
195
+ "alternateNames": [],
196
+ "isRequired": false,
197
+ "rDescription": "Specify the p value for Minkowski distance.",
198
+ "description": "Specify the p value for Minkowski distance.",
199
+ "datatype": "INTEGER",
200
+ "allowsLists": false,
201
+ "rName": "pvalue",
202
+ "useInR": true,
203
+ "rOrderNum": 9
204
+ },
205
+ {
206
+ "lowerBound": 2.225074e-308,
207
+ "upperBound": 1.797693e+308,
208
+ "lowerBoundType": "INCLUSIVE",
209
+ "upperBoundType": "INCLUSIVE",
210
+ "allowNaN": false,
211
+ "isOutputColumn": false,
212
+ "matchLengthOfArgument": "",
213
+ "allowPadding": false,
214
+ "name": "SearchThresholds",
215
+ "alternateNames": [],
216
+ "isRequired": false,
217
+ "rDescription": "Specifies the thresholds between a pair of target and reference vectors.",
218
+ "description": "Specifies the thresholds between a pair of target and reference vectors.",
219
+ "datatype": "NUMERIC",
220
+ "allowsLists": true,
221
+ "rName": "search.thresholds",
222
+ "useInR": true,
223
+ "rOrderNum": 10
224
+ },
225
+ {
226
+ "permittedValues": [],
227
+ "isOutputColumn": false,
228
+ "matchLengthOfArgument": "",
229
+ "allowPadding": false,
230
+ "defaultValue": false,
231
+ "name": "LargeReferenceInput",
232
+ "alternateNames": [],
233
+ "isRequired": false,
234
+ "rDescription": "If the reference table is huge compared to the target table, then passing true in this syntax element will make the reference table as 'Partition By any' instead of 'Dimension'.",
235
+ "description": "If the reference table is huge compared to the target table, then passing true in this syntax element will make the reference table as 'Partition By any' instead of 'Dimension'.",
236
+ "datatype": "BOOLEAN",
237
+ "allowsLists": false,
238
+ "rName": "largereference.input",
239
+ "useInR": true,
240
+ "rOrderNum": 11
241
+ },
242
+ {
243
+ "permittedValues": [],
244
+ "isOutputColumn": false,
245
+ "matchLengthOfArgument": "",
246
+ "allowPadding": false,
247
+ "defaultValue": false,
248
+ "name": "OutputSimilarity",
249
+ "alternateNames": [],
250
+ "isRequired": false,
251
+ "rDescription": "Specify true if the user wants similarity instead of distance.",
252
+ "description": "Specify true if the user wants similarity instead of distance.",
253
+ "datatype": "BOOLEAN",
254
+ "allowsLists": false,
255
+ "rName": "output.similarity",
256
+ "useInR": true,
257
+ "rOrderNum": 12
258
+ },
259
+ {
260
+ "defaultValue": 1,
261
+ "lowerBound": 1,
262
+ "upperBound": 4096,
263
+ "lowerBoundType": "INCLUSIVE",
264
+ "upperBoundType": "INCLUSIVE",
265
+ "allowNaN": false,
266
+ "name": "EmbeddingSize",
267
+ "alternateNames": [],
268
+ "isRequired": false,
269
+ "rDescription": "Specify the embedding size of the vectors.",
270
+ "description": "Specify the embedding size of the vectors.",
271
+ "datatype": "INTEGER",
272
+ "allowsLists": false,
273
+ "rName": "embedding.size",
274
+ "useInR": true,
275
+ "rOrderNum": 13
276
+ }
277
+ ]
278
+ }
@@ -0,0 +1,71 @@
1
+ {
2
+ "FuncName": "TD_COPYART",
3
+ "FuncDescriptionShort": "TD_COPYART creates a copy of existing ART table.",
4
+ "FuncDescriptionLong": [
5
+ "creates a copy of an existing ART table with permanent or volatile option."
6
+ ],
7
+ "FunctionVersion": "...",
8
+ "FunctionCategory": "General Utility",
9
+ "JSONVersion": "1",
10
+ "FuncRName": "td_Copy_Art",
11
+ "MaxInputFiles": 0,
12
+ "Input": [],
13
+ "Output": [],
14
+ "Params": [
15
+ {
16
+ "Name": "DST_DATABASENAME",
17
+ "Type": "string",
18
+ "Optional": false,
19
+ "Description": [
20
+ "Name of the target database.",
21
+ "This is the database where DST_TABLENAME needs to be created."
22
+ ],
23
+ "LangName": "database_name"
24
+ },
25
+ {
26
+ "Name": "DST_TABLENAME",
27
+ "Type": "string",
28
+ "Optional": false,
29
+ "Description": [
30
+ "Name of the target table."
31
+ ],
32
+ "LangName": "table_name"
33
+ },
34
+ {
35
+ "Name": "DST_MAPNAME",
36
+ "Type": "string",
37
+ "Optional": false,
38
+ "Description": [
39
+ "[Optional] If not specified, the default map is used.",
40
+ "Provided name of the map to be used for the copy."
41
+ ],
42
+ "LangName": "map_name"
43
+ },
44
+ {
45
+ "Name": "DST_ISPERMTABLE",
46
+ "Type": "string",
47
+ "Optional": true,
48
+ "PermittedValues": [
49
+ "T",
50
+ "TRUE",
51
+ "F",
52
+ "FALSE",
53
+ "t",
54
+ "true",
55
+ "'true'",
56
+ "'false'",
57
+ "f",
58
+ "false"
59
+ ],
60
+ "Description": [
61
+ "[Optional] If not specified, the default is true.",
62
+ "If true, the target table is permanent.",
63
+ "If false, the target table is volatile."
64
+ ],
65
+ "LangName": "permanent_table"
66
+ }
67
+ ],
68
+ "IsPlottable": true,
69
+ "InputFmt": false,
70
+ "OutputFmt": false
71
+ }