@frontlinesystems/rason-mcp-server 2026.5.1 → 2026.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. package/LICENSE +35 -35
  2. package/examples/EXAMPLES_REFERENCE.md +128 -128
  3. package/examples/{optimization → Optimization}/Conic/AirlineHubConic.json +111 -111
  4. package/examples/{optimization → Optimization}/Conic/AirlineHubConic2.json +108 -108
  5. package/examples/{optimization → Optimization}/Conic/AirlineHubConic3.json +111 -111
  6. package/examples/{optimization → Optimization}/Conic/AirlineHubConic4.json +99 -99
  7. package/examples/{optimization → Optimization}/Conic/AirlineHubConic5.json +101 -101
  8. package/examples/{optimization → Optimization}/DataBinding/ProductMixCsv.json +81 -81
  9. package/examples/{optimization → Optimization}/DataBinding/ProductMixCsv4.json +96 -96
  10. package/examples/{optimization → Optimization}/DataBinding/ProductMixExcel.json +73 -73
  11. package/examples/{optimization → Optimization}/DataBinding/ProductMixExcel1.json +86 -86
  12. package/examples/{optimization → Optimization}/DataBinding/ProductMixExcel11.json +108 -108
  13. package/examples/{optimization → Optimization}/DataBinding/ProductMixExcel2.json +77 -77
  14. package/examples/{optimization → Optimization}/DataBinding/ProductMixTab.json +89 -89
  15. package/examples/{optimization → Optimization}/DataBinding/ProductMixTab1.json +73 -73
  16. package/examples/{optimization → Optimization}/DataBinding/ProductMixTab2.json +77 -77
  17. package/examples/{optimization → Optimization}/Linear/Inventory.json +199 -199
  18. package/examples/{optimization → Optimization}/Linear/Matop.json +119 -119
  19. package/examples/{optimization → Optimization}/Linear/ProductMix.json +97 -97
  20. package/examples/{optimization → Optimization}/Linear/ProductMix2.json +72 -72
  21. package/examples/{optimization → Optimization}/Linear/ProductMix3.json +49 -49
  22. package/examples/{optimization → Optimization}/Linear/ProductMix4.json +56 -56
  23. package/examples/{optimization → Optimization}/Linear/ProductMixCsv1.json +106 -106
  24. package/examples/{optimization → Optimization}/Linear/ProductMixCsv2.json +106 -106
  25. package/examples/{optimization → Optimization}/Linear/ProductMixSQL11.json +82 -82
  26. package/examples/{optimization → Optimization}/Linear/Rowop.json +126 -126
  27. package/examples/{optimization → Optimization}/NonLinear/AirlineHub.json +63 -63
  28. package/examples/{optimization → Optimization}/NonLinear/AirlineHub2.json +47 -47
  29. package/examples/{optimization → Optimization}/NonLinear/AirlineHub3.json +47 -47
  30. package/examples/{optimization → Optimization}/NonSmooth/Inventory2.json +159 -159
  31. package/examples/{optimization → Optimization}/Quadratic/PortfolioOpt.json +55 -55
  32. package/examples/{optimization → Optimization}/Quadratic/PortfolioOpt2.json +65 -65
  33. package/examples/{optimization → Optimization}/WithUncertainty/GasCompanyChance.json +78 -78
  34. package/examples/{optimization → Optimization}/WithUncertainty/GasCompanyRecourse.json +78 -78
  35. package/examples/{optimization → Optimization}/WithUncertainty/ProjectSelect.json +77 -77
  36. package/examples/{optimization → Optimization}/WithUncertainty/ProjectSelect2.json +81 -81
  37. package/examples/{optimization → Optimization}/WithUncertainty/ProjectSelect3.json +84 -84
  38. package/examples/{optimization → Optimization}/WithUncertainty/ProjectSelect4.json +74 -74
  39. package/examples/{simulation → Simulation}/CandyStoreSalesUsingSIP.json +147 -147
  40. package/examples/{simulation → Simulation}/CollegeFundGrowth1.json +423 -423
  41. package/examples/{simulation → Simulation}/CollegeFundGrowth1SIPModel.json +27 -27
  42. package/examples/{simulation → Simulation}/CollegeFundGrowth2.json +415 -415
  43. package/examples/{simulation → Simulation}/CollegeFundGrowthSIP.json +401 -401
  44. package/examples/{simulation → Simulation}/GBMSimulationModel.json +236 -236
  45. package/examples/{simulation → Simulation}/YieldManagement(Sim).json +69 -69
  46. package/examples/{simulation → Simulation}/YieldManagement2(Sim).json +72 -72
  47. package/examples/calculation/DMNExamples/DMN Box Fun with typeDef result.json +53 -53
  48. package/examples/calculation/DMNExamples/DMN Context example.json +69 -69
  49. package/examples/calculation/DMNExamples/DMN DT with typeDef result.json +43 -43
  50. package/examples/calculation/DMNExamples/FEEL Date Time example.json +28 -28
  51. package/examples/calculation/DMNExamples/FEEL For iteration example.json +66 -66
  52. package/examples/calculation/DMNExamples/FEEL For with two indices.json +15 -15
  53. package/examples/calculation/DMNExamples/FEEL For with typeDef result.json +88 -88
  54. package/examples/calculation/DMNExamples/FEEL If Then Else example.json +25 -25
  55. package/examples/calculation/DMNExamples/FEEL List example.json +37 -37
  56. package/examples/calculation/DMNExamples/FEEL List operator.json +17 -17
  57. package/examples/calculation/DMNExamples/FEEL List with typeDef collection.json +36 -36
  58. package/examples/calculation/DMNExamples/FEEL Some or Every example.json +65 -65
  59. package/examples/calculation/DecisionTables/DT Datasource example.json +52 -52
  60. package/examples/calculation/DecisionTables/DT Date and Time examples.json +91 -91
  61. package/examples/calculation/DecisionTables/DT Expression example.json +32 -32
  62. package/examples/calculation/DecisionTables/DT Hit Policy examples.json +136 -136
  63. package/examples/calculation/DecisionTables/DT Loan Recommend model.json +81 -81
  64. package/examples/calculation/DecisionTables/DT Loan Strategy Model and Predictive CSV-XML.json +218 -218
  65. package/examples/calculation/DecisionTables/DT Loan Strategy model and Datasource.json +286 -286
  66. package/examples/calculation/DecisionTables/DT Loan Strategy model and Predictive.json +203 -203
  67. package/examples/calculation/DecisionTables/DT Loan Strategy model by scratch.json +214 -214
  68. package/examples/calculation/DecisionTables/DT Output Order example.json +39 -39
  69. package/examples/calculation/DecisionTables/DT Unique example.json +38 -38
  70. package/examples/calculation/TypeDefinitions/TypeDefCF.json +64 -64
  71. package/examples/calculation/TypeDefinitions/TypeDefDT.json +57 -57
  72. package/examples/datamining/AffinityAnalysis/AssociationRules.json +51 -51
  73. package/examples/datamining/Classification/DecisionTree.json +90 -90
  74. package/examples/datamining/Classification/DiscriminantAnalysis.json +81 -81
  75. package/examples/datamining/Classification/Ensembles/Bagging.json +66 -66
  76. package/examples/datamining/Classification/Ensembles/Boosting.json +67 -67
  77. package/examples/datamining/Classification/Ensembles/RandomTrees.json +91 -91
  78. package/examples/datamining/Classification/FindBestModel.json +86 -86
  79. package/examples/datamining/Classification/LogisticRegression.json +82 -82
  80. package/examples/datamining/Classification/NaiveBayes.json +78 -78
  81. package/examples/datamining/Classification/NearestNeighbors.json +84 -84
  82. package/examples/datamining/Classification/NeuralNetwork.json +92 -92
  83. package/examples/datamining/Clustering/Hierarchical.json +54 -54
  84. package/examples/datamining/Clustering/KMeans.json +71 -71
  85. package/examples/datamining/DataSources/DelimitedFile.json +49 -49
  86. package/examples/datamining/DataSources/JSONFile.json +49 -49
  87. package/examples/datamining/DataSources/MSAccessDatabase.json +49 -49
  88. package/examples/datamining/DataSources/MSExcelTable.json +50 -50
  89. package/examples/datamining/DataSources/MSSQLDatabase.json +49 -49
  90. package/examples/datamining/DataSources/ODATATable.json +49 -49
  91. package/examples/datamining/DataSources/ODBCDatabase.json +49 -49
  92. package/examples/datamining/FeatureSelection/LinearWrapping.json +53 -53
  93. package/examples/datamining/FeatureSelection/LogisticWrapping.json +56 -56
  94. package/examples/datamining/FeatureSelection/Univariate.json +78 -78
  95. package/examples/datamining/Regression/DecisionTree.json +82 -82
  96. package/examples/datamining/Regression/Ensembles/Bagging.json +62 -62
  97. package/examples/datamining/Regression/Ensembles/Boosting.json +62 -62
  98. package/examples/datamining/Regression/Ensembles/RandomTrees.json +78 -78
  99. package/examples/datamining/Regression/FindBestModel.json +86 -86
  100. package/examples/datamining/Regression/LinearRegression.json +124 -124
  101. package/examples/datamining/Regression/NearestNeighbors.json +77 -77
  102. package/examples/datamining/Regression/NeuralNetwork.json +82 -82
  103. package/examples/datamining/Scoring/JSONClassifier.json +62 -62
  104. package/examples/datamining/Scoring/JSONClassifierNN.json +62 -62
  105. package/examples/datamining/Scoring/JSONClusterizer.json +37 -37
  106. package/examples/datamining/Scoring/JSONForecaster.json +49 -49
  107. package/examples/datamining/Scoring/JSONLinearRegression.json +56 -56
  108. package/examples/datamining/Scoring/JSONPCA.json +41 -41
  109. package/examples/datamining/Scoring/JSONRegressor.json +56 -56
  110. package/examples/datamining/Scoring/JSONTransformer.json +38 -38
  111. package/examples/datamining/Scoring/PMMLClassifier.json +42 -42
  112. package/examples/datamining/Scoring/PMMLForecaster.json +43 -43
  113. package/examples/datamining/Scoring/PMMLRegressor.json +38 -38
  114. package/examples/datamining/Scoring/PMMLTransformer.json +38 -38
  115. package/examples/datamining/Simulation/LinearRegressionSimulation.json +117 -117
  116. package/examples/datamining/Simulation/SyntheticDataGeneration.json +108 -108
  117. package/examples/datamining/Simulation/pmml-risk-scoring.json +62 -62
  118. package/examples/datamining/Summarizer/Summarization.json +54 -54
  119. package/examples/datamining/TextMining/LatentSemanticAnalysis.json +51 -51
  120. package/examples/datamining/TextMining/TfIdf-FileData.json +65 -65
  121. package/examples/datamining/TextMining/TfIdf-InlineData.json +55 -55
  122. package/examples/datamining/TimeSeries/AddHoltWinters.json +79 -79
  123. package/examples/datamining/TimeSeries/Arima.json +74 -74
  124. package/examples/datamining/TimeSeries/DoubleExponential.json +65 -65
  125. package/examples/datamining/TimeSeries/Exponential.json +64 -64
  126. package/examples/datamining/TimeSeries/LagAnalysis.json +48 -48
  127. package/examples/datamining/TimeSeries/MovingAverage.json +65 -65
  128. package/examples/datamining/TimeSeries/MulHoltWinters.json +65 -65
  129. package/examples/datamining/TimeSeries/NoTrendHoltWinters.json +65 -65
  130. package/examples/datamining/Transformation/Binning.json +69 -69
  131. package/examples/datamining/Transformation/CanonicalVariateAnalysis.json +47 -47
  132. package/examples/datamining/Transformation/CategoryReduction.json +51 -51
  133. package/examples/datamining/Transformation/Factorization.json +50 -50
  134. package/examples/datamining/Transformation/MissingDataHandling.json +83 -83
  135. package/examples/datamining/Transformation/OneHotEncoding-DataInline.json +54 -54
  136. package/examples/datamining/Transformation/OneHotEncoding-DatainFile.json +48 -48
  137. package/examples/datamining/Transformation/PartitionTimeSeries.json +48 -48
  138. package/examples/datamining/Transformation/Partitioning-DF.json +72 -72
  139. package/examples/datamining/Transformation/Partitioning.json +46 -46
  140. package/examples/datamining/Transformation/PartitioningWithOversampling-DF.json +65 -65
  141. package/examples/datamining/Transformation/PartitioningWithOversampling.json +44 -44
  142. package/examples/datamining/Transformation/PrincipalComponentsAnalysis.json +52 -52
  143. package/examples/datamining/Transformation/Rescaling.json +67 -67
  144. package/examples/datamining/Transformation/Sampling.json +43 -43
  145. package/examples/datamining/Transformation/StratifiedSampling.json +46 -46
  146. package/examples/flow/SQLServerTransform.json +260 -260
  147. package/examples/flow/dm-calc-pipeline.json +277 -277
  148. package/examples/flow/dm-pipeline-simulation.json +113 -113
  149. package/examples/flow/opt-sim-pipeline.json +159 -159
  150. package/examples/flow/sim-dm-pipeline.json +106 -106
  151. package/examples/flow/sim-sim-pipeline.json +136 -136
  152. package/examples/index.json +4678 -4678
  153. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/DataFiltering/ListwithFilter.json +52 -52
  154. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/Loops/ProductMix5.json +57 -57
  155. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/Loops/compoundWhileStatement.json +35 -35
  156. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/Loops/ifThenElseStatement.json +33 -33
  157. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/Loops/nestedLoop.json +25 -25
  158. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/ParallelArray.json +47 -47
  159. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/indexedArray.json +69 -69
  160. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/nonParallelArray.json +49 -49
  161. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/sumAggregateExample.json +337 -337
  162. package/examples/rason-features/Arrays_Loops_Tables/ArrayExamples/tsp.json +61 -61
  163. package/examples/rason-features/BoxIterators/Box_Fun_Loop_Iter_Sim_RASON.json +190 -190
  164. package/examples/rason-features/BoxIterators/Box_Fun_Loop_Sim_RASON.json +75 -75
  165. package/examples/rason-features/BoxIterators/Box_Fun_Sim_RASON.json +108 -108
  166. package/examples/rason-features/BoxIterators/Box_Iter_SIM_RASON.json +68 -68
  167. package/examples/rason-features/BoxIterators/Box_Iterator_Calc_Loop.json +183 -183
  168. package/examples/rason-features/BoxIterators/Box_Iterator_with_typeDef_partial.json +79 -79
  169. package/examples/rason-features/BoxLambdaExamples/BoxFunOptimize.json +154 -154
  170. package/examples/rason-features/BoxLambdaExamples/BoxFunSimulate.json +118 -118
  171. package/examples/rason-features/BoxLambdaExamples/LambdaFunOptimize.json +142 -142
  172. package/examples/rason-features/BoxLambdaExamples/LambdaFunSimulate.json +81 -81
  173. package/examples/rason-features/ReferenceGuide/RGFirehouseLocation.json +69 -69
  174. package/examples/rason-features/ReferenceGuide/RGFirehouseLocationConic.json +113 -113
  175. package/examples/rason-features/ReferenceGuide/RGProductMixCsv1.json +107 -107
  176. package/examples/rason-features/ReferenceGuide/RGProductMixExcel11.json +117 -117
  177. package/examples/rason-features/ReferenceGuide/RGProductMixSQL11.json +108 -108
  178. package/examples/rason-features/UserGuide/UGAirlineHubCSV.json +67 -67
  179. package/examples/rason-features/UserGuide/UGForecast.json +50 -50
  180. package/examples/rason-features/UserGuide/UGProductMix1.json +48 -48
  181. package/examples/rason-features/UserGuide/UGProductMix2.json +48 -48
  182. package/examples/rason-features/UserGuide/UGProductMixTab1.json +67 -67
  183. package/examples/rason-features/UserGuide/UGProductMixTab2.json +76 -76
  184. package/examples/rason-features/UserGuide/UGProductMixTab3.json +66 -66
  185. package/examples/rason-features/UserGuide/UGProductMixTab4.json +70 -70
  186. package/examples/rason-features/UserGuide/UGProductMixTab5.json +67 -67
  187. package/examples/rason-features/UserGuide/UGProjectSelect0.json +91 -91
  188. package/examples/rason-features/UserGuide/UGProjectSelect1.json +74 -74
  189. package/examples/rason-features/UserGuide/UGProjectSelect2.json +74 -74
  190. package/examples/rason-features/UserGuide/UGYieldManagement1.json +61 -61
  191. package/examples/rason-features/UserGuide/UGYieldManagement2.json +61 -61
  192. package/examples/rason-features/UserGuide/UGYieldManagement3.json +63 -63
  193. package/out/index.cjs +1 -1
  194. package/package.json +3 -2
@@ -1,63 +1,63 @@
1
- {
2
- "modelDescription": "Regression: Linear RASON model scoring from pmml and risk analysis. This example model first imports two datasources, a training partition and a file containing new data. Then each datasource is bound to a dataset. Afterwards a previously posted fitted model, linear-fitted, is used to score both datasets. The fitted model must first be POSTed to the RASON Server BEFORE this model can be POSTed. Download the fitted model by clicking the download icon above RASON Examples (on the ribbon). Then click the Open File icon (far left), browse to the downloaded files, and open the file, linear-fitted.xml. POST the fitted model by clicking the POST icon, cloud icon on the left of the ribbon.",
3
- "comment": "Fitted model, linear-fitted, must first be POSTed to RASON Server. (Click Download RASON Example data to download file.)",
4
- "modelName": "pmmlRiskScorer",
5
- "modelType": "datamining",
6
- "datasources": {
7
- "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
8
- "trainDataSource": {
9
- "comment": "Binds the bh-scale-reg.txt data set to the trainDataSource datasource. This represents the training partition.",
10
- "type": "csv",
11
- "connection": "bh-scale-reg.txt"
12
- },
13
- "newDataSource": {
14
- "comment": "Binds the bh-scale-reg-score.txt data set to the newDataSource datasource. This represents the new data to be scored.",
15
- "type": "csv",
16
- "connection": "bh-scale-reg-score.txt"
17
- }
18
- },
19
- "datasets": {
20
- "comment": "Binds each datasource to a dataset.",
21
- "trainData": {
22
- "comment": "Binds the data source trainDataSource (bh-scale-reg.txt) to the trainData dataset.",
23
- "binding": "trainDataSource",
24
- "targetCol": "MEDV"
25
- },
26
- "newData": {
27
- "comment": "Binds the data source newDataSource (bh-scale-reg-score.txt) to the newData dataset.",
28
- "binding": "newDataSource"
29
- }
30
- },
31
- "fittedModel": {
32
- "comment": "Binds an imported or POSTed fitted model to a fittedModel. This step is not optional.",
33
- "mlrModel": {
34
- "comment": "Binds the linear-fitted fitted model, already POSTed to the RASON Server, to mlrModel. Recall that this fitted model must first be downloaded (by clicking the Download RASON Examples icon) and then POSTed to the RASON Server (by clicking the POST icon, cloud icon on the top left).",
35
- "modelName": "linear-fitted",
36
- "simulation": {
37
- "metalogAuto": true,
38
- "useMinMaxAsBounds": true,
39
- "correlationType": "RANK",
40
- "sampleSize": 506,
41
- "randomSeed": 12345,
42
- "expression": "IF(CRIM<10, MEDV, 2*MEDV)"
43
- }
44
- }
45
- },
46
- "actions": {
47
- "comment": "define the actions, evaluations, and data to be used by the estimator defined above.",
48
- "trainPrediction": {
49
- "comment": "Scores the trainData dataset (bh-scale-reg.txt) using the fitted model, mlrModel. For a complete list of all available evaluations and parameters, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.) ",
50
- "data": "trainData",
51
- "fittedModel": "mlrModel",
52
- "action": "predict",
53
- "evaluations": [ "prediction", "simulationLog", "simulationData", "simulationPrediction", "simulationExpression", "trainingExpression", "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ]
54
- },
55
- "newPrediction": {
56
- "comment": "Scores the newData dataset (bh-scale-reg-score.txt) using the fitted model, mlrModel. For a complete list of all available evaluations and parameters, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
57
- "data": "newData",
58
- "fittedModel": "mlrModel",
59
- "action": "predict",
60
- "evaluations": [ "prediction", "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ]
61
- }
62
- }
1
+ {
2
+ "modelDescription": "Regression: Linear RASON model scoring from pmml and risk analysis. This example model first imports two datasources, a training partition and a file containing new data. Then each datasource is bound to a dataset. Afterwards a previously posted fitted model, linear-fitted, is used to score both datasets. The fitted model must first be POSTed to the RASON Server BEFORE this model can be POSTed. Download the fitted model by clicking the download icon above RASON Examples (on the ribbon). Then click the Open File icon (far left), browse to the downloaded files, and open the file, linear-fitted.xml. POST the fitted model by clicking the POST icon, cloud icon on the left of the ribbon.",
3
+ "comment": "Fitted model, linear-fitted, must first be POSTed to RASON Server. (Click Download RASON Example data to download file.)",
4
+ "modelName": "pmmlRiskScorer",
5
+ "modelType": "datamining",
6
+ "datasources": {
7
+ "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
8
+ "trainDataSource": {
9
+ "comment": "Binds the bh-scale-reg.txt data set to the trainDataSource datasource. This represents the training partition.",
10
+ "type": "csv",
11
+ "connection": "bh-scale-reg.txt"
12
+ },
13
+ "newDataSource": {
14
+ "comment": "Binds the bh-scale-reg-score.txt data set to the newDataSource datasource. This represents the new data to be scored.",
15
+ "type": "csv",
16
+ "connection": "bh-scale-reg-score.txt"
17
+ }
18
+ },
19
+ "datasets": {
20
+ "comment": "Binds each datasource to a dataset.",
21
+ "trainData": {
22
+ "comment": "Binds the data source trainDataSource (bh-scale-reg.txt) to the trainData dataset.",
23
+ "binding": "trainDataSource",
24
+ "targetCol": "MEDV"
25
+ },
26
+ "newData": {
27
+ "comment": "Binds the data source newDataSource (bh-scale-reg-score.txt) to the newData dataset.",
28
+ "binding": "newDataSource"
29
+ }
30
+ },
31
+ "fittedModel": {
32
+ "comment": "Binds an imported or POSTed fitted model to a fittedModel. This step is not optional.",
33
+ "mlrModel": {
34
+ "comment": "Binds the linear-fitted fitted model, already POSTed to the RASON Server, to mlrModel. Recall that this fitted model must first be downloaded (by clicking the Download RASON Examples icon) and then POSTed to the RASON Server (by clicking the POST icon, cloud icon on the top left).",
35
+ "modelName": "linear-fitted",
36
+ "simulation": {
37
+ "metalogAuto": true,
38
+ "useMinMaxAsBounds": true,
39
+ "correlationType": "RANK",
40
+ "sampleSize": 506,
41
+ "randomSeed": 12345,
42
+ "expression": "IF(CRIM<10, MEDV, 2*MEDV)"
43
+ }
44
+ }
45
+ },
46
+ "actions": {
47
+ "comment": "define the actions, evaluations, and data to be used by the estimator defined above.",
48
+ "trainPrediction": {
49
+ "comment": "Scores the trainData dataset (bh-scale-reg.txt) using the fitted model, mlrModel. For a complete list of all available evaluations and parameters, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.) ",
50
+ "data": "trainData",
51
+ "fittedModel": "mlrModel",
52
+ "action": "predict",
53
+ "evaluations": [ "prediction", "simulationLog", "simulationData", "simulationPrediction", "simulationExpression", "trainingExpression", "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ]
54
+ },
55
+ "newPrediction": {
56
+ "comment": "Scores the newData dataset (bh-scale-reg-score.txt) using the fitted model, mlrModel. For a complete list of all available evaluations and parameters, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
57
+ "data": "newData",
58
+ "fittedModel": "mlrModel",
59
+ "action": "predict",
60
+ "evaluations": [ "prediction", "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ]
61
+ }
62
+ }
63
63
  }
@@ -1,55 +1,55 @@
1
- {
2
- "modelName": "summarization",
3
- "modelDescription": "This RASON model example calls summarization to calculate statistics, percentiles and six sigma metrics for the dataset.",
4
- "modelType": "datamining",
5
- "datasources": {
6
- "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
- "mySrc": {
8
- "comment": "Binds the hald-small.txt data set to the mySrc datasource.",
9
- "type": "csv",
10
- "connection": "hald-small.txt"
11
- }
12
- },
13
- "datasets": {
14
- "comment": "Binds each datasource to a dataset.",
15
- "myData": {
16
- "comment": "Binds the data source mySrc (hald-small.txt) to the myData dataset.",
17
- "binding": "mySrc"
18
- }
19
- },
20
- "transformer": {
21
- "comment": "Defines a transformer, including the type, algorithm and parameters. Only 1 estimator/transformer may appear in a RASON model.",
22
- "summarizer": {
23
- "comment": "Defines the summarizer as a summarization transformer. For a complete list of all supported options for summarization, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
24
- "type": "transformation",
25
- "algorithm": "summarization",
26
- "parameters": {
27
- "numBins": [
28
- [ "X2", 4 ],
29
- [ "X4", 5 ]
30
- ]
31
- }
32
- }
33
- },
34
- "actions": {
35
- "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
36
- "mySummaries": {
37
- "comment": "Summarizes the myData dataset (hald-small.txt) using the summarization transformer. Various evaluations are requested such as summary information, six sigma metrics, percentiles, etc. For a complete list of all available parameters and evaluations for summarization, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
38
- "data": "myData",
39
- "action": "transform",
40
- "evaluations": [ "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ],
41
- "parameters": {
42
- "semiVariancePower": 2,
43
- "semiDeviationPower": 2,
44
- "varPercentile": 0.95,
45
- "cvarPercentile": 0.95,
46
- "meanConfidencePercentile": 0.95,
47
- "sixSigmaPercentileLB": 0.05,
48
- "sixSigmaPercentileUB": 0.95,
49
- "sixSigmaShift": 0.0,
50
- "sixSigmaNumStdDev": 6.0,
51
- "sixSigmaTarget": 0.0
52
- }
53
- }
54
- }
1
+ {
2
+ "modelName": "summarization",
3
+ "modelDescription": "This RASON model example calls summarization to calculate statistics, percentiles and six sigma metrics for the dataset.",
4
+ "modelType": "datamining",
5
+ "datasources": {
6
+ "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
+ "mySrc": {
8
+ "comment": "Binds the hald-small.txt data set to the mySrc datasource.",
9
+ "type": "csv",
10
+ "connection": "hald-small.txt"
11
+ }
12
+ },
13
+ "datasets": {
14
+ "comment": "Binds each datasource to a dataset.",
15
+ "myData": {
16
+ "comment": "Binds the data source mySrc (hald-small.txt) to the myData dataset.",
17
+ "binding": "mySrc"
18
+ }
19
+ },
20
+ "transformer": {
21
+ "comment": "Defines a transformer, including the type, algorithm and parameters. Only 1 estimator/transformer may appear in a RASON model.",
22
+ "summarizer": {
23
+ "comment": "Defines the summarizer as a summarization transformer. For a complete list of all supported options for summarization, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
24
+ "type": "transformation",
25
+ "algorithm": "summarization",
26
+ "parameters": {
27
+ "numBins": [
28
+ [ "X2", 4 ],
29
+ [ "X4", 5 ]
30
+ ]
31
+ }
32
+ }
33
+ },
34
+ "actions": {
35
+ "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
36
+ "mySummaries": {
37
+ "comment": "Summarizes the myData dataset (hald-small.txt) using the summarization transformer. Various evaluations are requested such as summary information, six sigma metrics, percentiles, etc. For a complete list of all available parameters and evaluations for summarization, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
38
+ "data": "myData",
39
+ "action": "transform",
40
+ "evaluations": [ "summary", "advancedSummary", "sixSigma", "percentiles", "histogram" ],
41
+ "parameters": {
42
+ "semiVariancePower": 2,
43
+ "semiDeviationPower": 2,
44
+ "varPercentile": 0.95,
45
+ "cvarPercentile": 0.95,
46
+ "meanConfidencePercentile": 0.95,
47
+ "sixSigmaPercentileLB": 0.05,
48
+ "sixSigmaPercentileUB": 0.95,
49
+ "sixSigmaShift": 0.0,
50
+ "sixSigmaNumStdDev": 6.0,
51
+ "sixSigmaTarget": 0.0
52
+ }
53
+ }
54
+ }
55
55
  }
@@ -1,52 +1,52 @@
1
- {
2
- "modelName": "LatentSemanticAnalysis",
3
- "modelDescription": "RASON Example using Text Miner - Latent Semantic Anlaysis is a technique in natural language processing between a set of documents and their contained terms by generating a set of concepts related to the documents and terms.",
4
- "modelType": "datamining",
5
- "datasources": {
6
- "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
- "myTrainSrc": {
8
- "comment": "Imports tdmRomeo.txt data source. This file contains a term-document matrix. This matrix is an evaluation, or output, from the Text Miner feature. See the two TFIDF (Text Miner) examples for help on generating this output. ",
9
- "type": "csv",
10
- "connection": "tdmRomeo.txt",
11
- "direction": "import"
12
- }
13
- },
14
- "datasets": {
15
- "comment": "Binds each datasource to a dataset.",
16
- "trainTermDocMatrix": {
17
- "comment": "Binds the myTrainSrc data source (tdmRomeo.txt) to trainTermDocMatrix data set",
18
- "binding": "myTrainSrc"
19
- }
20
- },
21
- "estimator": {
22
- "comment": "Defines a transformer, including the type, algorithm and parameters. Only 1 estimator/transformer may appear in a RASON model.",
23
- "lsaEstimator": {
24
- "comment": "Defines the lsaEstimator as a text mining, latent semantic analysis (LSA) regression estimator. For a complete list of all supported algorithm options for LSA, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
25
- "type": "textMining",
26
- "algorithm": "latentSemanticAnalysis",
27
- "parameters": {
28
- "maxNumConcepts": 4,
29
- "computeTermImportance": true,
30
- "computeConceptImportance": true
31
- }
32
- }
33
- },
34
- "actions": {
35
- "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
36
- "lsaModel": {
37
- "comment": "Fits lsaEstimator to trainTermDocMatrix (tdmRomeo.txt). The fitted model, given the same name as this example, LatentSemanticAnalysis, is automatically posted to the RASON Server. This fitted model may be called The export property exports the fitted model to a JSON file. Three evaluations are requested: vocabulary, termImportance and conceptImportance. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. Termimportance returns the most frequently appearing terms along with their Importance factor. ConceptImportance returns the Concept Importance table which lists each concept, its singular value, the cumulative singular value and the % singular value explained. For more information on the evaluations supported by LSA, click the Help tab to download te RASON Reference guide.",
38
- "trainData": "trainTermDocMatrix",
39
- "estimator": "lsaEstimator",
40
- "export": "json",
41
- "action": "fit",
42
- "evaluations": [ "vocabulary", "termImportance", "conceptImportance" ]
43
- },
44
- "tfRomeo": {
45
- "comment": "Uses the fitted model lsaModel to score trainTermDocMatrix (tdmRomeo.txt). Two evaluations are requested in the results: transformation, which returns the transformed dataset, and termConceptMatrix, which lists the most important concepts vs most frequently appearing terms.",
46
- "data": "trainTermDocMatrix",
47
- "fittedModel": "lsaModel",
48
- "action": "transform",
49
- "evaluations": [ "transformation", "termConceptMatrix" ]
50
- }
51
- }
1
+ {
2
+ "modelName": "LatentSemanticAnalysis",
3
+ "modelDescription": "RASON Example using Text Miner - Latent Semantic Analysis is a technique in natural language processing for analyzing the relationships between a set of documents and their contained terms by generating a set of concepts related to the documents and terms.",
4
+ "modelType": "datamining",
5
+ "datasources": {
6
+ "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
+ "myTrainSrc": {
8
+ "comment": "Imports tdmRomeo.txt data source. This file contains a term-document matrix. This matrix is an evaluation, or output, from the Text Miner feature. See the two TFIDF (Text Miner) examples for help on generating this output. ",
9
+ "type": "csv",
10
+ "connection": "tdmRomeo.txt",
11
+ "direction": "import"
12
+ }
13
+ },
14
+ "datasets": {
15
+ "comment": "Binds each datasource to a dataset.",
16
+ "trainTermDocMatrix": {
17
+ "comment": "Binds the myTrainSrc data source (tdmRomeo.txt) to trainTermDocMatrix data set",
18
+ "binding": "myTrainSrc"
19
+ }
20
+ },
21
+ "estimator": {
22
+ "comment": "Defines a transformer, including the type, algorithm and parameters. Only 1 estimator/transformer may appear in a RASON model.",
23
+ "lsaEstimator": {
24
+ "comment": "Defines the lsaEstimator as a text mining, latent semantic analysis (LSA) estimator. For a complete list of all supported algorithm options for LSA, see the RASON Data Science Model Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
25
+ "type": "textMining",
26
+ "algorithm": "latentSemanticAnalysis",
27
+ "parameters": {
28
+ "maxNumConcepts": 4,
29
+ "computeTermImportance": true,
30
+ "computeConceptImportance": true
31
+ }
32
+ }
33
+ },
34
+ "actions": {
35
+ "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
36
+ "lsaModel": {
37
+ "comment": "Fits lsaEstimator to trainTermDocMatrix (tdmRomeo.txt). The fitted model, given the same name as this example, LatentSemanticAnalysis, is automatically posted to the RASON Server. This fitted model may be called by later actions, such as tfRomeo below. The export property exports the fitted model to a JSON file. Three evaluations are requested: vocabulary, termImportance and conceptImportance. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. TermImportance returns the most frequently appearing terms along with their Importance factor. ConceptImportance returns the Concept Importance table which lists each concept, its singular value, the cumulative singular value and the % singular value explained. For more information on the evaluations supported by LSA, click the Help tab to download the RASON Reference Guide.",
38
+ "trainData": "trainTermDocMatrix",
39
+ "estimator": "lsaEstimator",
40
+ "export": "json",
41
+ "action": "fit",
42
+ "evaluations": [ "vocabulary", "termImportance", "conceptImportance" ]
43
+ },
44
+ "tfRomeo": {
45
+ "comment": "Uses the fitted model lsaModel to score trainTermDocMatrix (tdmRomeo.txt). Two evaluations are requested in the results: transformation, which returns the transformed dataset, and termConceptMatrix, which lists the most important concepts vs most frequently appearing terms.",
46
+ "data": "trainTermDocMatrix",
47
+ "fittedModel": "lsaModel",
48
+ "action": "transform",
49
+ "evaluations": [ "transformation", "termConceptMatrix" ]
50
+ }
51
+ }
52
52
  }
@@ -1,66 +1,66 @@
1
- {
2
- "modelName": "Tfldf-FileData",
3
- "modelDescription": "Text Mining RASON example - TF-IDF: TF-IDF stands for Term Frequency Inverse Document Frequency of records. It can be defined as the calculation of how relevant a word in a series or corpus is to a text.",
4
- "modelType": "datamining",
5
- "datasources": {
6
- "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
- "myTrainSrc": {
8
- "comment": "Imports tm.txt as the myTrainSrc datasource. This file contains the sample text that will be mined. Note that content is set to corpus. This property setting is used to indicate to Text Miner that a text corpus is being imported.",
9
- "type": "csv",
10
- "connection": "tm.txt",
11
- "content": "corpus",
12
- "direction": "import"
13
- }
14
- },
15
- "datasets": {
16
- "comment": "Binds myTrainSrc datasource (tm.txt) to trainCorpus dataset.",
17
- "trainCorpus": {
18
- "comment": "Binds myTrainSrc datasource (tm.txt) to trainCorpus dataset.",
19
- "binding": "myTrainSrc"
20
- }
21
- },
22
- "estimator": {
23
- "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
24
- "tfidfEstimator": {
25
- "comment": "Defines the tfidfEstimator as a tfIdf estimator; various options are set. For a complete list of all algorithm options, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
26
- "type": "textMining",
27
- "algorithm": "tfIdf",
28
- "parameters": {
29
- "maxVocabulary": 5,
30
- "maxTermLength": 10,
31
- "minDocumentFrequency": 5,
32
- "maxDocumentFrequency": 95,
33
- "preprocessing": [ "REMOVE_STOPWORDS", "NORMALIZE_CASE", "STEM", "NORMALIZE_URL", "NORMALIZE_EMAIL", "NORMALIZE_NUMBER", "NORMALIZE_MONEY", "REMOVE_HTML_TAGS" ],
34
- "synonyms": [
35
- [ "rootTerm1", "synonym1", "synonym2" ]
36
- ],
37
- "phraseReplacement": [
38
- [ "phrase1", "phraseReplacement" ]
39
- ]
40
- }
41
- }
42
- },
43
- "actions": {
44
- "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
45
- "tfidfModel": {
46
- "comment": "Fits the tfidfEstimator to trainCorpus, POSTs the fitted model to the RASON Server and also exports the fitted model to a JSON file using the export property. Various evaluations are requested. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. DetailedVocabulary returns the number of times the terms, included in the Final List of Terms, appears in the document collection and the number of documents that include each term. TermCountInfo Returns the number of total terms, the % Reduction in Terms, the Final number of terms after preprocessing or reduction, and the setting for 'maxVocabulary'. DocInfo returns the # Characters and the # Terms per document.",
47
- "trainData": "trainCorpus",
48
- "estimator": "tfidfEstimator",
49
- "export": "json",
50
- "action": "fit",
51
- "evaluations": [ "vocabulary", "detailedVocabulary", "termCountInfo", "docInfo" ]
52
- },
53
- "termDocMatrix": {
54
- "comment": "Uses the fitted model tfidfModel to generate the term document matrix, which lists the 200 most frequently appearing terms. For information on all evaluations supported by Text Miner, click the Help tab to download the RASON Reference Guide.",
55
- "data": "trainCorpus",
56
- "fittedModel": "tfidfModel",
57
- "parameters": {
58
- "weightingSchemeTerm": "LOGARITHMIC",
59
- "weightingSchemeDocument": "INVERSE",
60
- "weightingSchemeNormalization": "NONE"
61
- },
62
- "action": "transform",
63
- "evaluations": [ "transformation" ]
64
- }
65
- }
1
+ {
2
+ "modelName": "Tfldf-FileData",
3
+ "modelDescription": "Text Mining RASON example - TF-IDF: TF-IDF stands for Term Frequency Inverse Document Frequency of records. It can be defined as the calculation of how relevant a word in a series or corpus is to a text.",
4
+ "modelType": "datamining",
5
+ "datasources": {
6
+ "comment": "Datasources to use with this model. Typically these bind to external data sources due to data volume.",
7
+ "myTrainSrc": {
8
+ "comment": "Imports tm.txt as the myTrainSrc datasource. This file contains the sample text that will be mined. Note that content is set to corpus. This property setting is used to indicate to Text Miner that a text corpus is being imported.",
9
+ "type": "csv",
10
+ "connection": "tm.txt",
11
+ "content": "corpus",
12
+ "direction": "import"
13
+ }
14
+ },
15
+ "datasets": {
16
+ "comment": "Binds myTrainSrc datasource (tm.txt) to trainCorpus dataset.",
17
+ "trainCorpus": {
18
+ "comment": "Binds myTrainSrc datasource (tm.txt) to trainCorpus dataset.",
19
+ "binding": "myTrainSrc"
20
+ }
21
+ },
22
+ "estimator": {
23
+ "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
24
+ "tfidfEstimator": {
25
+ "comment": "Defines the tfidfEstimator as a tfIdf estimator; various options are set. For a complete list of all algorithm options, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
26
+ "type": "textMining",
27
+ "algorithm": "tfIdf",
28
+ "parameters": {
29
+ "maxVocabulary": 5,
30
+ "maxTermLength": 10,
31
+ "minDocumentFrequency": 5,
32
+ "maxDocumentFrequency": 95,
33
+ "preprocessing": [ "REMOVE_STOPWORDS", "NORMALIZE_CASE", "STEM", "NORMALIZE_URL", "NORMALIZE_EMAIL", "NORMALIZE_NUMBER", "NORMALIZE_MONEY", "REMOVE_HTML_TAGS" ],
34
+ "synonyms": [
35
+ [ "rootTerm1", "synonym1", "synonym2" ]
36
+ ],
37
+ "phraseReplacement": [
38
+ [ "phrase1", "phraseReplacement" ]
39
+ ]
40
+ }
41
+ }
42
+ },
43
+ "actions": {
44
+ "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
45
+ "tfidfModel": {
46
+ "comment": "Fits the tfidfEstimator to trainCorpus, POSTs the fitted model to the RASON Server and also exports the fitted model to a JSON file using the export property. Various evaluations are requested. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. DetailedVocabulary returns the number of times the terms included in the Final List of Terms appear in the document collection and the number of documents that include each term. TermCountInfo returns the number of total terms, the % Reduction in Terms, the Final number of terms after preprocessing or reduction, and the setting for 'maxVocabulary'. DocInfo returns the # Characters and the # Terms per document.",
47
+ "trainData": "trainCorpus",
48
+ "estimator": "tfidfEstimator",
49
+ "export": "json",
50
+ "action": "fit",
51
+ "evaluations": [ "vocabulary", "detailedVocabulary", "termCountInfo", "docInfo" ]
52
+ },
53
+ "termDocMatrix": {
54
+ "comment": "Uses the fitted model tfidfModel to generate the term document matrix, which lists the 200 most frequently appearing terms. For information on all evaluations supported by Text Miner, click the Help tab to download the RASON Reference Guide.",
55
+ "data": "trainCorpus",
56
+ "fittedModel": "tfidfModel",
57
+ "parameters": {
58
+ "weightingSchemeTerm": "LOGARITHMIC",
59
+ "weightingSchemeDocument": "INVERSE",
60
+ "weightingSchemeNormalization": "NONE"
61
+ },
62
+ "action": "transform",
63
+ "evaluations": [ "transformation" ]
64
+ }
65
+ }
66
66
  }
@@ -1,56 +1,56 @@
1
- {
2
- "modelName": "Tfldf-InlineData",
3
- "modelDescription": "RASON Text Mining - TF-IDF example: TF-IDF stands for Term Frequency Inverse Document Frequency of records. It can be defined as the calculation of how relevant a word in a series or corpus is to a text. See the TFIDF-FileData example (Examples - Data Mining - Text Mining) to see an example where the text sample is imported from an outside data source.",
4
- "modelType": "datamining",
5
- "datasets": {
6
- "comment": "Binds the text samples to the trainCorpus dataset.",
7
- "trainCorpus": {
8
- "value": [ "Romeo and Juliet.", "Juliet: O happy dagger!", "'Romeo died by dagger.'", "'Live free or die', that's the New-Hampshire's motto.", "'Did you know, New - Hampshire is in New - England.'" ]
9
- }
10
- },
11
- "estimator": {
12
- "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
13
- "tfidfEstimator": {
14
- "comment": "Defines the tfidfEstimator as a tfIdf estimator; various options are set. For a complete list of all algorithm options, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
15
- "type": "textMining",
16
- "algorithm": "tfIdf",
17
- "parameters": {
18
- "maxVocabulary": 5,
19
- "maxTermLength": 10,
20
- "minDocumentFrequency": 5,
21
- "maxDocumentFrequency": 95,
22
- "preprocessing": [ "REMOVE_STOPWORDS", "NORMALIZE_CASE", "STEM", "NORMALIZE_URL", "NORMALIZE_EMAIL", "NORMALIZE_NUMBER", "NORMALIZE_MONEY", "REMOVE_HTML_TAGS" ],
23
- "synonyms": [
24
- [ "rootTerm1", "synonym1", "synonym2" ],
25
- [ "rootTerm2", "synonym1", "synonym2" ]
26
- ],
27
- "phraseReplacement": [
28
- [ "phrase1", "phraseReplacement" ],
29
- [ "phrase2", "phraseReplacement" ]
30
- ]
31
- }
32
- }
33
- },
34
- "actions": {
35
- "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
36
- "tfidfModel": {
37
- "comment": "Fits the tfidfEstimator to trainCorpus, POSTs the fitted model to the RASON Server and also exports the fitted model to a JSON file using the export property. Various evaluations are requested. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. DetailedVocabulary returns the number of times the terms, included in the Final List of Terms, appears in the document collection and the number of documents that include each term. TermCountInfo Returns the number of total terms, the % Reduction in Terms, the Final number of terms after preprocessing or reduction, and the setting for 'maxVocabulary'. DocInfo returns the # Characters and the # Terms per document.",
38
- "trainData": "trainCorpus",
39
- "estimator": "tfidfEstimator",
40
- "action": "fit",
41
- "evaluations": [ "vocabulary", "detailedVocabulary", "termCountInfo", "docInfo" ]
42
- },
43
- "termDocMatrix": {
44
- "comment": "Uses the fitted model tfidfModel to generate the term document matrix, which lists the 200 most frequently appearing terms. For information on all evaluations supported by Text Miner, click the Help tab to download the RASON Reference Guide.",
45
- "data": "trainCorpus",
46
- "fittedModel": "tfidfModel",
47
- "parameters": {
48
- "weightingSchemeTerm": "LOGARITHMIC",
49
- "weightingSchemeDocument": "INVERSE",
50
- "weightingSchemeNormalization": "NONE"
51
- },
52
- "action": "transform",
53
- "evaluations": [ "transformation" ]
54
- }
55
- }
1
+ {
2
+ "modelName": "Tfldf-InlineData",
3
+ "modelDescription": "RASON Text Mining - TF-IDF example: TF-IDF stands for Term Frequency Inverse Document Frequency of records. It can be defined as the calculation of how relevant a word in a series or corpus is to a text. See the TFIDF-FileData example (Examples - Data Mining - Text Mining) to see an example where the text sample is imported from an outside data source.",
4
+ "modelType": "datamining",
5
+ "datasets": {
6
+ "comment": "Binds the text samples to the trainCorpus dataset.",
7
+ "trainCorpus": {
8
+ "value": [ "Romeo and Juliet.", "Juliet: O happy dagger!", "'Romeo died by dagger.'", "'Live free or die', that's the New-Hampshire's motto.", "'Did you know, New - Hampshire is in New - England.'" ]
9
+ }
10
+ },
11
+ "estimator": {
12
+ "comment": "Defines an estimator, including the type, algorithm and parameters. Only 1 estimator may appear in a RASON model.",
13
+ "tfidfEstimator": {
14
+ "comment": "Defines the tfidfEstimator as a tfIdf estimator; various options are set. For a complete list of all algorithm options, see the RASON Data Mining Components chapter in the RASON Reference Guide. (Click the Help tab to download.)",
15
+ "type": "textMining",
16
+ "algorithm": "tfIdf",
17
+ "parameters": {
18
+ "maxVocabulary": 5,
19
+ "maxTermLength": 10,
20
+ "minDocumentFrequency": 5,
21
+ "maxDocumentFrequency": 95,
22
+ "preprocessing": [ "REMOVE_STOPWORDS", "NORMALIZE_CASE", "STEM", "NORMALIZE_URL", "NORMALIZE_EMAIL", "NORMALIZE_NUMBER", "NORMALIZE_MONEY", "REMOVE_HTML_TAGS" ],
23
+ "synonyms": [
24
+ [ "rootTerm1", "synonym1", "synonym2" ],
25
+ [ "rootTerm2", "synonym1", "synonym2" ]
26
+ ],
27
+ "phraseReplacement": [
28
+ [ "phrase1", "phraseReplacement" ],
29
+ [ "phrase2", "phraseReplacement" ]
30
+ ]
31
+ }
32
+ }
33
+ },
34
+ "actions": {
35
+ "comment": "Define actions, evaluations, and data to be used by the estimator created above.",
36
+ "tfidfModel": {
37
+ "comment": "Fits the tfidfEstimator to trainCorpus and POSTs the fitted model to the RASON Server. No export property is set in this action, so the fitted model is not exported to a JSON file here. Various evaluations are requested. Vocabulary returns the final list of terms. The number of terms included in this list is determined by the 'maxVocabulary' estimator parameter setting. DetailedVocabulary returns the number of times the terms included in the Final List of Terms appear in the document collection and the number of documents that include each term. TermCountInfo returns the number of total terms, the % Reduction in Terms, the Final number of terms after preprocessing or reduction, and the setting for 'maxVocabulary'. DocInfo returns the # Characters and the # Terms per document.",
38
+ "trainData": "trainCorpus",
39
+ "estimator": "tfidfEstimator",
40
+ "action": "fit",
41
+ "evaluations": [ "vocabulary", "detailedVocabulary", "termCountInfo", "docInfo" ]
42
+ },
43
+ "termDocMatrix": {
44
+ "comment": "Uses the fitted model tfidfModel to generate the term document matrix, which lists the 200 most frequently appearing terms. For information on all evaluations supported by Text Miner, click the Help tab to download the RASON Reference Guide.",
45
+ "data": "trainCorpus",
46
+ "fittedModel": "tfidfModel",
47
+ "parameters": {
48
+ "weightingSchemeTerm": "LOGARITHMIC",
49
+ "weightingSchemeDocument": "INVERSE",
50
+ "weightingSchemeNormalization": "NONE"
51
+ },
52
+ "action": "transform",
53
+ "evaluations": [ "transformation" ]
54
+ }
55
+ }
56
56
  }