npm - nlptoolkit-classification - Versions diffs - 1.0.6 → 1.0.8 - Mend

nlptoolkit-classification 1.0.6 → 1.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (310) hide show

package/README.md +1 -0
package/dist/Attribute/DiscreteAttribute.d.ts +1 -1
package/dist/Attribute/DiscreteAttribute.js.map +1 -1
package/dist/Attribute/DiscreteIndexedAttribute.d.ts +2 -2
package/dist/DataSet/DataDefinition.d.ts +11 -0
package/dist/DataSet/DataDefinition.js +11 -0
package/dist/DataSet/DataDefinition.js.map +1 -1
package/dist/Experiment/BootstrapRun.js +2 -2
package/dist/Experiment/BootstrapRun.js.map +1 -1
package/dist/Experiment/Experiment.d.ts +7 -7
package/dist/Experiment/Experiment.js +6 -6
package/dist/Experiment/Experiment.js.map +1 -1
package/dist/Experiment/KFoldRun.d.ts +17 -2
package/dist/Experiment/KFoldRun.js +19 -4
package/dist/Experiment/KFoldRun.js.map +1 -1
package/dist/Experiment/KFoldRunSeparateTest.d.ts +13 -2
package/dist/Experiment/KFoldRunSeparateTest.js +15 -4
package/dist/Experiment/KFoldRunSeparateTest.js.map +1 -1
package/dist/Experiment/MxKFoldRun.js +1 -1
package/dist/Experiment/MxKFoldRun.js.map +1 -1
package/dist/Experiment/MxKFoldRunSeparateTest.js +1 -1
package/dist/Experiment/MxKFoldRunSeparateTest.js.map +1 -1
package/dist/Experiment/SingleRunWithK.d.ts +18 -3
package/dist/Experiment/SingleRunWithK.js +18 -3
package/dist/Experiment/SingleRunWithK.js.map +1 -1
package/dist/Experiment/StratifiedKFoldRun.js +1 -1
package/dist/Experiment/StratifiedKFoldRun.js.map +1 -1
package/dist/Experiment/StratifiedKFoldRunSeparateTest.js +1 -1
package/dist/Experiment/StratifiedKFoldRunSeparateTest.js.map +1 -1
package/dist/Experiment/StratifiedMxKFoldRun.js +1 -1
package/dist/Experiment/StratifiedMxKFoldRun.js.map +1 -1
package/dist/Experiment/StratifiedMxKFoldRunSeparateTest.js +3 -3
package/dist/Experiment/StratifiedMxKFoldRunSeparateTest.js.map +1 -1
package/dist/Experiment/StratifiedSingleRunWithK.js +1 -1
package/dist/Experiment/StratifiedSingleRunWithK.js.map +1 -1
package/dist/Filter/LaryFilter.d.ts +1 -1
package/dist/Filter/LaryFilter.js +1 -1
package/dist/Filter/TrainedFeatureFilter.d.ts +1 -1
package/dist/Filter/TrainedFeatureFilter.js +1 -1
package/dist/InstanceList/Partition.d.ts +45 -0
package/dist/InstanceList/Partition.js +125 -70
package/dist/InstanceList/Partition.js.map +1 -1
package/dist/Model/DecisionTree/DecisionCondition.d.ts +8 -0
package/dist/Model/DecisionTree/DecisionCondition.js +8 -0
package/dist/Model/DecisionTree/DecisionCondition.js.map +1 -1
package/dist/Model/DecisionTree/DecisionNode.d.ts +39 -1
package/dist/Model/DecisionTree/DecisionNode.js +64 -22
package/dist/Model/DecisionTree/DecisionNode.js.map +1 -1
package/dist/Model/DecisionTree/DecisionStump.d.ts +17 -0
package/dist/{Classifier/C45Stump.js → Model/DecisionTree/DecisionStump.js} +13 -10
package/dist/Model/DecisionTree/DecisionStump.js.map +1 -0
package/dist/Model/DecisionTree/DecisionTree.d.ts +24 -9
package/dist/Model/DecisionTree/DecisionTree.js +39 -16
package/dist/Model/DecisionTree/DecisionTree.js.map +1 -1
package/dist/Model/DummyModel.d.ts +28 -3
package/dist/Model/DummyModel.js +36 -23
package/dist/Model/DummyModel.js.map +1 -1
package/dist/{Classifier/Bagging.d.ts → Model/Ensemble/BaggingModel.d.ts} +8 -4
package/dist/{Classifier/Bagging.js → Model/Ensemble/BaggingModel.js} +16 -14
package/dist/Model/Ensemble/BaggingModel.js.map +1 -0
package/dist/{Classifier/RandomForest.d.ts → Model/Ensemble/RandomForestModel.d.ts} +8 -4
package/dist/{Classifier/RandomForest.js → Model/Ensemble/RandomForestModel.js} +16 -14
package/dist/Model/Ensemble/RandomForestModel.js.map +1 -0
package/dist/Model/Ensemble/TreeEnsembleModel.d.ts +32 -0
package/dist/Model/{TreeEnsembleModel.js → Ensemble/TreeEnsembleModel.js} +23 -17
package/dist/Model/Ensemble/TreeEnsembleModel.js.map +1 -0
package/dist/Model/Model.d.ts +52 -0
package/dist/Model/Model.js +84 -1
package/dist/Model/Model.js.map +1 -1
package/dist/Model/NeuralNetwork/DeepNetworkModel.d.ts +47 -0
package/dist/Model/{DeepNetworkModel.js → NeuralNetwork/DeepNetworkModel.js} +55 -55
package/dist/Model/NeuralNetwork/DeepNetworkModel.js.map +1 -0
package/dist/Model/NeuralNetwork/LinearPerceptronModel.d.ts +31 -0
package/dist/Model/NeuralNetwork/LinearPerceptronModel.js +84 -0
package/dist/Model/NeuralNetwork/LinearPerceptronModel.js.map +1 -0
package/dist/Model/NeuralNetwork/MultiLayerPerceptronModel.d.ts +39 -0
package/dist/Model/{MultiLayerPerceptronModel.js → NeuralNetwork/MultiLayerPerceptronModel.js} +41 -37
package/dist/Model/NeuralNetwork/MultiLayerPerceptronModel.js.map +1 -0
package/dist/Model/{NeuralNetworkModel.d.ts → NeuralNetwork/NeuralNetworkModel.d.ts} +19 -5
package/dist/Model/{NeuralNetworkModel.js → NeuralNetwork/NeuralNetworkModel.js} +19 -6
package/dist/Model/NeuralNetwork/NeuralNetworkModel.js.map +1 -0
package/dist/Model/{KnnInstance.d.ts → NonParametric/KnnInstance.d.ts} +1 -1
package/dist/Model/NonParametric/KnnInstance.js.map +1 -0
package/dist/Model/{KnnModel.d.ts → NonParametric/KnnModel.d.ts} +30 -6
package/dist/Model/{KnnModel.js → NonParametric/KnnModel.js} +42 -19
package/dist/Model/NonParametric/KnnModel.js.map +1 -0
package/dist/Model/{GaussianModel.d.ts → Parametric/GaussianModel.d.ts} +20 -2
package/dist/Model/{GaussianModel.js → Parametric/GaussianModel.js} +21 -3
package/dist/Model/Parametric/GaussianModel.js.map +1 -0
package/dist/Model/Parametric/KMeansModel.d.ts +36 -0
package/dist/Model/Parametric/KMeansModel.js +73 -0
package/dist/Model/Parametric/KMeansModel.js.map +1 -0
package/dist/Model/Parametric/LdaModel.d.ts +44 -0
package/dist/Model/Parametric/LdaModel.js +98 -0
package/dist/Model/Parametric/LdaModel.js.map +1 -0
package/dist/Model/{NaiveBayesModel.d.ts → Parametric/NaiveBayesModel.d.ts} +30 -10
package/dist/Model/{NaiveBayesModel.js → Parametric/NaiveBayesModel.js} +64 -27
package/dist/Model/Parametric/NaiveBayesModel.js.map +1 -0
package/dist/Model/Parametric/QdaModel.d.ts +30 -0
package/dist/Model/Parametric/QdaModel.js +84 -0
package/dist/Model/Parametric/QdaModel.js.map +1 -0
package/dist/Model/RandomModel.d.ts +32 -2
package/dist/Model/RandomModel.js +48 -16
package/dist/Model/RandomModel.js.map +1 -1
package/dist/Parameter/C45Parameter.d.ts +2 -2
package/dist/Parameter/DeepNetworkParameter.d.ts +2 -2
package/dist/Parameter/KnnParameter.d.ts +1 -1
package/dist/Parameter/LinearPerceptronParameter.d.ts +4 -4
package/dist/Parameter/MultiLayerPerceptronParameter.d.ts +2 -2
package/dist/Parameter/Parameter.d.ts +1 -1
package/dist/Performance/ConfusionMatrix.d.ts +1 -1
package/dist/StatisticalTest/Combined5x2F.d.ts +12 -0
package/dist/StatisticalTest/Combined5x2F.js +12 -0
package/dist/StatisticalTest/Combined5x2F.js.map +1 -1
package/dist/StatisticalTest/Combined5x2t.d.ts +13 -0
package/dist/StatisticalTest/Combined5x2t.js +13 -0
package/dist/StatisticalTest/Combined5x2t.js.map +1 -1
package/dist/StatisticalTest/Paired5x2t.d.ts +12 -0
package/dist/StatisticalTest/Paired5x2t.js +12 -0
package/dist/StatisticalTest/Paired5x2t.js.map +1 -1
package/dist/StatisticalTest/PairedTest.d.ts +12 -0
package/dist/StatisticalTest/PairedTest.js +12 -0
package/dist/StatisticalTest/PairedTest.js.map +1 -1
package/dist/StatisticalTest/Pairedt.d.ts +12 -0
package/dist/StatisticalTest/Pairedt.js +12 -0
package/dist/StatisticalTest/Pairedt.js.map +1 -1
package/dist/StatisticalTest/Sign.d.ts +17 -0
package/dist/StatisticalTest/Sign.js +17 -0
package/dist/StatisticalTest/Sign.js.map +1 -1
package/dist/StatisticalTest/StatisticalTestResult.d.ts +30 -0
package/dist/StatisticalTest/StatisticalTestResult.js +30 -0
package/dist/StatisticalTest/StatisticalTestResult.js.map +1 -1
package/dist/index.d.ts +88 -0
package/dist/index.js +111 -0
package/dist/index.js.map +1 -0
package/models/bagging-bupa.txt +10346 -0
package/models/bagging-car.txt +40752 -0
package/models/bagging-dermatology.txt +2990 -0
package/models/bagging-iris.txt +1332 -0
package/models/bagging-tictactoe.txt +29442 -0
package/models/c45-bupa.txt +3 -0
package/models/c45-car.txt +212 -0
package/models/c45-carIndexed.txt +92 -0
package/models/c45-dermatology.txt +22 -0
package/models/c45-iris.txt +7 -0
package/models/c45-tictactoe.txt +147 -0
package/models/c45-tictactoeIndexed.txt +79 -0
package/models/c45stump-bupa.txt +6 -0
package/models/c45stump-car.txt +11 -0
package/models/c45stump-chess.txt +35 -0
package/models/c45stump-dermatology.txt +11 -0
package/models/c45stump-iris.txt +5 -0
package/models/c45stump-nursery.txt +10 -0
package/models/c45stump-tictactoe.txt +9 -0
package/models/randomforest-bupa.txt +10346 -0
package/models/randomforest-car.txt +40752 -0
package/models/randomforest-carIndexed.txt +15594 -0
package/models/randomforest-dermatology.txt +2990 -0
package/models/randomforest-iris.txt +1332 -0
package/models/randomforest-tictactoe.txt +29442 -0
package/package.json +7 -7
package/source/Attribute/DiscreteAttribute.ts +1 -1
package/source/Attribute/DiscreteIndexedAttribute.ts +2 -2
package/source/DataSet/DataDefinition.ts +11 -0
package/source/Experiment/BootstrapRun.ts +2 -2
package/source/Experiment/Experiment.ts +10 -10
package/source/Experiment/KFoldRun.ts +20 -5
package/source/Experiment/KFoldRunSeparateTest.ts +16 -5
package/source/Experiment/MxKFoldRun.ts +1 -1
package/source/Experiment/MxKFoldRunSeparateTest.ts +1 -1
package/source/Experiment/SingleRunWithK.ts +20 -5
package/source/Experiment/StratifiedKFoldRun.ts +1 -1
package/source/Experiment/StratifiedKFoldRunSeparateTest.ts +1 -1
package/source/Experiment/StratifiedMxKFoldRun.ts +1 -1
package/source/Experiment/StratifiedMxKFoldRunSeparateTest.ts +3 -3
package/source/Experiment/StratifiedSingleRunWithK.ts +1 -1
package/source/Filter/LaryFilter.ts +1 -1
package/source/Filter/TrainedFeatureFilter.ts +1 -1
package/source/InstanceList/Partition.ts +125 -65
package/source/Model/DecisionTree/DecisionCondition.ts +8 -0
package/source/Model/DecisionTree/DecisionNode.ts +65 -22
package/source/Model/DecisionTree/DecisionStump.ts +26 -0
package/source/Model/DecisionTree/DecisionTree.ts +44 -15
package/source/Model/DummyModel.ts +40 -19
package/source/{Classifier/Bagging.ts → Model/Ensemble/BaggingModel.ts} +15 -12
package/source/{Classifier/RandomForest.ts → Model/Ensemble/RandomForestModel.ts} +14 -12
package/source/Model/{TreeEnsembleModel.ts → Ensemble/TreeEnsembleModel.ts} +26 -18
package/source/Model/Model.ts +92 -0
package/source/Model/{DeepNetworkModel.ts → NeuralNetwork/DeepNetworkModel.ts} +59 -56
package/source/Model/NeuralNetwork/LinearPerceptronModel.ts +81 -0
package/source/Model/{MultiLayerPerceptronModel.ts → NeuralNetwork/MultiLayerPerceptronModel.ts} +46 -39
package/source/Model/{NeuralNetworkModel.ts → NeuralNetwork/NeuralNetworkModel.ts} +20 -7
package/source/Model/{KnnInstance.ts → NonParametric/KnnInstance.ts} +1 -1
package/source/Model/{KnnModel.ts → NonParametric/KnnModel.ts} +48 -19
package/source/Model/{GaussianModel.ts → Parametric/GaussianModel.ts} +21 -3
package/source/Model/Parametric/KMeansModel.ts +72 -0
package/source/Model/Parametric/LdaModel.ts +98 -0
package/source/Model/{NaiveBayesModel.ts → Parametric/NaiveBayesModel.ts} +68 -25
package/source/Model/Parametric/QdaModel.ts +83 -0
package/source/Model/RandomModel.ts +54 -16
package/source/Parameter/C45Parameter.ts +2 -2
package/source/Parameter/DeepNetworkParameter.ts +2 -2
package/source/Parameter/KnnParameter.ts +1 -1
package/source/Parameter/LinearPerceptronParameter.ts +4 -4
package/source/Parameter/MultiLayerPerceptronParameter.ts +2 -2
package/source/Parameter/Parameter.ts +1 -1
package/source/Performance/ConfusionMatrix.ts +1 -1
package/source/StatisticalTest/Combined5x2F.ts +12 -0
package/source/StatisticalTest/Combined5x2t.ts +13 -0
package/source/StatisticalTest/Paired5x2t.ts +12 -0
package/source/StatisticalTest/PairedTest.ts +12 -0
package/source/StatisticalTest/Pairedt.ts +12 -0
package/source/StatisticalTest/Sign.ts +17 -0
package/source/StatisticalTest/StatisticalTestResult.ts +30 -0
package/source/index.ts +88 -0
package/source/tsconfig.json +1 -1
package/tests/Classifier/C45Test.ts +2 -2
package/tests/Classifier/DeepNetworkTest.ts +3 -5
package/tests/Classifier/DummyTest.ts +2 -2
package/tests/Classifier/KMeansTest.ts +2 -2
package/tests/Classifier/KnnTest.ts +2 -2
package/tests/Classifier/LdaTest.ts +2 -2
package/tests/Classifier/LinearPerceptronTest.ts +2 -2
package/tests/Classifier/MultiLayerPerceptronTest.ts +2 -3
package/tests/Classifier/NaiveBayesTest.ts +2 -2
package/tests/Classifier/QdaTest.ts +2 -2
package/tests/Classifier/RandomForestTest.ts +2 -2
package/tsconfig.json +1 -2
package/dist/Classifier/Bagging.js.map +0 -1
package/dist/Classifier/C45.d.ts +0 -14
package/dist/Classifier/C45.js +0 -43
package/dist/Classifier/C45.js.map +0 -1
package/dist/Classifier/C45Stump.d.ts +0 -13
package/dist/Classifier/C45Stump.js.map +0 -1
package/dist/Classifier/Classifier.d.ts +0 -40
package/dist/Classifier/Classifier.js +0 -72
package/dist/Classifier/Classifier.js.map +0 -1
package/dist/Classifier/DeepNetwork.d.ts +0 -14
package/dist/Classifier/DeepNetwork.js +0 -34
package/dist/Classifier/DeepNetwork.js.map +0 -1
package/dist/Classifier/Dummy.d.ts +0 -14
package/dist/Classifier/Dummy.js +0 -32
package/dist/Classifier/Dummy.js.map +0 -1
package/dist/Classifier/KMeans.d.ts +0 -13
package/dist/Classifier/KMeans.js +0 -39
package/dist/Classifier/KMeans.js.map +0 -1
package/dist/Classifier/Knn.d.ts +0 -14
package/dist/Classifier/Knn.js +0 -32
package/dist/Classifier/Knn.js.map +0 -1
package/dist/Classifier/Lda.d.ts +0 -13
package/dist/Classifier/Lda.js +0 -55
package/dist/Classifier/Lda.js.map +0 -1
package/dist/Classifier/LinearPerceptron.d.ts +0 -15
package/dist/Classifier/LinearPerceptron.js +0 -35
package/dist/Classifier/LinearPerceptron.js.map +0 -1
package/dist/Classifier/MultiLayerPerceptron.d.ts +0 -15
package/dist/Classifier/MultiLayerPerceptron.js +0 -35
package/dist/Classifier/MultiLayerPerceptron.js.map +0 -1
package/dist/Classifier/NaiveBayes.d.ts +0 -26
package/dist/Classifier/NaiveBayes.js +0 -70
package/dist/Classifier/NaiveBayes.js.map +0 -1
package/dist/Classifier/Qda.d.ts +0 -13
package/dist/Classifier/Qda.js +0 -53
package/dist/Classifier/Qda.js.map +0 -1
package/dist/Classifier/RandomClassifier.d.ts +0 -13
package/dist/Classifier/RandomClassifier.js +0 -35
package/dist/Classifier/RandomClassifier.js.map +0 -1
package/dist/Classifier/RandomForest.js.map +0 -1
package/dist/Model/DeepNetworkModel.d.ts +0 -45
package/dist/Model/DeepNetworkModel.js.map +0 -1
package/dist/Model/GaussianModel.js.map +0 -1
package/dist/Model/KMeansModel.d.ts +0 -28
package/dist/Model/KMeansModel.js +0 -61
package/dist/Model/KMeansModel.js.map +0 -1
package/dist/Model/KnnInstance.js.map +0 -1
package/dist/Model/KnnModel.js.map +0 -1
package/dist/Model/LdaModel.d.ts +0 -28
package/dist/Model/LdaModel.js +0 -67
package/dist/Model/LdaModel.js.map +0 -1
package/dist/Model/LinearPerceptronModel.d.ts +0 -24
package/dist/Model/LinearPerceptronModel.js +0 -91
package/dist/Model/LinearPerceptronModel.js.map +0 -1
package/dist/Model/MultiLayerPerceptronModel.d.ts +0 -33
package/dist/Model/MultiLayerPerceptronModel.js.map +0 -1
package/dist/Model/NaiveBayesModel.js.map +0 -1
package/dist/Model/NeuralNetworkModel.js.map +0 -1
package/dist/Model/QdaModel.d.ts +0 -27
package/dist/Model/QdaModel.js +0 -63
package/dist/Model/QdaModel.js.map +0 -1
package/dist/Model/TreeEnsembleModel.d.ts +0 -22
package/dist/Model/TreeEnsembleModel.js.map +0 -1
package/index.js +0 -100
package/source/Classifier/C45.ts +0 -34
package/source/Classifier/C45Stump.ts +0 -23
package/source/Classifier/Classifier.ts +0 -72
package/source/Classifier/DeepNetwork.ts +0 -26
package/source/Classifier/Dummy.ts +0 -23
package/source/Classifier/KMeans.ts +0 -30
package/source/Classifier/Knn.ts +0 -25
package/source/Classifier/Lda.ts +0 -47
package/source/Classifier/LinearPerceptron.ts +0 -27
package/source/Classifier/MultiLayerPerceptron.ts +0 -27
package/source/Classifier/NaiveBayes.ts +0 -66
package/source/Classifier/Qda.ts +0 -46
package/source/Classifier/RandomClassifier.ts +0 -26
package/source/Model/KMeansModel.ts +0 -56
package/source/Model/LdaModel.ts +0 -62
package/source/Model/LinearPerceptronModel.ts +0 -83
package/source/Model/QdaModel.ts +0 -57
/package/dist/Model/{KnnInstance.js → NonParametric/KnnInstance.js} +0 -0

package/source/Model/DecisionTree/DecisionNode.ts CHANGED Viewed

@@ -16,19 +16,46 @@ export class DecisionNode {
     children: Array<DecisionNode> = undefined
     private EPSILON: number = 0.0000000001;
-    private data : InstanceList = undefined
     private classLabel : string = undefined
     leaf: boolean = false
     private condition: DecisionCondition = undefined
+    private classLabelsDistribution: DiscreteDistribution
+    /**
+     * The DecisionNode constructor takes {@link InstanceList} data as input and sets the class label by finding
+     * the most frequent class label of the given data; it then gets the distinct class labels as a list. Later, it adds ordered
+     * indices to the indexList and shuffles them randomly. Then, it gets the class distribution of the given data and finds the best entropy value
+     * of this class distribution.
+     * <p>
+     * If an attribute of the given data is a {@link DiscreteIndexedAttribute}, it creates a distribution according to the discrete indexed attribute class distribution
+     * and finds the entropy. If it is better than the last best entropy, it reassigns the best entropy, best attribute and best split value according to
+     * the newly found best entropy's index. At the end, it also adds the new distribution to the class distribution.
+     * <p>
+     * If an attribute of the given data is a {@link DiscreteAttribute}, it directly finds the entropy. If it is better than the last best entropy, it
+     * reassigns the best entropy, best attribute and best split value according to the newly found best entropy's index.
+     * <p>
+     * If an attribute of the given data is a {@link ContinuousAttribute}, it creates two distributions, left and right, according to the class distribution
+     * and a discrete distribution respectively, and finds the entropy. If it is better than the last best entropy, it reassigns the best entropy,
+     * best attribute and best split value according to the newly found best entropy's index. At the end, it also adds the new distribution to
+     * the right distribution and removes it from the left distribution.
+     *
+     * @param data      {@link InstanceList} input.
+     * @param condition {@link DecisionCondition} to check.
+     * @param parameter RandomForestParameter like seed, ensembleSize, attributeSubsetSize.
+     * @param isStump   Refers to decision trees with only 1 splitting rule.
+     */
     constructor1(data: InstanceList, condition?: DecisionCondition | number, parameter?: RandomForestParameter, isStump?: boolean){
         let bestAttribute = -1
         let bestSplitValue = 0
         if (condition instanceof DecisionCondition){
             this.condition = condition;
         }
-        this.data = data;
-        this.classLabel = Model.getMaximum(data.getClassLabels());
+        this.classLabelsDistribution = new DiscreteDistribution()
+        let labels = data.getClassLabels()
+        for (let label of labels){
+            this.classLabelsDistribution.addItem(label)
+        }
+        this.classLabel = Model.getMaximum(labels)
         this.leaf = true;
         let classLabels = data.getDistinctClassLabels();
         if (classLabels.length == 1) {
@@ -69,7 +96,7 @@ export class DecisionNode {
                 }
             } else {
                 if (data.get(0).getAttribute(index) instanceof DiscreteAttribute) {
-                    let entropy = this.entropyForDiscreteAttribute(index);
+                    let entropy = this.entropyForDiscreteAttribute(data, index);
                     if (entropy + this.EPSILON < bestEntropy) {
                         bestEntropy = entropy;
                         bestAttribute = index;
@@ -106,19 +133,23 @@ export class DecisionNode {
         if (bestAttribute != -1) {
             this.leaf = false;
             if (data.get(0).getAttribute(bestAttribute) instanceof DiscreteIndexedAttribute) {
-                this.createChildrenForDiscreteIndexed(bestAttribute, bestSplitValue, parameter, isStump);
+                this.createChildrenForDiscreteIndexed(data, bestAttribute, bestSplitValue, parameter, isStump);
             } else {
                 if (data.get(0).getAttribute(bestAttribute) instanceof DiscreteAttribute) {
-                    this.createChildrenForDiscrete(bestAttribute, parameter, isStump);
+                    this.createChildrenForDiscrete(data, bestAttribute, parameter, isStump);
                 } else {
                     if (data.get(0).getAttribute(bestAttribute) instanceof ContinuousAttribute) {
-                        this.createChildrenForContinuous(bestAttribute, bestSplitValue, parameter, isStump);
+                        this.createChildrenForContinuous(data, bestAttribute, bestSplitValue, parameter, isStump);
                     }
                 }
             }
         }
     }
+    /**
+     * Reads the decision node model (as one line) from model file.
+     * @param contents Model file
+     */
     constructor2(contents: FileContents){
         let items = contents.readLine().split(" ")
         if (items[0] != "-1"){
@@ -144,6 +175,7 @@ export class DecisionNode {
         } else {
             this.leaf = true
             this.classLabel = contents.readLine()
+            this.classLabelsDistribution = Model.loadDiscreteDistribution(contents);
         }
     }
@@ -184,14 +216,15 @@ export class DecisionNode {
      * The entropyForDiscreteAttribute method takes an attributeIndex and creates an ArrayList of DiscreteDistribution.
      * Then loops through the distributions and calculates the total entropy.
      *
+     * @param data Instance list.
      * @param attributeIndex Index of the attribute.
      * @return Total entropy for the discrete attribute.
      */
-    private entropyForDiscreteAttribute(attributeIndex: number): number{
+    private entropyForDiscreteAttribute(data: InstanceList, attributeIndex: number): number{
         let sum = 0.0;
-        let distributions = this.data.attributeClassDistribution(attributeIndex);
+        let distributions = data.attributeClassDistribution(attributeIndex);
         for (let distribution of distributions) {
-            sum += (distribution.getSum() / this.data.size()) * distribution.entropy();
+            sum += (distribution.getSum() / data.size()) * distribution.entropy();
         }
         return sum;
     }
@@ -200,29 +233,31 @@ export class DecisionNode {
      * The createChildrenForDiscreteIndexed method creates an ArrayList of DecisionNodes as children and a partition with respect to
      * indexed attribute.
      *
+     * @param data Instance list.
      * @param attributeIndex Index of the attribute.
      * @param attributeValue Value of the attribute.
      * @param parameter      RandomForestParameter like seed, ensembleSize, attributeSubsetSize.
      * @param isStump        Refers to decision trees with only 1 splitting rule.
      */
-    private createChildrenForDiscreteIndexed(attributeIndex: number, attributeValue: number, parameter: RandomForestParameter, isStump: boolean){
-        let childrenData = new Partition(this.data, attributeIndex, attributeValue);
+    private createChildrenForDiscreteIndexed(data: InstanceList, attributeIndex: number, attributeValue: number, parameter: RandomForestParameter, isStump: boolean){
+        let childrenData = new Partition(data, attributeIndex, attributeValue);
         this.children = new Array<DecisionNode>();
-        this.children.push(new DecisionNode(childrenData.get(0), new DecisionCondition(attributeIndex, new DiscreteIndexedAttribute("", attributeValue, (<DiscreteIndexedAttribute> this.data.get(0).getAttribute(attributeIndex)).getMaxIndex())), parameter, isStump));
-        this.children.push(new DecisionNode(childrenData.get(1), new DecisionCondition(attributeIndex, new DiscreteIndexedAttribute("", -1, (<DiscreteIndexedAttribute> this.data.get(0).getAttribute(attributeIndex)).getMaxIndex())), parameter, isStump));
+        this.children.push(new DecisionNode(childrenData.get(0), new DecisionCondition(attributeIndex, new DiscreteIndexedAttribute("", attributeValue, (<DiscreteIndexedAttribute> data.get(0).getAttribute(attributeIndex)).getMaxIndex())), parameter, isStump));
+        this.children.push(new DecisionNode(childrenData.get(1), new DecisionCondition(attributeIndex, new DiscreteIndexedAttribute("", -1, (<DiscreteIndexedAttribute> data.get(0).getAttribute(attributeIndex)).getMaxIndex())), parameter, isStump));
     }
     /**
      * The createChildrenForDiscrete method creates an ArrayList of values, a partition with respect to attributes and an ArrayList
      * of DecisionNodes as children.
      *
+     * @param data Instance list.
      * @param attributeIndex Index of the attribute.
      * @param parameter      RandomForestParameter like seed, ensembleSize, attributeSubsetSize.
      * @param isStump        Refers to decision trees with only 1 splitting rule.
      */
-    private createChildrenForDiscrete(attributeIndex: number, parameter: RandomForestParameter, isStump: boolean){
-        let valueList = this.data.getAttributeValueList(attributeIndex);
-        let childrenData = new Partition(this.data, attributeIndex);
+    private createChildrenForDiscrete(data: InstanceList, attributeIndex: number, parameter: RandomForestParameter, isStump: boolean){
+        let valueList = data.getAttributeValueList(attributeIndex);
+        let childrenData = new Partition(data, attributeIndex);
         this.children = new Array<DecisionNode>();
         for (let i = 0; i < valueList.length; i++) {
             this.children.push(new DecisionNode(childrenData.get(i), new DecisionCondition(attributeIndex, new DiscreteAttribute(valueList[i])), parameter, isStump));
@@ -233,13 +268,14 @@ export class DecisionNode {
      * The createChildrenForContinuous method creates an ArrayList of DecisionNodes as children and a partition with respect to
      * continuous attribute and the given split value.
      *
+     * @param data Instance list.
      * @param attributeIndex Index of the attribute.
      * @param parameter      RandomForestParameter like seed, ensembleSize, attributeSubsetSize.
      * @param isStump        Refers to decision trees with only 1 splitting rule.
      * @param splitValue     Split value is used for partitioning.
      */
-    private createChildrenForContinuous(attributeIndex: number, splitValue: number, parameter: RandomForestParameter, isStump: boolean){
-        let childrenData = new Partition(this.data, attributeIndex, splitValue + 0.0000001);
+    private createChildrenForContinuous(data: InstanceList, attributeIndex: number, splitValue: number, parameter: RandomForestParameter, isStump: boolean){
+        let childrenData = new Partition(data, attributeIndex, splitValue + 0.0000001);
         this.children = new Array<DecisionNode>();
         this.children.push(new DecisionNode(childrenData.get(0), new DecisionCondition(attributeIndex, new ContinuousAttribute(splitValue), "<"), parameter, isStump));
         this.children.push(new DecisionNode(childrenData.get(1), new DecisionCondition(attributeIndex, new ContinuousAttribute(splitValue), ">"), parameter, isStump));
@@ -255,7 +291,7 @@ export class DecisionNode {
     predict(instance: Instance): string{
         if (instance instanceof CompositeInstance) {
             let possibleClassLabels = (<CompositeInstance> instance).getPossibleClassLabels();
-            let distribution = this.data.classDistribution();
+            let distribution = this.classLabelsDistribution;
             let predictedClass = distribution.getMaxItem(possibleClassLabels);
             if (this.leaf) {
                 return predictedClass;
@@ -286,16 +322,23 @@ export class DecisionNode {
         }
     }
+    /**
+     * Recursive method that returns the posterior probability distribution of a given instance. If the node is a leaf
+     * node, it returns the class label distribution, otherwise it checks in which direction (child node) this instance
+     * is forwarded.
+     * @param instance Instance for which the posterior probability distribution is calculated.
+     * @return Posterior probability distribution for this instance.
+     */
     predictProbabilityDistribution(instance: Instance): Map<string, number>{
         if (this.leaf) {
-            return this.data.classDistribution().getProbabilityDistribution();
+            return this.classLabelsDistribution.getProbabilityDistribution();
         } else {
             for (let node of this.children) {
                 if (node.condition.satisfy(instance)) {
                     return node.predictProbabilityDistribution(instance);
                 }
             }
-            return this.data.classDistribution().getProbabilityDistribution();
+            return this.classLabelsDistribution.getProbabilityDistribution();
         }
     }
 }

package/source/Model/DecisionTree/DecisionStump.ts ADDED Viewed

@@ -0,0 +1,26 @@
+import {DecisionTree} from "./DecisionTree";
+import {InstanceList} from "../../InstanceList/InstanceList";
+import {Parameter} from "../../Parameter/Parameter";
+import {DecisionNode} from "./DecisionNode";
+export class DecisionStump extends DecisionTree {
+    /**
+     * Training algorithm for C4.5 Stump univariate decision tree classifier.
+     *
+     * @param trainSet   Training data given to the algorithm.
+     * @param parameters Unused by the stump; the root node is built directly from trainSet.
+     */
+    train(trainSet: InstanceList, parameters: Parameter): void {
+        this.root = new DecisionNode(trainSet, undefined, undefined, true);
+    }
+    /**
+     * Loads the decision tree model from an input file.
+     * @param fileName File name of the decision tree model.
+     */
+    loadModel(fileName: string): void{
+        this.constructor2(fileName)
+    }
+}

package/source/Model/DecisionTree/DecisionTree.ts CHANGED Viewed

@@ -4,29 +4,27 @@ import {Instance} from "../../Instance/Instance";
 import {CompositeInstance} from "../../Instance/CompositeInstance";
 import {InstanceList} from "../../InstanceList/InstanceList";
 import {FileContents} from "nlptoolkit-util/dist/FileContents";
+import {Parameter} from "../../Parameter/Parameter";
+import {C45Parameter} from "../../Parameter/C45Parameter";
+import {Partition} from "../../InstanceList/Partition";
 export class DecisionTree extends ValidatedModel{
-    private readonly root: DecisionNode
+    protected root: DecisionNode
-    /**
-     * Constructor that sets root node of the decision tree.
-     *
-     * @param rootOrFileName DecisionNode type input or fileName
-     */
-    constructor(rootOrFileName: DecisionNode | string) {
+    constructor2(fileName: string) {
+        let contents = new FileContents(fileName)
+        this.root = new DecisionNode(contents)
+    }
+    constructor(root?: DecisionNode) {
         super();
-        if (rootOrFileName instanceof DecisionNode){
-            this.root = rootOrFileName
-        } else {
-            let contents = new FileContents(rootOrFileName)
-            this.root = new DecisionNode(contents)
-        }
+        this.root = root;
     }
     /**
-     * The predict method  performs prediction on the root node of given instance, and if it is null, it returns the possible class labels.
-     * Otherwise it returns the returned class labels.
+     * The predict method performs prediction on the root node for the given instance, and if it is null, it returns the
+     * possible class labels. Otherwise, it returns the returned class labels.
      *
      * @param instance Instance make prediction.
      * @return Possible class labels.
@@ -39,6 +37,11 @@ export class DecisionTree extends ValidatedModel{
         return predictedClass;
     }
+    /**
+     * Calculates the posterior probability distribution for the given instance according to Decision tree model.
+     * @param instance Instance for which posterior probability distribution is calculated.
+     * @return Posterior probability distribution for the given instance.
+     */
     predictProbability(instance: Instance): Map<string, number> {
         return this.root.predictProbabilityDistribution(instance)
     }
@@ -77,4 +80,30 @@ export class DecisionTree extends ValidatedModel{
     prune(pruneSet: InstanceList){
         this.pruneNode(this.root, pruneSet)
     }
+    /**
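+     * Training algorithm for C4.5 univariate decision tree classifier. When pruning is enabled, part of the data
+     * (typically 20 percent, as determined by the cross-validation ratio in the parameters) is left aside for pruning
+     * and the remaining data (typically 80 percent) is used for constructing the tree. When pruning is disabled, the
+     * whole training set is used for constructing the tree.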
+     *
+     * @param trainSet   Training data given to the algorithm.
+     * @param parameters C4.5 parameters; supplies the prune flag and the cross-validation ratio used for the split.
+     */
+    train(trainSet: InstanceList, parameters: Parameter): void {
+        if ((<C45Parameter> parameters).isPrune()) {
+            let partition = new Partition(trainSet, (<C45Parameter> parameters).getCrossValidationRatio(), true);
+            this.root = new DecisionNode(partition.get(1), undefined, undefined, false);
+            this.prune(partition.get(0));
+        } else {
+            this.root = new DecisionNode(trainSet, undefined, undefined, false);
+        }
+    }
+    /**
+     * Loads the decision tree model from an input file.
+     * @param fileName File name of the decision tree model.
+     */
+    loadModel(fileName: string): void{
+        this.constructor2(fileName)
+    }
 }

package/source/Model/DummyModel.ts CHANGED Viewed

@@ -4,33 +4,29 @@ import {DiscreteDistribution} from "nlptoolkit-math/dist/DiscreteDistribution";
 import {InstanceList} from "../InstanceList/InstanceList";
 import {CompositeInstance} from "../Instance/CompositeInstance";
 import {FileContents} from "nlptoolkit-util/dist/FileContents";
+import {Parameter} from "../Parameter/Parameter";
 export class DummyModel extends Model{
     private distribution: DiscreteDistribution
     /**
-     * Constructor which sets the distribution using the given {@link InstanceList}.
+     * Training algorithm for the dummy classifier. The dummy classifier simply returns the maximum occurring class in
+     * the training data, so there is no real training. Sets the distribution using the given {@link InstanceList}.
      *
-     * @param trainSet {@link InstanceList} which is used to get the class distribution.
+     * @param trainSet   Training data given to the algorithm.
      */
-    constructor(trainSet: InstanceList | string) {
-        super();
-        if (trainSet instanceof InstanceList){
-            this.distribution = trainSet.classDistribution();
-        } else {
-            let input = new FileContents(trainSet)
-            this.distribution = new DiscreteDistribution()
-            let size = parseInt(input.readLine())
-            for (let i = 0; i < size; i++){
-                let line = input.readLine()
-                let items = line.split(" ")
-                let count = parseInt(items[1])
-                for (let j = 0; j < count; j++){
-                    this.distribution.addItem(items[0])
-                }
-            }
-        }
+    constructor1(trainSet: InstanceList){
+        this.distribution = trainSet.classDistribution()
+    }
+    /**
+     * Loads the dummy model from an input file.
+     * @param fileName File name of the dummy model.
+     */
+    constructor2(fileName: string) {
+        let input = new FileContents(fileName)
+        this.distribution = Model.loadDiscreteDistribution(input)
     }
     /**
@@ -48,6 +44,11 @@ export class DummyModel extends Model{
         }
     }
+    /**
+     * Calculates the posterior probability distribution for the given instance according to dummy model.
+     * @param instance Instance for which posterior probability distribution is calculated.
+     * @return Posterior probability distribution for the given instance.
+     */
     predictProbability(instance: Instance): Map<string, number> {
         return this.distribution.getProbabilityDistribution();
     }
@@ -55,4 +56,24 @@ export class DummyModel extends Model{
     saveTxt(fileName: string){
     }
+    /**
+     * Training algorithm for the dummy classifier. The dummy classifier simply returns the maximum occurring class in
+     * the training data, so there is no real training.
+     *
+     * @param trainSet   Training data given to the algorithm.
+     * @param parameters Not used by the dummy classifier.
+     */
+    train(trainSet: InstanceList, parameters: Parameter): void {
+        this.constructor1(trainSet)
+    }
+    /**
+     * Loads the dummy model from an input file.
+     * @param fileName File name of the dummy model.
+     */
+    loadModel(fileName: string): void{
+        this.constructor2(fileName)
+    }
 }

package/source/{Classifier/Bagging.ts → Model/Ensemble/BaggingModel.ts} RENAMED Viewed

@@ -1,12 +1,11 @@
-import {Classifier} from "./Classifier";
-import {InstanceList} from "../InstanceList/InstanceList";
-import {Parameter} from "../Parameter/Parameter";
-import {BaggingParameter} from "../Parameter/BaggingParameter";
-import {DecisionTree} from "../Model/DecisionTree/DecisionTree";
-import {DecisionNode} from "../Model/DecisionTree/DecisionNode";
-import {TreeEnsembleModel} from "../Model/TreeEnsembleModel";
+import {TreeEnsembleModel} from "./TreeEnsembleModel";
+import {InstanceList} from "../../InstanceList/InstanceList";
+import {Parameter} from "../../Parameter/Parameter";
+import {BaggingParameter} from "../../Parameter/BaggingParameter";
+import {DecisionTree} from "../DecisionTree/DecisionTree";
+import {DecisionNode} from "../DecisionTree/DecisionNode";
-export class Bagging extends Classifier{
+export class BaggingModel extends TreeEnsembleModel{
     /**
      * Bagging bootstrap ensemble method that creates individuals for its ensemble by training each classifier on a random
@@ -20,16 +19,20 @@ export class Bagging extends Classifier{
      */
     train(trainSet: InstanceList, parameters: Parameter): void {
         let forestSize = (<BaggingParameter> parameters).getEnsembleSize();
-        let forest = new Array<DecisionTree>();
+        this.forest = new Array<DecisionTree>();
         for (let i = 0; i < forestSize; i++) {
             let bootstrap = trainSet.bootstrap(i);
             let tree = new DecisionTree(new DecisionNode(new InstanceList(bootstrap.getSample()), undefined, undefined, false));
-            forest.push(tree);
+            this.forest.push(tree);
         }
-        this.model = new TreeEnsembleModel(forest);
     }
+    /**
+     * Loads the Bagging ensemble model from an input file.
+     * @param fileName File name of the Bagging ensemble model.
+     */
     loadModel(fileName: string): void{
-        this.model = new TreeEnsembleModel(fileName)
+        this.constructor2(fileName)
     }
 }

package/source/{Classifier/RandomForest.ts → Model/Ensemble/RandomForestModel.ts} RENAMED Viewed

@@ -1,12 +1,11 @@
-import {Classifier} from "./Classifier";
-import {InstanceList} from "../InstanceList/InstanceList";
-import {Parameter} from "../Parameter/Parameter";
-import {RandomForestParameter} from "../Parameter/RandomForestParameter";
-import {DecisionTree} from "../Model/DecisionTree/DecisionTree";
-import {DecisionNode} from "../Model/DecisionTree/DecisionNode";
-import {TreeEnsembleModel} from "../Model/TreeEnsembleModel";
+import {TreeEnsembleModel} from "./TreeEnsembleModel";
+import {InstanceList} from "../../InstanceList/InstanceList";
+import {Parameter} from "../../Parameter/Parameter";
+import {RandomForestParameter} from "../../Parameter/RandomForestParameter";
+import {DecisionTree} from "../DecisionTree/DecisionTree";
+import {DecisionNode} from "../DecisionTree/DecisionNode";
-export class RandomForest extends Classifier{
+export class RandomForestModel extends TreeEnsembleModel{
     /**
      * Training algorithm for random forest classifier. Basically the algorithm creates K distinct decision trees from
@@ -17,17 +16,20 @@ export class RandomForest extends Classifier{
      */
     train(trainSet: InstanceList, parameters: Parameter): void {
         let forestSize = (<RandomForestParameter> parameters).getEnsembleSize();
-        let forest = new Array<DecisionTree>();
+        this.forest = new Array<DecisionTree>();
         for (let i = 0; i < forestSize; i++){
             let bootstrap = trainSet.bootstrap(i);
             let tree = new DecisionTree(new DecisionNode(new InstanceList(bootstrap.getSample()), undefined, <RandomForestParameter> parameters, false));
-            forest.push(tree);
+            this.forest.push(tree);
         }
-        this.model = new TreeEnsembleModel(forest);
     }
+    /**
+     * Loads the random forest model from an input file.
+     * @param fileName File name of the random forest model.
+     */
     loadModel(fileName: string): void{
-        this.model = new TreeEnsembleModel(fileName)
+        this.constructor2(fileName)
     }
 }

package/source/Model/{TreeEnsembleModel.ts → Ensemble/TreeEnsembleModel.ts} RENAMED Viewed

@@ -1,30 +1,33 @@
-import {Model} from "./Model";
-import {Instance} from "../Instance/Instance";
-import {DecisionTree} from "./DecisionTree/DecisionTree";
+import {Model} from "../Model";
+import {Instance} from "../../Instance/Instance";
+import {DecisionTree} from "../DecisionTree/DecisionTree";
 import {DiscreteDistribution} from "nlptoolkit-math/dist/DiscreteDistribution";
 import {FileContents} from "nlptoolkit-util/dist/FileContents";
-import {DecisionNode} from "./DecisionTree/DecisionNode";
+import {DecisionNode} from "../DecisionTree/DecisionNode";
-export class TreeEnsembleModel extends Model{
+export abstract class TreeEnsembleModel extends Model{
-    private forest: Array<DecisionTree>
+    protected forest: Array<DecisionTree>
     /**
      * A constructor which sets the {@link Array} of {@link DecisionTree} with given input.
      *
-     * @param forestOrFileName An {@link Array} of {@link DecisionTree}.
+     * @param forest An {@link Array} of {@link DecisionTree}.
      */
-    constructor(forestOrFileName: Array<DecisionTree> | string) {
-        super();
-        if (forestOrFileName instanceof Array){
-            this.forest = forestOrFileName
-        } else {
-            let input = new FileContents(forestOrFileName)
-            let numberOfTrees = parseInt(input.readLine())
-            this.forest = new Array<DecisionTree>()
-            for (let i = 0; i < numberOfTrees; i++){
-                this.forest.push(new DecisionTree(new DecisionNode(input)))
-            }
+    constructor1(forest: Array<DecisionTree>) {
+        this.forest = forest
+    }
+    /**
+     * Loads a tree ensemble model such as Random Forest model or Bagging model from an input model file.
+     * @param fileName Model file name.
+     */
+    constructor2(fileName: string) {
+        let input = new FileContents(fileName)
+        let numberOfTrees = parseInt(input.readLine())
+        this.forest = new Array<DecisionTree>()
+        for (let i = 0; i < numberOfTrees; i++){
+            this.forest.push(new DecisionTree(new DecisionNode(input)))
         }
     }
@@ -43,6 +46,11 @@ export class TreeEnsembleModel extends Model{
         return distribution.getMaxItem();
     }
+    /**
+     * Calculates the posterior probability distribution for the given instance according to ensemble tree model.
+     * @param instance Instance for which posterior probability distribution is calculated.
+     * @return Posterior probability distribution for the given instance.
+     */
     predictProbability(instance: Instance): Map<string, number> {
         let distribution = new DiscreteDistribution();
         for (let tree of this.forest) {