svmkit 0.2.7 → 0.2.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/HISTORY.md +5 -0
- data/lib/svmkit/base/base_estimator.rb +1 -1
- data/lib/svmkit/base/classifier.rb +2 -0
- data/lib/svmkit/ensemble/random_forest_classifier.rb +11 -1
- data/lib/svmkit/evaluation_measure/accuracy.rb +3 -0
- data/lib/svmkit/evaluation_measure/f_score.rb +4 -0
- data/lib/svmkit/evaluation_measure/precision.rb +4 -0
- data/lib/svmkit/evaluation_measure/recall.rb +4 -0
- data/lib/svmkit/kernel_approximation/rbf.rb +11 -1
- data/lib/svmkit/kernel_machine/kernel_svc.rb +12 -11
- data/lib/svmkit/linear_model/logistic_regression.rb +20 -6
- data/lib/svmkit/linear_model/svc.rb +12 -0
- data/lib/svmkit/model_selection/cross_validation.rb +6 -0
- data/lib/svmkit/model_selection/k_fold.rb +6 -4
- data/lib/svmkit/model_selection/stratified_k_fold.rb +6 -0
- data/lib/svmkit/multiclass/one_vs_rest_classifier.rb +5 -0
- data/lib/svmkit/naive_bayes/naive_bayes.rb +14 -0
- data/lib/svmkit/nearest_neighbors/k_neighbors_classifier.rb +5 -0
- data/lib/svmkit/pairwise_metric.rb +15 -0
- data/lib/svmkit/polynomial_model/factorization_machine_classifier.rb +12 -0
- data/lib/svmkit/preprocessing/l2_normalizer.rb +2 -0
- data/lib/svmkit/preprocessing/min_max_scaler.rb +4 -0
- data/lib/svmkit/preprocessing/standard_scaler.rb +3 -0
- data/lib/svmkit/tree/decision_tree_classifier.rb +16 -3
- data/lib/svmkit/validation.rb +55 -0
- data/lib/svmkit/version.rb +1 -1
- data/lib/svmkit.rb +1 -0
- metadata +3 -2
checksums.yaml
CHANGED
```diff
@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz:
-  data.tar.gz:
+  metadata.gz: bbc648db53b4285bd15ae00e2464c4376d027893
+  data.tar.gz: 28d9db47ae3053031f1643329cf02cd4e7d9c135
 SHA512:
-  metadata.gz:
-  data.tar.gz:
+  metadata.gz: c504f010a70fc7a31afa4471096092adac9ff44de979d42d7277c63d737d517981e2ac6d7481ad42dc1c864f2a7756d39cd1d7697d2d4b1bca150d0a4eca3b8e
+  data.tar.gz: 8d89dc525ed37626a2d97e6fe3bebdacd4ec2945df285d8275cd0bd5df62c5ebc897dca67b91157df0bfc460fa987ed4098654ce6d164cb05ec46de4c6fe27af
```
data/HISTORY.md
CHANGED
```diff
@@ -1,3 +1,8 @@
+# 0.2.8
+- Fixed bug on gradient calculation of Logistic Regression.
+- Fixed to change accessor of params of estimators to read only.
+- Added parameter validation.
+
 # 0.2.7
 - Fixed to support multiclass classifiction into LinearSVC, LogisticRegression, KernelSVC, and FactorizationMachineClassifier
```
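Of these three entries, the accessor change is the one not visible as a hunk below: `data/lib/svmkit/base/base_estimator.rb` (+1 -1 in the file list, diff body not shown) most likely swaps a writable `attr_accessor :params` for `attr_reader :params`. A minimal sketch of the observable difference, assuming the 0.2.8 API (the estimator and hyperparameter are just examples):

```ruby
require 'svmkit'

svc = SVMKit::LinearModel::SVC.new(reg_param: 1.0)
svc.params[:reg_param]          # => 1.0 -- reading hyperparameters still works
svc.params = { reg_param: 2.0 } # raises NoMethodError in 0.2.8: the params writer is gone
```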
data/lib/svmkit/base/classifier.rb
CHANGED
```diff
@@ -20,6 +20,8 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) True labels for testing data.
     # @return [Float] Mean accuracy
     def score(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       evaluator = SVMKit::EvaluationMeasure::Accuracy.new
       evaluator.score(y, predict(x))
     end
```
data/lib/svmkit/ensemble/random_forest_classifier.rb
CHANGED
```diff
@@ -50,6 +50,11 @@ module SVMKit
     #   It is used to randomly determine the order of features when deciding spliting point.
     def initialize(n_estimators: 10, criterion: 'gini', max_depth: nil, max_leaf_nodes: nil, min_samples_leaf: 1,
                    max_features: nil, random_seed: nil)
+      SVMKit::Validation.check_params_type_or_nil(Integer, max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
+                                                  max_features: max_features, random_seed: random_seed)
+      SVMKit::Validation.check_params_integer(n_estimators: n_estimators, min_samples_leaf: min_samples_leaf)
+      SVMKit::Validation.check_params_string(criterion: criterion)
+
       @params = {}
       @params[:n_estimators] = n_estimators
       @params[:criterion] = criterion
@@ -59,10 +64,10 @@ module SVMKit
       @params[:max_features] = max_features
       @params[:random_seed] = random_seed
       @params[:random_seed] ||= srand
-      @rng = Random.new(@params[:random_seed])
       @estimators = nil
       @classes = nil
       @feature_importances = nil
+      @rng = Random.new(@params[:random_seed])
     end
 
     # Fit the model with given training data.
@@ -71,6 +76,8 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [RandomForestClassifier] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       # Initialize some variables.
       n_samples, n_features = x.shape
       @params[:max_features] = n_features unless @params[:max_features].is_a?(Integer)
@@ -98,6 +105,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       n_classes = @classes.size
       classes_arr = @classes.to_a
@@ -117,6 +125,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted probability of each class per sample.
     def predict_proba(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       n_classes = @classes.size
       classes_arr = @classes.to_a
@@ -136,6 +145,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples, n_estimators]) Leaf index for sample.
     def apply(x)
+      SVMKit::Validation.check_sample_array(x)
       Numo::Int32[*Array.new(@params[:n_estimators]) { |n| @estimators[n].apply(x) }].transpose
     end
```
data/lib/svmkit/evaluation_measure/accuracy.rb
CHANGED
```diff
@@ -19,6 +19,9 @@ module SVMKit
     # @param y_pred [Numo::Int32] (shape: [n_samples]) Predicted labels.
     # @return [Float] Mean accuracy
     def score(y_true, y_pred)
+      SVMKit::Validation.check_label_array(y_true)
+      SVMKit::Validation.check_label_array(y_pred)
+
       (y_true.to_a.map.with_index { |label, n| label == y_pred[n] ? 1 : 0 }).inject(:+) / y_true.size.to_f
     end
   end
```
data/lib/svmkit/evaluation_measure/f_score.rb
CHANGED
```diff
@@ -23,6 +23,7 @@ module SVMKit
     #
     # @param average [String] The average type ('binary', 'micro', 'macro')
     def initialize(average: 'binary')
+      SVMKit::Validation.check_params_string(average: average)
       @average = average
     end
 
@@ -32,6 +33,9 @@ module SVMKit
     # @param y_pred [Numo::Int32] (shape: [n_samples]) Predicted labels.
     # @return [Float] Average F1-score
     def score(y_true, y_pred)
+      SVMKit::Validation.check_label_array(y_true)
+      SVMKit::Validation.check_label_array(y_pred)
+
       case @average
       when 'binary'
         f_score_each_class(y_true, y_pred).last
```
data/lib/svmkit/evaluation_measure/precision.rb
CHANGED
```diff
@@ -23,6 +23,7 @@ module SVMKit
     #
     # @param average [String] The average type ('binary', 'micro', 'macro')
     def initialize(average: 'binary')
+      SVMKit::Validation.check_params_string(average: average)
       @average = average
     end
 
@@ -32,6 +33,9 @@ module SVMKit
     # @param y_pred [Numo::Int32] (shape: [n_samples]) Predicted labels.
     # @return [Float] Average precision
     def score(y_true, y_pred)
+      SVMKit::Validation.check_label_array(y_true)
+      SVMKit::Validation.check_label_array(y_pred)
+
       case @average
       when 'binary'
         precision_each_class(y_true, y_pred).last
```
data/lib/svmkit/evaluation_measure/recall.rb
CHANGED
```diff
@@ -23,6 +23,7 @@ module SVMKit
     #
     # @param average [String] The average type ('binary', 'micro', 'macro')
     def initialize(average: 'binary')
+      SVMKit::Validation.check_params_string(average: average)
       @average = average
     end
 
@@ -32,6 +33,9 @@ module SVMKit
     # @param y_pred [Numo::Int32] (shape: [n_samples]) Predicted labels.
     # @return [Float] Average recall
     def score(y_true, y_pred)
+      SVMKit::Validation.check_label_array(y_true)
+      SVMKit::Validation.check_label_array(y_pred)
+
       case @average
       when 'binary'
         recall_each_class(y_true, y_pred).last
```
data/lib/svmkit/kernel_approximation/rbf.rb
CHANGED
```diff
@@ -37,14 +37,18 @@ module SVMKit
     # @param n_components [Integer] The number of dimensions of the RBF kernel feature space.
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(gamma: 1.0, n_components: 128, random_seed: nil)
+      SVMKit::Validation.check_params_float(gamma: gamma)
+      SVMKit::Validation.check_params_integer(n_components: n_components)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @params = {}
       @params[:gamma] = gamma
       @params[:n_components] = n_components
       @params[:random_seed] = random_seed
       @params[:random_seed] ||= srand
-      @rng = Random.new(@params[:random_seed])
       @random_mat = nil
       @random_vec = nil
+      @rng = Random.new(@params[:random_seed])
     end
 
     # Fit the model with given training data.
@@ -55,6 +59,8 @@ module SVMKit
     #   This method uses only the number of features of the data.
     # @return [RBF] The learned transformer itself.
     def fit(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
+
       n_features = x.shape[1]
       @params[:n_components] = 2 * n_features if @params[:n_components] <= 0
       @random_mat = rand_normal([n_features, @params[:n_components]]) * (2.0 * @params[:gamma])**0.5
@@ -72,6 +78,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The training data to be used for fitting the model.
     # @return [Numo::DFloat] (shape: [n_samples, n_components]) The transformed data
     def fit_transform(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
+
       fit(x).transform(x)
     end
 
@@ -82,6 +90,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The data to be transformed with the learned model.
     # @return [Numo::DFloat] (shape: [n_samples, n_components]) The transformed data.
     def transform(x)
+      SVMKit::Validation.check_sample_array(x)
+
       n_samples, = x.shape
       projection = x.dot(@random_mat) + @random_vec.tile(n_samples, 1)
       Numo::NMath.sin(projection) * ((2.0 / @params[:n_components])**0.5)
```
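These hunks only add input checks and reorder the `@rng` initialization; the transformer's behavior is unchanged. For context, the usual pipeline pairs this approximation with a linear model. A sketch with made-up random data (the `gamma` and `n_components` values are arbitrary):

```ruby
require 'svmkit'

x = Numo::DFloat.new(30, 4).rand
y = Numo::Int32.cast(Numo::DFloat.new(30).rand.ge(0.5)) * 2 - 1

# Map samples into an approximate RBF kernel feature space, then train a linear SVC on it.
transformer = SVMKit::KernelApproximation::RBF.new(gamma: 2.0, n_components: 64, random_seed: 1)
mapped = transformer.fit_transform(x)
svc = SVMKit::LinearModel::SVC.new(reg_param: 1.0, random_seed: 1)
svc.fit(mapped, y).score(mapped, y)
```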
data/lib/svmkit/kernel_machine/kernel_svc.rb
CHANGED
```diff
@@ -42,13 +42,17 @@ module SVMKit
     # @param max_iter [Integer] The maximum number of iterations.
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(reg_param: 1.0, max_iter: 1000, random_seed: nil)
+      SVMKit::Validation.check_params_float(reg_param: reg_param)
+      SVMKit::Validation.check_params_integer(max_iter: max_iter)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @params = {}
       @params[:reg_param] = reg_param
       @params[:max_iter] = max_iter
       @params[:random_seed] = random_seed
       @params[:random_seed] ||= srand
       @weight_vec = nil
-      @classes
+      @classes = nil
       @rng = Random.new(@params[:random_seed])
     end
 
@@ -59,6 +63,9 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_training_samples]) The labels to be used for fitting the model.
     # @return [KernelSVC] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
+
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       n_classes = @classes.size
       _n_samples, n_features = x.shape
@@ -84,6 +91,8 @@ module SVMKit
     #   The kernel matrix between testing samples and training samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_testing_samples, n_classes]) Confidence score per sample.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
+
       x.dot(@weight_vec.transpose)
     end
 
@@ -93,6 +102,8 @@ module SVMKit
     #   The kernel matrix between testing samples and training samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_testing_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
+
       return Numo::Int32.cast(decision_function(x).ge(0.0)) * 2 - 1 if @classes.size <= 2
 
       n_samples, = x.shape
@@ -100,16 +111,6 @@ module SVMKit
       Numo::Int32.asarray(Array.new(n_samples) { |n| @classes[decision_values[n, true].max_index] })
     end
 
-    # Claculate the mean accuracy of the given testing data.
-    #
-    # @param x [Numo::DFloat] (shape: [n_testing_samples, n_training_samples])
-    #   The kernel matrix between testing samples and training samples.
-    # @param y [Numo::Int32] (shape: [n_testing_samples]) True labels for testing data.
-    # @return [Float] Mean accuracy
-    def score(x, y)
-      super
-    end
-
     # Dump marshal data.
     # @return [Hash] The marshal data about KernelSVC.
     def marshal_dump
```
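Besides the new validation calls, this file drops its `score` override, which did nothing but call `super`; the `Classifier#score` shown in the `base/classifier.rb` hunk above now serves directly. Note that the estimator operates on a precomputed kernel matrix. A sketch with made-up data (values are arbitrary):

```ruby
require 'svmkit'

x = Numo::DFloat.new(20, 4).rand
y = Numo::Int32.cast(Numo::DFloat.new(20).rand.ge(0.5)) * 2 - 1

kernel_mat = SVMKit::PairwiseMetric.rbf_kernel(x, nil, 1.0)
svc = SVMKit::KernelMachine::KernelSVC.new(reg_param: 1.0, max_iter: 100, random_seed: 1)
svc.fit(kernel_mat, y)
svc.score(kernel_mat, y) # mean accuracy via the mixed-in Classifier#score
```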
data/lib/svmkit/linear_model/logistic_regression.rb
CHANGED
```diff
@@ -50,6 +50,11 @@ module SVMKit
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(reg_param: 1.0, fit_bias: false, bias_scale: 1.0,
                    max_iter: 100, batch_size: 50, normalize: true, random_seed: nil)
+      SVMKit::Validation.check_params_float(reg_param: reg_param, bias_scale: bias_scale)
+      SVMKit::Validation.check_params_integer(max_iter: max_iter, batch_size: batch_size)
+      SVMKit::Validation.check_params_boolean(fit_bias: fit_bias, normalize: normalize)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @params = {}
       @params[:reg_param] = reg_param
       @params[:fit_bias] = fit_bias
@@ -71,6 +76,9 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [LogisticRegression] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
+
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       n_classes = @classes.size
       _n_samples, n_features = x.shape
@@ -79,14 +87,14 @@ module SVMKit
         @weight_vec = Numo::DFloat.zeros(n_classes, n_features)
         @bias_term = Numo::DFloat.zeros(n_classes)
         n_classes.times do |n|
-          bin_y = Numo::Int32.cast(y.eq(@classes[n]))
+          bin_y = Numo::Int32.cast(y.eq(@classes[n])) * 2 - 1
           weight, bias = binary_fit(x, bin_y)
           @weight_vec[n, true] = weight
           @bias_term[n] = bias
         end
       else
         negative_label = y.to_a.uniq.sort.first
-        bin_y = Numo::Int32.cast(y.ne(negative_label))
+        bin_y = Numo::Int32.cast(y.ne(negative_label)) * 2 - 1
         @weight_vec, @bias_term = binary_fit(x, bin_y)
       end
 
@@ -98,6 +106,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence score per sample.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
+
       x.dot(@weight_vec.transpose) + @bias_term
     end
 
@@ -106,10 +116,12 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
-
+      SVMKit::Validation.check_sample_array(x)
+
       return Numo::Int32.cast(predict_proba(x)[true, 1].ge(0.5)) * 2 - 1 if @classes.size <= 2
 
       n_samples, = x.shape
-      decision_values =
+      decision_values = predict_proba(x)
       Numo::Int32.asarray(Array.new(n_samples) { |n| @classes[decision_values[n, true].max_index] })
     end
 
@@ -118,6 +130,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted probability of each class per sample.
     def predict_proba(x)
+      SVMKit::Validation.check_sample_array(x)
+
       proba = 1.0 / (Numo::NMath.exp(-decision_function(x)) + 1.0)
       return (proba.transpose / proba.sum(axis: 1)).transpose if @classes.size > 2
 
@@ -165,9 +179,9 @@ module SVMKit
         rand_ids.concat(subset_ids)
         # update the weight vector.
         df = samples[subset_ids, true].dot(weight_vec.transpose)
-        coef = bin_y[subset_ids] / (Numo::NMath.exp(-bin_y[subset_ids] * df) + 1.0)
+        coef = bin_y[subset_ids] / (Numo::NMath.exp(-bin_y[subset_ids] * df) + 1.0) - bin_y[subset_ids]
         mean_vec = samples[subset_ids, true].transpose.dot(coef) / @params[:batch_size]
-        weight_vec -= learning_rate(t) * (@params[:reg_param] * weight_vec
+        weight_vec -= learning_rate(t) * (@params[:reg_param] * weight_vec + mean_vec)
         # scale the weight vector.
         normalize_weight_vec(weight_vec) if @params[:normalize]
       end
```
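The two `binary_fit` hunks are the changelog's gradient fix. With labels mapped to $y \in \{-1, +1\}$ (the `* 2 - 1` change in `fit`), the derivative of the logistic loss $\ell(f, y) = \log(1 + e^{-yf})$ with respect to the margin $f = \mathbf{w}^\top \mathbf{x}$ is

$$\frac{\partial \ell}{\partial f} = \frac{-y}{1 + e^{yf}} = \frac{y}{1 + e^{-yf}} - y.$$

The 0.2.7 code computed only the first term of the right-hand side, dropping the $-y$; the corrected `coef` is exactly $\partial \ell / \partial f$, and the corrected update moves the weights against the L2 penalty gradient plus the mini-batch mean of the `coef`-weighted samples.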
data/lib/svmkit/linear_model/svc.rb
CHANGED
```diff
@@ -49,6 +49,11 @@ module SVMKit
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(reg_param: 1.0, fit_bias: false, bias_scale: 1.0,
                    max_iter: 100, batch_size: 50, normalize: true, random_seed: nil)
+      SVMKit::Validation.check_params_float(reg_param: reg_param, bias_scale: bias_scale)
+      SVMKit::Validation.check_params_integer(max_iter: max_iter, batch_size: batch_size)
+      SVMKit::Validation.check_params_boolean(fit_bias: fit_bias, normalize: normalize)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @params = {}
       @params[:reg_param] = reg_param
       @params[:fit_bias] = fit_bias
@@ -70,6 +75,9 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [SVC] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
+
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       n_classes = @classes.size
       _n_samples, n_features = x.shape
@@ -97,6 +105,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence score per sample.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
+
       x.dot(@weight_vec.transpose) + @bias_term
     end
 
@@ -105,6 +115,8 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
+
       return Numo::Int32.cast(decision_function(x).ge(0.0)) * 2 - 1 if @classes.size <= 2
 
       n_samples, = x.shape
```
data/lib/svmkit/model_selection/cross_validation.rb
CHANGED
```diff
@@ -38,6 +38,10 @@ module SVMKit
     # @param evaluator [Evaluator] The evaluator that calculates score of estimator results.
     # @param return_train_score [Boolean] The flag indicating whether to calculate the score of training dataset.
     def initialize(estimator: nil, splitter: nil, evaluator: nil, return_train_score: false)
+      SVMKit::Validation.check_params_type(SVMKit::Base::BaseEstimator, estimator: estimator)
+      SVMKit::Validation.check_params_type(SVMKit::Base::Splitter, splitter: splitter)
+      SVMKit::Validation.check_params_type_or_nil(SVMKit::Base::Evaluator, evaluator: evaluator)
+      SVMKit::Validation.check_params_boolean(return_train_score: return_train_score)
       @estimator = estimator
       @splitter = splitter
       @evaluator = evaluator
@@ -56,6 +60,8 @@ module SVMKit
     #   * :train_score (Array<Float>) The scores of training dataset for each split. This option is nil if
     #     the return_train_score is false.
     def perform(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       # Initialize the report of cross validation.
       report = { test_score: [], train_score: nil, fit_time: [] }
       report[:train_score] = [] if @return_train_score
```
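With these checks, a mismatched component (say, a splitter passed as `estimator:`) raises a TypeError at construction instead of failing mid-run. A usage sketch with made-up data:

```ruby
require 'svmkit'

x = Numo::DFloat.new(30, 4).rand
y = Numo::Int32.cast(Numo::DFloat.new(30).rand.ge(0.5)) * 2 - 1

svc = SVMKit::LinearModel::SVC.new(reg_param: 1.0, random_seed: 1)
kf  = SVMKit::ModelSelection::StratifiedKFold.new(n_splits: 3, shuffle: true, random_seed: 1)
cv  = SVMKit::ModelSelection::CrossValidation.new(estimator: svc, splitter: kf)
report = cv.perform(x, y)
report[:test_score] # => three per-fold mean accuracies
```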
data/lib/svmkit/model_selection/k_fold.rb
CHANGED
```diff
@@ -32,6 +32,10 @@ module SVMKit
     # @param shuffle [Boolean] The flag indicating whether to shuffle the dataset.
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(n_splits: 3, shuffle: false, random_seed: nil)
+      SVMKit::Validation.check_params_integer(n_splits: n_splits)
+      SVMKit::Validation.check_params_boolean(shuffle: shuffle)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @n_splits = n_splits
       @shuffle = shuffle
       @random_seed = random_seed
@@ -43,11 +47,9 @@ module SVMKit
     #
     # @param x [Numo::DFloat] (shape: [n_samples, n_features])
     #   The dataset to be used to generate data indices for K-fold cross validation.
-    # @param y [Numo::Int32] (shape: [n_samples])
-    #   The labels to be used to generate data indices for stratified K-fold cross validation.
-    #   This argument exists to unify the interface between the K-fold methods, it is not used in the method.
     # @return [Array] The set of data indices for constructing the training and testing dataset in each fold.
-    def split(x,
+    def split(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       # Initialize and check some variables.
       n_samples, = x.shape
       unless @n_splits.between?(2, n_samples)
```
data/lib/svmkit/model_selection/stratified_k_fold.rb
CHANGED
```diff
@@ -32,6 +32,10 @@ module SVMKit
     # @param shuffle [Boolean] The flag indicating whether to shuffle the dataset.
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(n_splits: 3, shuffle: false, random_seed: nil)
+      SVMKit::Validation.check_params_integer(n_splits: n_splits)
+      SVMKit::Validation.check_params_boolean(shuffle: shuffle)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @n_splits = n_splits
       @shuffle = shuffle
       @random_seed = random_seed
@@ -48,6 +52,8 @@ module SVMKit
     #   The labels to be used to generate data indices for stratified K-fold cross validation.
     # @return [Array] The set of data indices for constructing the training and testing dataset in each fold.
     def split(x, y) # rubocop:disable Lint/UnusedMethodArgument
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       # Check the number of samples in each class.
       unless valid_n_splits?(y)
         raise ArgumentError,
```
data/lib/svmkit/multiclass/one_vs_rest_classifier.rb
CHANGED
```diff
@@ -33,6 +33,7 @@ module SVMKit
     #
     # @param estimator [Classifier] The (binary) classifier for construction a multi-class classifier.
     def initialize(estimator: nil)
+      SVMKit::Validation.check_params_type(SVMKit::Base::BaseEstimator, estimator: estimator)
       @params = {}
       @params[:estimator] = estimator
       @estimators = nil
@@ -45,6 +46,8 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [OneVsRestClassifier] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       y_arr = y.to_a
       @classes = Numo::Int32.asarray(y_arr.uniq.sort)
       @estimators = @classes.to_a.map do |label|
@@ -59,6 +62,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence scores per sample for each class.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       n_classes = @classes.size
       Numo::DFloat.asarray(Array.new(n_classes) { |m| @estimators[m].decision_function(x).to_a }).transpose
     end
@@ -68,6 +72,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       decision_values = decision_function(x)
       Numo::Int32.asarray(Array.new(n_samples) { |n| @classes[decision_values[n, true].max_index] })
```
data/lib/svmkit/naive_bayes/naive_bayes.rb
CHANGED
```diff
@@ -16,6 +16,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples = x.shape.first
       decision_values = decision_function(x)
       Numo::Int32.asarray(Array.new(n_samples) { |n| @classes[decision_values[n, true].max_index] })
@@ -26,6 +27,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the log-probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted log-probability of each class per sample.
     def predict_log_proba(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       log_likelihoods = decision_function(x)
       log_likelihoods - Numo::NMath.log(Numo::NMath.exp(log_likelihoods).sum(1)).reshape(n_samples, 1)
@@ -36,6 +38,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted probability of each class per sample.
     def predict_proba(x)
+      SVMKit::Validation.check_sample_array(x)
       Numo::NMath.exp(predict_log_proba(x)).abs
     end
   end
@@ -75,6 +78,8 @@ module SVMKit
     #   to be used for fitting the model.
     # @return [GaussianNB] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       n_samples, = x.shape
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       @class_priors = Numo::DFloat[*@classes.to_a.map { |l| y.eq(l).count / n_samples.to_f }]
@@ -88,6 +93,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence scores per sample for each class.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       n_classes = @classes.size
       log_likelihoods = Array.new(n_classes) do |l|
         Math.log(@class_priors[l]) - 0.5 * (
@@ -147,6 +153,7 @@ module SVMKit
     #
     # @param smoothing_param [Float] The Laplace smoothing parameter.
     def initialize(smoothing_param: 1.0)
+      SVMKit::Validation.check_params_float(smoothing_param: smoothing_param)
       @params = {}
       @params[:smoothing_param] = smoothing_param
     end
@@ -158,6 +165,8 @@ module SVMKit
     #   to be used for fitting the model.
     # @return [MultinomialNB] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       n_samples, = x.shape
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       @class_priors = Numo::DFloat[*@classes.to_a.map { |l| y.eq(l).count / n_samples.to_f }]
@@ -173,6 +182,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence scores per sample for each class.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       n_classes = @classes.size
       bin_x = x.gt(0)
       log_likelihoods = Array.new(n_classes) do |l|
@@ -230,6 +240,7 @@ module SVMKit
     # @param smoothing_param [Float] The Laplace smoothing parameter.
     # @param bin_threshold [Float] The threshold for binarizing of features.
     def initialize(smoothing_param: 1.0, bin_threshold: 0.0)
+      SVMKit::Validation.check_params_float(smoothing_param: smoothing_param, bin_threshold: bin_threshold)
       @params = {}
       @params[:smoothing_param] = smoothing_param
       @params[:bin_threshold] = bin_threshold
@@ -242,6 +253,8 @@ module SVMKit
     #   to be used for fitting the model.
     # @return [BernoulliNB] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       n_samples, = x.shape
       bin_x = Numo::DFloat[*x.gt(@params[:bin_threshold])]
       @classes = Numo::Int32[*y.to_a.uniq.sort]
@@ -260,6 +273,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence scores per sample for each class.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       n_classes = @classes.size
       bin_x = Numo::DFloat[*x.gt(@params[:bin_threshold])]
       not_bin_x = Numo::DFloat[*x.le(@params[:bin_threshold])]
```
data/lib/svmkit/nearest_neighbors/k_neighbors_classifier.rb
CHANGED
```diff
@@ -35,6 +35,7 @@ module SVMKit
     #
     # @param n_neighbors [Integer] The number of neighbors.
     def initialize(n_neighbors: 5)
+      SVMKit::Validation.check_params_integer(n_neighbors: n_neighbors)
       @params = {}
       @params[:n_neighbors] = n_neighbors
       @prototypes = nil
@@ -48,6 +49,8 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [KNeighborsClassifier] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       @prototypes = Numo::DFloat.asarray(x.to_a)
       @labels = Numo::Int32.asarray(y.to_a)
       @classes = Numo::Int32.asarray(y.to_a.uniq.sort)
@@ -59,6 +62,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Confidence scores per sample for each class.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       distance_matrix = PairwiseMetric.euclidean_distance(x, @prototypes)
       n_samples, n_prototypes = distance_matrix.shape
       n_classes = @classes.size
@@ -76,6 +80,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples = x.shape.first
       decision_values = decision_function(x)
       Numo::Int32.asarray(Array.new(n_samples) { |n| @classes[decision_values[n, true].max_index] })
```
data/lib/svmkit/pairwise_metric.rb
CHANGED
```diff
@@ -11,6 +11,8 @@ module SVMKit
     # @return [Numo::DFloat] (shape: [n_samples_x, n_samples_x] or [n_samples_x, n_samples_y] if y is given)
     def euclidean_distance(x, y = nil)
       y = x if y.nil?
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_sample_array(y)
       sum_x_vec = (x**2).sum(1)
       sum_y_vec = (y**2).sum(1)
       dot_xy_mat = x.dot(y.transpose)
@@ -29,6 +31,9 @@ module SVMKit
     def rbf_kernel(x, y = nil, gamma = nil)
       y = x if y.nil?
       gamma ||= 1.0 / x.shape[1]
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_sample_array(y)
+      SVMKit::Validation.check_params_float(gamma: gamma)
       distance_matrix = euclidean_distance(x, y)
       Numo::NMath.exp((distance_matrix**2) * -gamma)
     end
@@ -40,6 +45,8 @@ module SVMKit
     # @return [Numo::DFloat] (shape: [n_samples_x, n_samples_x] or [n_samples_x, n_samples_y] if y is given)
     def linear_kernel(x, y = nil)
       y = x if y.nil?
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_sample_array(y)
       x.dot(y.transpose)
     end
 
@@ -54,6 +61,10 @@ module SVMKit
     def polynomial_kernel(x, y = nil, degree = 3, gamma = nil, coef = 1)
       y = x if y.nil?
       gamma ||= 1.0 / x.shape[1]
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_sample_array(y)
+      SVMKit::Validation.check_params_float(gamma: gamma)
+      SVMKit::Validation.check_params_integer(degree: degree, coef: coef)
       (x.dot(y.transpose) * gamma + coef)**degree
     end
 
@@ -67,6 +78,10 @@ module SVMKit
     def sigmoid_kernel(x, y = nil, gamma = nil, coef = 1)
       y = x if y.nil?
       gamma ||= 1.0 / x.shape[1]
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_sample_array(y)
+      SVMKit::Validation.check_params_float(gamma: gamma)
+      SVMKit::Validation.check_params_integer(coef: coef)
       Numo::NMath.tanh(x.dot(y.transpose) * gamma + coef)
     end
   end
```
data/lib/svmkit/polynomial_model/factorization_machine_classifier.rb
CHANGED
```diff
@@ -58,6 +58,12 @@ module SVMKit
     # @param random_seed [Integer] The seed value using to initialize the random generator.
     def initialize(n_factors: 2, loss: 'hinge', reg_param_bias: 1.0, reg_param_weight: 1.0, reg_param_factor: 1.0,
                    init_std: 0.1, max_iter: 1000, batch_size: 10, random_seed: nil)
+      SVMKit::Validation.check_params_float(reg_param_bias: reg_param_bias, reg_param_weight: reg_param_weight,
+                                            reg_param_factor: reg_param_factor, init_std: init_std)
+      SVMKit::Validation.check_params_integer(n_factors: n_factors, max_iter: max_iter, batch_size: batch_size)
+      SVMKit::Validation.check_params_string(loss: loss)
+      SVMKit::Validation.check_params_type_or_nil(Integer, random_seed: random_seed)
+
       @params = {}
       @params[:n_factors] = n_factors
       @params[:loss] = loss
@@ -82,6 +88,9 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [FactorizationMachineClassifier] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
+
       @classes = Numo::Int32[*y.to_a.uniq.sort]
       n_classes = @classes.size
       _n_samples, n_features = x.shape
@@ -111,6 +120,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to compute the scores.
     # @return [Numo::DFloat] (shape: [n_samples]) Confidence score per sample.
     def decision_function(x)
+      SVMKit::Validation.check_sample_array(x)
       linear_term = @bias_term + x.dot(@weight_vec.transpose)
       factor_term = if @classes.size <= 2
                       0.5 * (@factor_mat.dot(x.transpose)**2 - (@factor_mat**2).dot(x.transpose**2)).sum
@@ -125,6 +135,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       return Numo::Int32.cast(decision_function(x).ge(0.0)) * 2 - 1 if @classes.size <= 2
 
       n_samples, = x.shape
@@ -137,6 +148,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted probability of each class per sample.
     def predict_proba(x)
+      SVMKit::Validation.check_sample_array(x)
       proba = 1.0 / (Numo::NMath.exp(-decision_function(x)) + 1.0)
       return (proba.transpose / proba.sum(axis: 1)).transpose if @classes.size > 2
 
```
data/lib/svmkit/preprocessing/l2_normalizer.rb
CHANGED
```diff
@@ -32,6 +32,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to calculate L2-norms.
     # @return [L2Normalizer]
     def fit(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       @norm_vec = Numo::NMath.sqrt((x**2).sum(1))
       self
     end
@@ -43,6 +44,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to calculate L2-norms.
     # @return [Numo::DFloat] The normalized samples.
     def fit_transform(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       fit(x)
       x / @norm_vec.tile(x.shape[1], 1).transpose
     end
```
data/lib/svmkit/preprocessing/min_max_scaler.rb
CHANGED
```diff
@@ -28,6 +28,7 @@ module SVMKit
     #
     # @param feature_range [Array<Float>] The desired range of samples.
     def initialize(feature_range: [0.0, 1.0])
+      SVMKit::Validation.check_params_type(Array, feature_range: feature_range)
       @params = {}
       @params[:feature_range] = feature_range
       @min_vec = nil
@@ -41,6 +42,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to calculate the minimum and maximum values.
     # @return [MinMaxScaler]
     def fit(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       @min_vec = x.min(0)
       @max_vec = x.max(0)
       self
@@ -53,6 +55,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to calculate the minimum and maximum values.
     # @return [Numo::DFloat] The scaled samples.
     def fit_transform(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       fit(x).transform(x)
     end
 
@@ -61,6 +64,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to be scaled.
     # @return [Numo::DFloat] The scaled samples.
     def transform(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       dif_vec = @max_vec - @min_vec
       nx = (x - @min_vec.tile(n_samples, 1)) / dif_vec.tile(n_samples, 1)
```
data/lib/svmkit/preprocessing/standard_scaler.rb
CHANGED
```diff
@@ -39,6 +39,7 @@ module SVMKit
     #   The samples to calculate the mean values and standard deviations.
     # @return [StandardScaler]
     def fit(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       @mean_vec = x.mean(0)
       @std_vec = x.stddev(0)
       self
@@ -52,6 +53,7 @@ module SVMKit
     #   The samples to calculate the mean values and standard deviations.
     # @return [Numo::DFloat] The scaled samples.
     def fit_transform(x, _y = nil)
+      SVMKit::Validation.check_sample_array(x)
       fit(x).transform(x)
     end
 
@@ -60,6 +62,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to be scaled.
     # @return [Numo::DFloat] The scaled samples.
     def transform(x)
+      SVMKit::Validation.check_sample_array(x)
       n_samples, = x.shape
       (x - @mean_vec.tile(n_samples, 1)) / @std_vec.tile(n_samples, 1)
     end
```
data/lib/svmkit/tree/decision_tree_classifier.rb
CHANGED
```diff
@@ -54,6 +54,11 @@ module SVMKit
     #   It is used to randomly determine the order of features when deciding spliting point.
     def initialize(criterion: 'gini', max_depth: nil, max_leaf_nodes: nil, min_samples_leaf: 1, max_features: nil,
                    random_seed: nil)
+      SVMKit::Validation.check_params_type_or_nil(Integer, max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
+                                                  max_features: max_features, random_seed: random_seed)
+      SVMKit::Validation.check_params_integer(min_samples_leaf: min_samples_leaf)
+      SVMKit::Validation.check_params_string(criterion: criterion)
+
       @params = {}
       @params[:criterion] = criterion
       @params[:max_depth] = max_depth
@@ -62,12 +67,12 @@ module SVMKit
       @params[:max_features] = max_features
       @params[:random_seed] = random_seed
       @params[:random_seed] ||= srand
-      @rng = Random.new(@params[:random_seed])
       @tree = nil
       @classes = nil
       @feature_importances = nil
       @n_leaves = nil
       @leaf_labels = nil
+      @rng = Random.new(@params[:random_seed])
     end
 
     # Fit the model with given training data.
@@ -76,6 +81,8 @@ module SVMKit
     # @param y [Numo::Int32] (shape: [n_samples]) The labels to be used for fitting the model.
     # @return [DecisionTreeClassifier] The learned classifier itself.
     def fit(x, y)
+      SVMKit::Validation.check_sample_array(x)
+      SVMKit::Validation.check_label_array(y)
       n_samples, n_features = x.shape
       @params[:max_features] = n_features unless @params[:max_features].is_a?(Integer)
       @params[:max_features] = [[1, @params[:max_features]].max, n_features].min
@@ -90,6 +97,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Predicted class label per sample.
     def predict(x)
+      SVMKit::Validation.check_sample_array(x)
       @leaf_labels[apply(x)]
     end
 
@@ -98,6 +106,7 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the probailities.
     # @return [Numo::DFloat] (shape: [n_samples, n_classes]) Predicted probability of each class per sample.
     def predict_proba(x)
+      SVMKit::Validation.check_sample_array(x)
       probs = Numo::DFloat[*(Array.new(x.shape[0]) { |n| predict_at_node(@tree, x[n, true]) })]
       probs[true, @classes]
     end
@@ -107,14 +116,18 @@ module SVMKit
     # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
     # @return [Numo::Int32] (shape: [n_samples]) Leaf index for sample.
     def apply(x)
+      SVMKit::Validation.check_sample_array(x)
       Numo::Int32[*(Array.new(x.shape[0]) { |n| apply_at_node(@tree, x[n, true]) })]
     end
 
     # Dump marshal data.
     # @return [Hash] The marshal data about DecisionTreeClassifier
     def marshal_dump
-      { params: @params,
-
+      { params: @params,
+        classes: @classes,
+        tree: @tree,
+        feature_importances: @feature_importances,
+        leaf_labels: @leaf_labels,
         rng: @rng }
     end
```
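The `marshal_dump` change restores the learned state (`classes`, `tree`, `feature_importances`, `leaf_labels`) to the dumped hash, so a fitted tree should survive a `Marshal` round trip. A sketch with made-up data (labels kept non-negative, since the tree indexes classes by value):

```ruby
require 'svmkit'

x = Numo::DFloat.new(20, 3).rand
y = Numo::Int32.cast(Numo::DFloat.new(20).rand.ge(0.5)) # labels in {0, 1}

tree = SVMKit::Tree::DecisionTreeClassifier.new(random_seed: 1)
tree.fit(x, y)
restored = Marshal.load(Marshal.dump(tree))
restored.predict(x) # expected to match tree.predict(x)
```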
data/lib/svmkit/validation.rb
ADDED
```diff
@@ -0,0 +1,55 @@
+# frozen_string_literal: true
+
+module SVMKit
+  # @!visibility private
+  module Validation
+    module_function
+
+    # @!visibility private
+    def check_sample_array(x)
+      raise TypeError, 'Expect class of sample matrix to be Numo::DFloat' unless x.is_a?(Numo::DFloat)
+      raise ArgumentError, 'Expect sample matrix to be 2-D array' unless x.shape.size == 2
+      nil
+    end
+
+    # @!visibility private
+    def check_label_array(y)
+      raise TypeError, 'Expect class of label vector to be Numo::Int32' unless y.is_a?(Numo::Int32)
+      raise ArgumentError, 'Expect label vector to be 1-D arrray' unless y.shape.size == 1
+      nil
+    end
+
+    # @!visibility private
+    def check_params_type(type, params = {})
+      params.each { |k, v| raise TypeError, "Expect class of #{k} to be #{type}" unless v.is_a?(type) }
+      nil
+    end
+
+    # @!visibility private
+    def check_params_type_or_nil(type, params = {})
+      params.each { |k, v| raise TypeError, "Expect class of #{k} to be #{type} or nil" unless v.is_a?(type) || v.is_a?(NilClass) }
+      nil
+    end
+
+    # @!visibility private
+    def check_params_float(params = {})
+      check_params_type(Float, params)
+    end
+
+    # @!visibility private
+    def check_params_integer(params = {})
+      check_params_type(Integer, params)
+    end
+
+    # @!visibility private
+    def check_params_string(params = {})
+      check_params_type(String, params)
+    end
+
+    # @!visibility private
+    def check_params_boolean(params = {})
+      params.each { |k, v| raise TypeError, "Expect class of #{k} to be Boolean" unless v.is_a?(FalseClass) || v.is_a?(TrueClass) }
+      nil
+    end
+  end
+end
```
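These are the helpers every hunk above calls. They are marked `@!visibility private` (internal API), but invoking them directly illustrates the two failure modes they guard against; a sketch assuming the 0.2.8 behavior:

```ruby
require 'svmkit'

SVMKit::Validation.check_params_integer(max_iter: 100)
# => nil (valid)
SVMKit::Validation.check_params_integer(max_iter: 100.0)
# raises TypeError: Expect class of max_iter to be Integer

vec = Numo::DFloat.new(10).rand # 1-D, so not a valid sample matrix
SVMKit::Validation.check_sample_array(vec)
# raises ArgumentError: Expect sample matrix to be 2-D array
```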
data/lib/svmkit/version.rb
CHANGED
data/lib/svmkit.rb
CHANGED
metadata
CHANGED
```diff
@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: svmkit
 version: !ruby/object:Gem::Version
-  version: 0.2.7
+  version: 0.2.8
 platform: ruby
 authors:
 - yoshoku
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2018-04-
+date: 2018-04-05 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: numo-narray
@@ -135,6 +135,7 @@ files:
 - lib/svmkit/preprocessing/min_max_scaler.rb
 - lib/svmkit/preprocessing/standard_scaler.rb
 - lib/svmkit/tree/decision_tree_classifier.rb
+- lib/svmkit/validation.rb
 - lib/svmkit/version.rb
 - svmkit.gemspec
 homepage: https://github.com/yoshoku/svmkit
```