RubyGems - rumale - Versions diffs - 0.13.8 → 0.14.0 - Mend

rumale 0.13.8 → 0.14.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (102)

checksums.yaml +4 -4
data/CHANGELOG.md +24 -0
data/README.md +8 -10
data/lib/rumale.rb +3 -0
data/lib/rumale/base/classifier.rb +2 -2
data/lib/rumale/base/cluster_analyzer.rb +2 -2
data/lib/rumale/base/regressor.rb +2 -2
data/lib/rumale/clustering/dbscan.rb +3 -4
data/lib/rumale/clustering/gaussian_mixture.rb +5 -6
data/lib/rumale/clustering/hdbscan.rb +4 -4
data/lib/rumale/clustering/k_means.rb +5 -6
data/lib/rumale/clustering/k_medoids.rb +5 -6
data/lib/rumale/clustering/power_iteration.rb +4 -6
data/lib/rumale/clustering/single_linkage.rb +3 -3
data/lib/rumale/clustering/snn.rb +1 -1
data/lib/rumale/clustering/spectral_clustering.rb +4 -6
data/lib/rumale/dataset.rb +6 -10
data/lib/rumale/decomposition/factor_analysis.rb +4 -4
data/lib/rumale/decomposition/fast_ica.rb +6 -7
data/lib/rumale/decomposition/nmf.rb +6 -7
data/lib/rumale/decomposition/pca.rb +6 -7
data/lib/rumale/ensemble/ada_boost_classifier.rb +8 -8
data/lib/rumale/ensemble/ada_boost_regressor.rb +7 -7
data/lib/rumale/ensemble/extra_trees_classifier.rb +8 -8
data/lib/rumale/ensemble/extra_trees_regressor.rb +7 -7
data/lib/rumale/ensemble/gradient_boosting_classifier.rb +8 -8
data/lib/rumale/ensemble/gradient_boosting_regressor.rb +8 -8
data/lib/rumale/ensemble/random_forest_classifier.rb +8 -8
data/lib/rumale/ensemble/random_forest_regressor.rb +7 -7
data/lib/rumale/evaluation_measure/accuracy.rb +2 -2
data/lib/rumale/evaluation_measure/adjusted_rand_score.rb +2 -2
data/lib/rumale/evaluation_measure/calinski_harabasz_score.rb +2 -2
data/lib/rumale/evaluation_measure/davies_bouldin_score.rb +2 -2
data/lib/rumale/evaluation_measure/explained_variance_score.rb +2 -2
data/lib/rumale/evaluation_measure/f_score.rb +2 -2
data/lib/rumale/evaluation_measure/log_loss.rb +2 -2
data/lib/rumale/evaluation_measure/mean_absolute_error.rb +2 -2
data/lib/rumale/evaluation_measure/mean_squared_error.rb +2 -2
data/lib/rumale/evaluation_measure/mean_squared_log_error.rb +2 -2
data/lib/rumale/evaluation_measure/median_absolute_error.rb +2 -2
data/lib/rumale/evaluation_measure/mutual_information.rb +2 -2
data/lib/rumale/evaluation_measure/normalized_mutual_information.rb +2 -2
data/lib/rumale/evaluation_measure/precision.rb +2 -2
data/lib/rumale/evaluation_measure/purity.rb +2 -2
data/lib/rumale/evaluation_measure/r2_score.rb +2 -2
data/lib/rumale/evaluation_measure/recall.rb +2 -2
data/lib/rumale/evaluation_measure/roc_auc.rb +6 -3
data/lib/rumale/evaluation_measure/silhouette_score.rb +2 -2
data/lib/rumale/kernel_approximation/rbf.rb +5 -6
data/lib/rumale/kernel_machine/kernel_pca.rb +4 -4
data/lib/rumale/kernel_machine/kernel_ridge.rb +3 -3
data/lib/rumale/kernel_machine/kernel_svc.rb +7 -8
data/lib/rumale/linear_model/lasso.rb +5 -6
data/lib/rumale/linear_model/linear_regression.rb +5 -6
data/lib/rumale/linear_model/logistic_regression.rb +16 -15
data/lib/rumale/linear_model/ridge.rb +5 -6
data/lib/rumale/linear_model/svc.rb +34 -28
data/lib/rumale/linear_model/svr.rb +5 -6
data/lib/rumale/manifold/mds.rb +3 -4
data/lib/rumale/manifold/tsne.rb +3 -5
data/lib/rumale/model_selection/cross_validation.rb +6 -5
data/lib/rumale/model_selection/grid_search_cv.rb +6 -6
data/lib/rumale/model_selection/k_fold.rb +3 -3
data/lib/rumale/model_selection/shuffle_split.rb +3 -5
data/lib/rumale/model_selection/stratified_k_fold.rb +4 -4
data/lib/rumale/model_selection/stratified_shuffle_split.rb +4 -6
data/lib/rumale/multiclass/one_vs_rest_classifier.rb +4 -4
data/lib/rumale/naive_bayes/naive_bayes.rb +14 -14
data/lib/rumale/nearest_neighbors/k_neighbors_classifier.rb +5 -5
data/lib/rumale/nearest_neighbors/k_neighbors_regressor.rb +4 -4
data/lib/rumale/neural_network/base_mlp.rb +244 -0
data/lib/rumale/neural_network/mlp_classifier.rb +119 -0
data/lib/rumale/neural_network/mlp_regressor.rb +89 -0
data/lib/rumale/optimizer/ada_grad.rb +1 -1
data/lib/rumale/optimizer/adam.rb +3 -3
data/lib/rumale/optimizer/nadam.rb +1 -1
data/lib/rumale/optimizer/rmsprop.rb +1 -1
data/lib/rumale/optimizer/sgd.rb +1 -1
data/lib/rumale/optimizer/yellow_fin.rb +1 -2
data/lib/rumale/pairwise_metric.rb +17 -19
data/lib/rumale/pipeline/pipeline.rb +10 -10
data/lib/rumale/polynomial_model/factorization_machine_classifier.rb +29 -21
data/lib/rumale/polynomial_model/factorization_machine_regressor.rb +6 -6
data/lib/rumale/preprocessing/bin_discretizer.rb +3 -3
data/lib/rumale/preprocessing/l2_normalizer.rb +2 -2
data/lib/rumale/preprocessing/label_binarizer.rb +2 -2
data/lib/rumale/preprocessing/label_encoder.rb +1 -1
data/lib/rumale/preprocessing/max_abs_scaler.rb +3 -3
data/lib/rumale/preprocessing/min_max_scaler.rb +3 -3
data/lib/rumale/preprocessing/one_hot_encoder.rb +4 -3
data/lib/rumale/preprocessing/ordinal_encoder.rb +1 -1
data/lib/rumale/preprocessing/standard_scaler.rb +3 -3
data/lib/rumale/tree/base_decision_tree.rb +1 -1
data/lib/rumale/tree/decision_tree_classifier.rb +7 -7
data/lib/rumale/tree/decision_tree_regressor.rb +6 -6
data/lib/rumale/tree/extra_tree_classifier.rb +7 -7
data/lib/rumale/tree/extra_tree_regressor.rb +6 -6
data/lib/rumale/tree/gradient_tree_regressor.rb +9 -9
data/lib/rumale/validation.rb +32 -2
data/lib/rumale/version.rb +1 -1
data/rumale.gemspec +7 -7
metadata +11 -7

data/lib/rumale/tree/extra_tree_regressor.rb CHANGED

@@ -46,9 +46,9 @@ module Rumale
       #   It is used to randomly determine the order of features when deciding spliting point.
       def initialize(criterion: 'mse', max_depth: nil, max_leaf_nodes: nil, min_samples_leaf: 1, max_features: nil,
                      random_seed: nil)
-        check_params_type_or_nil(Integer, max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
-                                          max_features: max_features, random_seed: random_seed)
-        check_params_integer(min_samples_leaf: min_samples_leaf)
+        check_params_numeric_or_nil(max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
+                                    max_features: max_features, random_seed: random_seed)
+        check_params_numeric(min_samples_leaf: min_samples_leaf)
         check_params_string(criterion: criterion)
         check_params_positive(max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
                               min_samples_leaf: min_samples_leaf, max_features: max_features)
@@ -61,8 +61,8 @@ module Rumale
       # @param y [Numo::DFloat] (shape: [n_samples, n_outputs]) The taget values to be used for fitting the model.
       # @return [ExtraTreeRegressor] The learned regressor itself.
       def fit(x, y)
-        check_sample_array(x)
-        check_tvalue_array(y)
+        x = check_convert_sample_array(x)
+        y = check_convert_tvalue_array(y)
         check_sample_tvalue_size(x, y)
         super
       end
@@ -72,7 +72,7 @@ module Rumale
       # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the values.
       # @return [Numo::DFloat] (shape: [n_samples, n_outputs]) Predicted values per sample.
       def predict(x)
-        check_sample_array(x)
+        x = check_convert_sample_array(x)
         super
       end

data/lib/rumale/tree/gradient_tree_regressor.rb CHANGED

@@ -52,10 +52,9 @@ module Rumale
       #   It is used to randomly determine the order of features when deciding spliting point.
       def initialize(reg_lambda: 0.0, shrinkage_rate: 1.0,
                      max_depth: nil, max_leaf_nodes: nil, min_samples_leaf: 1, max_features: nil, random_seed: nil)
-        check_params_type_or_nil(Integer, max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
-                                          max_features: max_features, random_seed: random_seed)
-        check_params_float(reg_lambda: reg_lambda, shrinkage_rate: shrinkage_rate)
-        check_params_integer(min_samples_leaf: min_samples_leaf)
+        check_params_numeric_or_nil(max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
+                                    max_features: max_features, random_seed: random_seed)
+        check_params_numeric(reg_lambda: reg_lambda, shrinkage_rate: shrinkage_rate, min_samples_leaf: min_samples_leaf)
         check_params_positive(reg_lambda: reg_lambda, shrinkage_rate: shrinkage_rate,
                               max_depth: max_depth, max_leaf_nodes: max_leaf_nodes,
                               min_samples_leaf: min_samples_leaf, max_features: max_features)
@@ -83,10 +82,11 @@ module Rumale
       # @param h [Numo::DFloat] (shape: [n_samples]) The hessian of loss function.
       # @return [GradientTreeRegressor] The learned regressor itself.
       def fit(x, y, g, h)
-        check_sample_array(x)
-        check_tvalue_array(y)
+        x = check_convert_sample_array(x)
+        y = check_convert_tvalue_array(y)
+        g = check_convert_tvalue_array(g)
+        h = check_convert_tvalue_array(h)
         check_sample_tvalue_size(x, y)
-        check_params_type(Numo::DFloat, g: g, h: g)
         # Initialize some variables.
         n_features = x.shape[1]
         @params[:max_features] ||= n_features
@@ -105,7 +105,7 @@ module Rumale
       # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the values.
       # @return [Numo::DFloat] (size: n_samples) Predicted values per sample.
       def predict(x)
-        check_sample_array(x)
+        x = check_convert_sample_array(x)
         @leaf_weights[apply(x)].dup
       end
@@ -114,7 +114,7 @@ module Rumale
       # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The samples to predict the labels.
       # @return [Numo::Int32] (shape: [n_samples]) Leaf index for sample.
       def apply(x)
-        check_sample_array(x)
+        x = check_convert_sample_array(x)
         Numo::Int32[*(Array.new(x.shape[0]) { |n| apply_at_node(@tree, x[n, true]) })]
       end

data/lib/rumale/validation.rb CHANGED

@@ -5,17 +5,37 @@ module Rumale
   module Validation
     module_function
+    # @!visibility private
+    def check_convert_sample_array(x)
+      x = Numo::DFloat.cast(x) unless x.is_a?(Numo::DFloat)
+      raise ArgumentError, 'Expect sample matrix to be 2-D array' unless x.ndim == 2
+      x
+    end
+    # @!visibility private
+    def check_convert_label_array(y)
+      y = Numo::Int32.cast(y) unless y.is_a?(Numo::Int32)
+      raise ArgumentError, 'Expect label vector to be 1-D arrray' unless y.ndim == 1
+      y
+    end
+    # @!visibility private
+    def check_convert_tvalue_array(y)
+      y = Numo::DFloat.cast(y) unless y.is_a?(Numo::DFloat)
+      y
+    end
     # @!visibility private
     def check_sample_array(x)
       raise TypeError, 'Expect class of sample matrix to be Numo::DFloat' unless x.is_a?(Numo::DFloat)
-      raise ArgumentError, 'Expect sample matrix to be 2-D array' unless x.shape.size == 2
+      raise ArgumentError, 'Expect sample matrix to be 2-D array' unless x.ndim == 2
       nil
     end
     # @!visibility private
     def check_label_array(y)
       raise TypeError, 'Expect class of label vector to be Numo::Int32' unless y.is_a?(Numo::Int32)
-      raise ArgumentError, 'Expect label vector to be 1-D arrray' unless y.shape.size == 1
+      raise ArgumentError, 'Expect label vector to be 1-D arrray' unless y.ndim == 1
       nil
     end
@@ -49,6 +69,16 @@ module Rumale
       nil
     end
+    # @!visibility private
+    def check_params_numeric(params = {})
+      check_params_type(Numeric, params)
+    end
+    # @!visibility private
+    def check_params_numeric_or_nil(params = {})
+      check_params_type_or_nil(Numeric, params)
+    end
     # @!visibility private
     def check_params_float(params = {})
       check_params_type(Float, params)

data/lib/rumale/version.rb CHANGED

@@ -3,5 +3,5 @@
 # Rumale is a machine learning library in Ruby.
 module Rumale
   # The version of Rumale you are using.
-  VERSION = '0.13.8'
+  VERSION = '0.14.0'
 end

data/rumale.gemspec CHANGED

@@ -1,4 +1,3 @@
 lib = File.expand_path('lib', __dir__)
 $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
 require 'rumale/version'
@@ -13,14 +12,15 @@ Gem::Specification.new do |spec|
     Rumale is a machine learning library in Ruby.
     Rumale provides machine learning algorithms with interfaces similar to Scikit-Learn in Python.
   MSG
-  spec.description   = <<~MSG
+  spec.description = <<~MSG
     Rumale is a machine learning library in Ruby.
     Rumale provides machine learning algorithms with interfaces similar to Scikit-Learn in Python.
-    Rumale currently supports Linear / Kernel Support Vector Machine,
-    Logistic Regression, Linear Regression, Ridge, Lasso, Kernel Ridge, Factorization Machine,
-    Naive Bayes, Decision Tree, AdaBoost, Gradient Tree Boosting, Random Forest, Extra-Trees, K-nearest neighbor algorithm,
-    K-Means, K-Medoids, Gaussian Mixture Model, DBSCAN, HDBSCAN, SNN, Spectral Clustering, Power Iteration Clustering,
-    Multidimensional Scaling, t-SNE, Principal Component Analysis, Kernel PCA, and Non-negative Matrix Factorization.
+    Rumale supports Support Vector Machine,
+    Logistic Regression, Ridge, Lasso, Factorization Machine,
+    Multi-layer Perceptron,
+    Naive Bayes, Decision Tree, Gradient Tree Boosting, Random Forest,
+    K-Means, Gaussian Mixture Model, DBSCAN, Spectral Clustering,
+    Mutidimensional Scaling, t-SNE, Principal Component Analysis, and Non-negative Matrix Factorization.
   MSG
   spec.homepage      = 'https://github.com/yoshoku/rumale'
   spec.license       = 'BSD-2-Clause'

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: rumale
 version: !ruby/object:Gem::Version
-  version: 0.13.8
+  version: 0.14.0
 platform: ruby
 authors:
 - yoshoku
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2019-11-08 00:00:00.000000000 Z
+date: 2019-11-16 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: numo-narray
@@ -125,11 +125,12 @@ dependencies:
 description: |
   Rumale is a machine learning library in Ruby.
   Rumale provides machine learning algorithms with interfaces similar to Scikit-Learn in Python.
-  Rumale currently supports Linear / Kernel Support Vector Machine,
-  Logistic Regression, Linear Regression, Ridge, Lasso, Kernel Ridge, Factorization Machine,
-  Naive Bayes, Decision Tree, AdaBoost, Gradient Tree Boosting, Random Forest, Extra-Trees, K-nearest neighbor algorithm,
-  K-Means, K-Medoids, Gaussian Mixture Model, DBSCAN, HDBSCAN, SNN, Spectral Clustering, Power Iteration Clustering,
-  Multidimensional Scaling, t-SNE, Principal Component Analysis, Kernel PCA, and Non-negative Matrix Factorization.
+  Rumale supports Support Vector Machine,
+  Logistic Regression, Ridge, Lasso, Factorization Machine,
+  Multi-layer Perceptron,
+  Naive Bayes, Decision Tree, Gradient Tree Boosting, Random Forest,
+  K-Means, Gaussian Mixture Model, DBSCAN, Spectral Clustering,
+  Mutidimensional Scaling, t-SNE, Principal Component Analysis, and Non-negative Matrix Factorization.
 email:
 - yoshoku@outlook.com
 executables: []
@@ -226,6 +227,9 @@ files:
 - lib/rumale/naive_bayes/naive_bayes.rb
 - lib/rumale/nearest_neighbors/k_neighbors_classifier.rb
 - lib/rumale/nearest_neighbors/k_neighbors_regressor.rb
+- lib/rumale/neural_network/base_mlp.rb
+- lib/rumale/neural_network/mlp_classifier.rb
+- lib/rumale/neural_network/mlp_regressor.rb
 - lib/rumale/optimizer/ada_grad.rb
 - lib/rumale/optimizer/adam.rb
 - lib/rumale/optimizer/nadam.rb