RubyGems - rumale-decomposition - Versions diffs - 0.28.0 → 0.29.0 - Mend

rumale-decomposition 0.28.0 → 0.29.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

checksums.yaml +4 -4
data/LICENSE.txt +1 -1
data/lib/rumale/decomposition/fast_ica.rb +1 -1
data/lib/rumale/decomposition/nmf.rb +1 -1
data/lib/rumale/decomposition/pca.rb +1 -1
data/lib/rumale/decomposition/sparse_pca.rb +165 -0
data/lib/rumale/decomposition/version.rb +1 -1
data/lib/rumale/decomposition.rb +1 -0
metadata +6 -5

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: c8af7f0f9ed9935345159cdc99580adf42a196e25e873572d065d3297831769d
-  data.tar.gz: 1cde7e86b60af3eb3013764479205bc7644b15d65e1efd4f89b5d399ded94125
+  metadata.gz: 84715613fb41ef3b6961b9280f6750fc831daa161ddee4e3666ab906e0670599
+  data.tar.gz: c3079e09e5ca5b011d8067457eb89a451b8fd0819a8f996630018a1b4cac41e7
 SHA512:
-  metadata.gz: ecc70ed7d6d49b0b4d9fc3a074cfce03f72a9d9bdcb53fe043059256f38826c9988e22312ab028ae3ae04a451da752e01f4483678e6441963b9aded4e0121f5b
-  data.tar.gz: b90020afa33252d132e7936711df156f13d89ceb23a49ef21f8d8ab654772b37417ea2f581ac4ef42c55fd467a6056e9aac2fd38d349b748bebfae0446c52e4e
+  metadata.gz: 8568f69c7acdf8ccc2c14ba6c9281e1ba145bcd400bf80ef9cbbdedd12f337455614170b1c5eff94c45ae8453ba00fb515deaad4a1ca0a56576a023264006f31
+  data.tar.gz: de013d05ad22b323d03e3eecac12edff941c3ecf9ad02e21a2302ee75cd6574cd06ccb1612d15bf758315191960065098212f70f8ea6980a26417dee3ef6090d

data/LICENSE.txt CHANGED Viewed

@@ -1,4 +1,4 @@
-Copyright (c) 2022-2023 Atsushi Tatsuma
+Copyright (c) 2022-2024 Atsushi Tatsuma
 All rights reserved.
 Redistribution and use in source and binary forms, with or without

data/lib/rumale/decomposition/fast_ica.rb CHANGED Viewed

@@ -57,7 +57,7 @@ module Rumale
           alpha: alpha,
           max_iter: max_iter,
           tol: tol,
-          random_seed: (random_seed || srand)
+          random_seed: random_seed || srand
         }
         @rng = Random.new(@params[:random_seed])
       end

data/lib/rumale/decomposition/nmf.rb CHANGED Viewed

@@ -42,7 +42,7 @@ module Rumale
           max_iter: max_iter,
           tol: tol,
           eps: eps,
-          random_seed: (random_seed || srand)
+          random_seed: random_seed || srand
         }
         @rng = Random.new(@params[:random_seed])
       end

data/lib/rumale/decomposition/pca.rb CHANGED Viewed

@@ -62,7 +62,7 @@ module Rumale
           solver: 'fpt',
           max_iter: max_iter,
           tol: tol,
-          random_seed: (random_seed || srand)
+          random_seed: random_seed || srand
         }
         @params[:solver] = 'evd' if (solver == 'auto' && enable_linalg?(warning: false)) || solver == 'evd'
         @rng = Random.new(@params[:random_seed])

data/lib/rumale/decomposition/sparse_pca.rb ADDED Viewed

@@ -0,0 +1,165 @@
+# frozen_string_literal: true
+require 'rumale/base/estimator'
+require 'rumale/base/transformer'
+require 'rumale/utils'
+require 'rumale/validation'
+module Rumale
+  module Decomposition
+    # SparsePCA is a class that implements Sparse Principal Component Analysis.
+    #
+    # @example
+    #   require 'numo/tiny_linalg'
+    #   Numo::Linalg = Numo::TinyLinalg
+    #
+    #   require 'rumale/decomposition/sparse_pca'
+    #
+    #   decomposer = Rumale::Decomposition::SparsePCA.new(n_components: 2, reg_param: 0.1)
+    #   representation = decomposer.fit_transform(samples)
+    #   sparse_components = decomposer.components
+    #
+    # *Reference*
+    # - Mackey, L., "Deflation Methods for Sparse PCA," Advances in NIPS'08, pp. 1017--1024, 2008.
+    # - Hein, M. and Bühler, T., "An Inverse Power Method for Nonlinear Eigenproblems with Applications in 1-Spectral Clustering and Sparse PCA," Advances in NIPS'10, pp. 847--855, 2010.
+    class SparsePCA < ::Rumale::Base::Estimator
+      include ::Rumale::Base::Transformer
+      # Returns the principal components.
+      # @return [Numo::DFloat] (shape: [n_components, n_features])
+      attr_reader :components
+      # Returns the mean vector.
+      # @return [Numo::DFloat] (shape: [n_features])
+      attr_reader :mean
+      # Returns the random generator.
+      # @return [Random]
+      attr_reader :rng
+      # Create a new transformer with Sparse PCA.
+      #
+      # @param n_components [Integer] The number of principal components.
+      # @param reg_param [Float] The regularization parameter (interval: [0, 1]).
+      # @param max_iter [Integer] The maximum number of iterations.
+      # @param tol [Float] The tolerance of termination criterion.
+      # @param random_seed [Integer] The seed value used to initialize the random generator.
+      def initialize(n_components: 2, reg_param: 0.001, max_iter: 1000, tol: 1e-6, random_seed: nil)
+        super()
+        warn('reg_param should be in the interval [0, 1].') unless (0..1).cover?(reg_param)
+        @params = {
+          n_components: n_components,
+          reg_param: reg_param,
+          max_iter: max_iter,
+          tol: tol,
+          random_seed: random_seed || srand
+        }
+        @rng = Random.new(@params[:random_seed])
+      end
+      # Fit the model with given training data.
+      #
+      # @overload fit(x) -> SparsePCA
+      #   @param x [Numo::DFloat] (shape: [n_samples, n_features]) The training data to be used for fitting the model.
+      #   @return [SparsePCA] The learned transformer itself.
+      def fit(x, _y = nil)
+        x = ::Rumale::Validation.check_convert_sample_array(x)
+        # initialize some variables.
+        @components = Numo::DFloat.zeros(@params[:n_components], x.shape[1])
+        # centering.
+        @mean = x.mean(axis: 0)
+        centered_x = x - @mean
+        # optimization.
+        partial_fit(centered_x)
+        @components = @components[0, true].dup if @params[:n_components] == 1
+        self
+      end
+      # Fit the model with training data, and then transform them with the learned model.
+      #
+      # @overload fit_transform(x) -> Numo::DFloat
+      #   @param x [Numo::DFloat] (shape: [n_samples, n_features]) The training data to be used for fitting the model.
+      #   @return [Numo::DFloat] (shape: [n_samples, n_components]) The transformed data.
+      def fit_transform(x, _y = nil)
+        x = ::Rumale::Validation.check_convert_sample_array(x)
+        fit(x).transform(x)
+      end
+      # Transform the given data with the learned model.
+      #
+      # @param x [Numo::DFloat] (shape: [n_samples, n_features]) The data to be transformed with the learned model.
+      # @return [Numo::DFloat] (shape: [n_samples, n_components]) The transformed data.
+      def transform(x)
+        x = ::Rumale::Validation.check_convert_sample_array(x)
+        (x - @mean).dot(@components.transpose)
+      end
+      private
+      def partial_fit(x)
+        sub_rng = @rng.dup
+        n_samples, n_features = x.shape
+        cov_mat = x.transpose.dot(x) / n_samples
+        prj_mat = Numo::DFloat.eye(n_features)
+        @params[:n_components].times do |i|
+          f = ::Rumale::Utils.rand_normal(n_features, sub_rng)
+          xf = x.dot(f)
+          norm_xf = norm(xf, 2)
+          coeff = coeff_numerator(f).fdiv(norm_xf)
+          mu = cov_mat.dot(f) / norm_xf
+          @params[:max_iter].times do |_t|
+            g = sign(mu) * Numo::DFloat.maximum(coeff * mu.abs - @params[:reg_param], 0)
+            f = g / norm(x.dot(g), 2)
+            mu = cov_mat.dot(f) / norm(x.dot(f), 2)
+            coeff_new = coeff_numerator(f)
+            break if (coeff - coeff_new).abs.fdiv(coeff) < @params[:tol]
+            coeff = coeff_new
+          end
+          # deflation
+          q = prj_mat.dot(f)
+          qqt = Numo::DFloat.eye(n_features) - q.outer(q)
+          x = x.dot(qqt)
+          cov_mat = qqt.dot(cov_mat).dot(qqt)
+          prj_mat = prj_mat.dot(qqt)
+          f /= norm(f, 2)
+          @components[i, true] = f.dup
+        end
+      end
+      def coeff_numerator(f)
+        (1 - @params[:reg_param]) * norm(f, 2) + @params[:reg_param] * norm(f, 1)
+      end
+      def sign(v)
+        r = Numo::DFloat.zeros(v.size)
+        r[v.lt(0)] = -1
+        r[v.gt(0)] = 1
+        r
+      end
+      def norm(v, ord)
+        nrm = if defined?(Numo::Linalg)
+                Numo::Linalg.norm(v, ord)
+              elsif ord == 2
+                Math.sqrt(v.dot(v))
+              else
+                v.abs.sum
+              end
+        nrm.zero? ? 1.0 : nrm
+      end
+    end
+  end
+end

data/lib/rumale/decomposition/version.rb CHANGED Viewed

@@ -5,6 +5,6 @@ module Rumale
   # Module for matrix decomposition algorithms.
   module Decomposition
     # @!visibility private
-    VERSION = '0.28.0'
+    VERSION = '0.29.0'
   end
 end

data/lib/rumale/decomposition.rb CHANGED Viewed

@@ -6,4 +6,5 @@ require_relative 'decomposition/factor_analysis'
 require_relative 'decomposition/fast_ica'
 require_relative 'decomposition/nmf'
 require_relative 'decomposition/pca'
+require_relative 'decomposition/sparse_pca'
 require_relative 'decomposition/version'

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: rumale-decomposition
 version: !ruby/object:Gem::Version
-  version: 0.28.0
+  version: 0.29.0
 platform: ruby
 authors:
 - yoshoku
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2023-11-12 00:00:00.000000000 Z
+date: 2024-03-30 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: numo-narray
@@ -30,14 +30,14 @@ dependencies:
     requirements:
     - - "~>"
       - !ruby/object:Gem::Version
-        version: 0.28.0
+        version: 0.29.0
   type: :runtime
   prerelease: false
   version_requirements: !ruby/object:Gem::Requirement
     requirements:
     - - "~>"
       - !ruby/object:Gem::Version
-        version: 0.28.0
+        version: 0.29.0
 description: |
   Rumale::Decomposition provides matrix decomposition algorithms,
   such as Principal Component Analysis, Non-negative Matrix Factorization, Factor Analysis, and Independent Component Analysis,
@@ -55,6 +55,7 @@ files:
 - lib/rumale/decomposition/fast_ica.rb
 - lib/rumale/decomposition/nmf.rb
 - lib/rumale/decomposition/pca.rb
+- lib/rumale/decomposition/sparse_pca.rb
 - lib/rumale/decomposition/version.rb
 homepage: https://github.com/yoshoku/rumale
 licenses:
@@ -80,7 +81,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
     - !ruby/object:Gem::Version
       version: '0'
 requirements: []
-rubygems_version: 3.4.20
+rubygems_version: 3.5.7
 signing_key:
 specification_version: 4
 summary: Rumale::Decomposition provides matrix decomposition algorithms with Rumale