ruby-dnn 0.8.8 → 0.9.0
This diff shows the changes between publicly released versions of the package as they appear in their respective public registries. It is provided for informational purposes only.
- checksums.yaml +4 -4
- data/API-Reference.ja.md +83 -46
- data/examples/cifar10_example.rb +5 -5
- data/examples/mnist_conv2d_example.rb +5 -5
- data/examples/mnist_example.rb +5 -5
- data/examples/mnist_lstm_example.rb +5 -5
- data/examples/xor_example.rb +4 -3
- data/lib/dnn.rb +3 -3
- data/lib/dnn/core/activations.rb +1 -112
- data/lib/dnn/core/cnn_layers.rb +14 -14
- data/lib/dnn/core/dataset.rb +18 -0
- data/lib/dnn/core/initializers.rb +28 -8
- data/lib/dnn/core/layers.rb +62 -90
- data/lib/dnn/core/losses.rb +120 -0
- data/lib/dnn/core/model.rb +124 -66
- data/lib/dnn/core/rnn_layers.rb +17 -13
- data/lib/dnn/core/{util.rb → utils.rb} +10 -6
- data/lib/dnn/version.rb +1 -1
- metadata +5 -3
data/lib/dnn/core/losses.rb
ADDED

```diff
@@ -0,0 +1,120 @@
+module DNN
+  module Losses
+
+    class Loss
+      def forward(out, y)
+        raise NotImplementedError.new("Class '#{self.class.name}' has implement method 'forward'")
+      end
+
+      def backward(y)
+        raise NotImplementedError.new("Class '#{self.class.name}' has implement method 'backward'")
+      end
+
+      def regularize(layers)
+        layers.select { |layer| layer.is_a?(Connection) }
+              .reduce(0) { |sum, layer| sum + layer.lasso + layer.ridge }
+      end
+
+      def d_regularize(layers)
+        layers.select { |layer| layer.is_a?(Connection) }.each do |layer|
+          layer.d_lasso
+          layer.d_ridge
+        end
+      end
+
+      def to_hash
+        {class: self.class.name}
+      end
+    end
+
+    class MeanSquaredError < Loss
+      def forward(out, y)
+        @out = out
+        batch_size = y.shape[0]
+        0.5 * ((out - y)**2).sum / batch_size
+      end
+
+      def backward(y)
+        @out - y
+      end
+    end
+
+
+    class MeanAbsoluteError < Loss
+      def forward(out, y)
+        @out = out
+        batch_size = y.shape[0]
+        (out - y).abs.sum / batch_size
+      end
+
+      def backward(y)
+        dout = @out - y
+        dout[dout >= 0] = 1
+        dout[dout < 0] = -1
+        dout
+      end
+    end
+
+
+    class HuberLoss < Loss
+      def forward(out, y)
+        @out = out
+        loss = loss_l1(y)
+        loss = loss > 1 ? loss : loss_l2(y)
+        @loss = loss + regularize
+      end
+
+      def backward(y)
+        dout = @out - y
+        if @loss > 1
+          dout[dout >= 0] = 1
+          dout[dout < 0] = -1
+        end
+        dout
+      end
+
+      private
+
+      def loss_l1(y)
+        batch_size = y.shape[0]
+        (@out - y).abs.sum / batch_size
+      end
+
+      def loss_l2(y)
+        batch_size = y.shape[0]
+        0.5 * ((@out - y)**2).sum / batch_size
+      end
+    end
+
+
+    class SoftmaxCrossEntropy < Loss
+      NMath = Xumo::NMath
+
+      def forward(x, y)
+        @out = Utils.softmax(x)
+        batch_size = y.shape[0]
+        -(y * NMath.log(@out + 1e-7)).sum / batch_size
+      end
+
+      def backward(y)
+        @out - y
+      end
+    end
+
+
+    class SigmoidCrossEntropy < Loss
+      NMath = Xumo::NMath
+
+      def forward(x, y)
+        @out = Utils.sigmoid(x)
+        batch_size = y.shape[0]
+        -(y * NMath.log(@out + 1e-7) + (1 - y) * NMath.log(1 - @out + 1e-7)).sum / batch_size
+      end
+
+      def backward(y)
+        @out - y
+      end
+    end
+
+  end
+end
```
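The losses above are plain objects with a `forward`/`backward` contract, handed to `Model#compile` (see the model.rb changes below) instead of being baked into an output layer as in 0.8.8. A minimal sketch of a user-defined loss following that contract (the class `ScaledMSE` is hypothetical, not part of the gem):

```ruby
require "dnn"

# Hypothetical custom loss mirroring the MeanSquaredError pattern above.
class ScaledMSE < DNN::Losses::Loss
  def forward(out, y)
    @out = out                       # cache the output for backward
    ((out - y)**2).sum / y.shape[0]  # per-batch mean squared error
  end

  def backward(y)
    2 * (@out - y)                   # gradient w.r.t. the network output
  end
end
```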
data/lib/dnn/core/model.rb
CHANGED
```diff
@@ -1,3 +1,4 @@
+require "zlib"
 require "json"
 require "base64"
 
@@ -9,14 +10,19 @@ module DNN
     attr_accessor :trainable # Setting false prevents learning of parameters.
 
     def self.load(file_name)
-      Marshal.load(File.binread(file_name))
+      Marshal.load(Zlib::Inflate.inflate(File.binread(file_name)))
     end
 
     def self.load_json(json_str)
       hash = JSON.parse(json_str, symbolize_names: true)
+      model = self.load_hash(hash)
+      model.compile(Utils.load_hash(hash[:optimizer]), Utils.load_hash(hash[:loss]))
+      model
+    end
+
+    def self.load_hash(hash)
       model = self.new
-      model.layers = hash[:layers].map { |hash_layer|
-      model.compile(Util.load_hash(hash[:optimizer]))
+      model.layers = hash[:layers].map { |hash_layer| Utils.load_hash(hash_layer) }
       model
     end
 
@@ -24,15 +30,15 @@ module DNN
       @layers = []
       @trainable = true
       @optimizer = nil
-      @training = false
       @compiled = false
     end
 
     def load_json_params(json_str)
-
+      hash = JSON.parse(json_str, symbolize_names: true)
+      has_param_layers_params = hash[:params]
       has_param_layers_index = 0
-
-
+      has_param_layers = get_all_layers.select { |layer| layer.is_a?(Layers::HasParamLayer) }
+      has_param_layers.each do |layer|
         hash_params = has_param_layers_params[has_param_layers_index]
         hash_params.each do |key, (shape, base64_param)|
           bin = Base64.decode64(base64_param)
@@ -46,71 +52,100 @@ module DNN
         has_param_layers_index += 1
       end
     end
-
+
     def save(file_name)
-
+      bin = Zlib::Deflate.deflate(Marshal.dump(self))
       begin
-        File.binwrite(file_name,
+        File.binwrite(file_name, bin)
       rescue Errno::ENOENT => ex
         dir_name = file_name.match(%r`(.*)/.+$`)[1]
         Dir.mkdir(dir_name)
-        File.binwrite(file_name,
+        File.binwrite(file_name, bin)
       end
     end
 
     def to_json
-
-      hash =
+      hash = self.to_hash
+      hash[:version] = VERSION
       JSON.pretty_generate(hash)
     end
 
     def params_to_json
-      has_param_layers =
+      has_param_layers = get_all_layers.select { |layer| layer.is_a?(Layers::HasParamLayer) }
       has_param_layers_params = has_param_layers.map do |layer|
         layer.params.map { |key, param|
           base64_data = Base64.encode64(param.data.to_binary)
           [key, [param.data.shape, base64_data]]
         }.to_h
       end
-
+      hash = {version: VERSION, params: has_param_layers_params}
+      JSON.dump(hash)
     end
-
+
     def <<(layer)
-
-
+      # Due to a bug in saving nested models, temporarily prohibit model nesting.
+      # if !layer.is_a?(Layers::Layer) && !layer.is_a?(Model)
+      #   raise TypeError.new("layer is not an instance of the DNN::Layers::Layer class or DNN::Model class.")
+      # end
+      unless layer.is_a?(Layers::Layer)
+        raise TypeError.new("layer:#{layer.class.name} is not an instance of the DNN::Layers::Layer class.")
       end
       @layers << layer
       self
     end
-
-    def compile(optimizer)
+
+    def compile(optimizer, loss)
       unless optimizer.is_a?(Optimizers::Optimizer)
-        raise TypeError.new("optimizer is not an instance of
+        raise TypeError.new("optimizer:#{optimizer.class} is not an instance of DNN::Optimizers::Optimizer class.")
+      end
+      unless loss.is_a?(Losses::Loss)
+        raise TypeError.new("loss:#{loss.class} is not an instance of DNN::Losses::Loss class.")
       end
       @compiled = true
       layers_check
       @optimizer = optimizer
+      @loss = loss
       build
       layers_shape_check
     end
 
     def build(super_model = nil)
       @super_model = super_model
-
-
+      shape = if super_model
+        super_model.output_shape
+      else
+        @layers.first.build
+      end
+      @layers[1..-1].each do |layer|
+        if layer.is_a?(Model)
+          layer.build(self)
+        else
+          layer.build(shape)
+        end
+        shape = layer.output_shape
       end
     end
 
+    def input_shape
+      @layers.first.input_shape
+    end
+
+    def output_shape
+      @layers.last.output_shape
+    end
+
     def optimizer
+      raise DNN_Error.new("The model is not compiled.") unless compiled?
       @optimizer ? @optimizer : @super_model.optimizer
     end
 
-    def
-
+    def loss
+      raise DNN_Error.new("The model is not compiled.") unless compiled?
+      @loss ? @loss : @super_model.loss
    end
 
-    def
-      @
+    def compiled?
+      @compiled
     end
 
     def train(x, y, epochs,
```
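`save` now writes zlib-deflated Marshal data and `load` inflates it first, so model files written by 0.8.8 cannot be read back by 0.9.0 without re-saving. The byte-level round trip is plain Ruby stdlib; a standalone sketch (the hash stands in for any Marshal-able object):

```ruby
require "zlib"

model = { weights: [1.0, 2.0] }  # placeholder for a Marshal-able object

# What Model#save does now: deflate the marshalled bytes before writing.
File.binwrite("model.dat", Zlib::Deflate.deflate(Marshal.dump(model)))

# What Model.load does now: inflate before unmarshalling.
restored = Marshal.load(Zlib::Inflate.inflate(File.binread("model.dat")))
```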
```diff
@@ -122,29 +157,31 @@ module DNN
       unless compiled?
         raise DNN_Error.new("The model is not compiled.")
       end
-
+      check_xy_type(x, y)
+      dataset = Dataset.new(x, y)
+      num_train_datas = x.shape[0]
       (1..epochs).each do |epoch|
         puts "【 epoch #{epoch}/#{epochs} 】" if verbose
-        (
-          x_batch, y_batch =
+        (num_train_datas.to_f / batch_size).ceil.times do |index|
+          x_batch, y_batch = dataset.get_batch(batch_size)
           loss = train_on_batch(x_batch, y_batch, &batch_proc)
           if loss.nan?
             puts "\nloss is nan" if verbose
             return
           end
-
-
+          num_trained_datas = (index + 1) * batch_size
+          num_trained_datas = num_trained_datas > num_train_datas ? num_train_datas : num_trained_datas
           log = "\r"
           40.times do |i|
-            if i <
+            if i < num_trained_datas * 40 / num_train_datas
               log << "="
-            elsif i ==
+            elsif i == num_trained_datas * 40 / num_train_datas
               log << ">"
             else
               log << "_"
             end
           end
-          log << " #{
+          log << " #{num_trained_datas}/#{num_train_datas} loss: #{sprintf('%.8f', loss)}"
           print log if verbose
         end
         if verbose && test
```
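The epoch loop now draws batches from the new `Dataset` class and sizes the 40-column progress bar with integer arithmetic over the trained-sample count. A worked sketch of that arithmetic with hypothetical numbers:

```ruby
# Hypothetical numbers; mirrors the loop arithmetic above.
num_train_datas = 50_000
batch_size = 100

iterations = (num_train_datas.to_f / batch_size).ceil  # => 500 batches per epoch

index = 249                                            # the 250th batch just finished
num_trained_datas = (index + 1) * batch_size           # => 25_000
filled = num_trained_datas * 40 / num_train_datas      # => 20 of 40 bar columns
```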
```diff
@@ -157,17 +194,20 @@ module DNN
    end
 
     def train_on_batch(x, y, &batch_proc)
+      check_xy_type(x, y)
       input_data_shape_check(x, y)
       x, y = batch_proc.call(x, y) if batch_proc
-      forward(x, true)
-      loss_value = loss(y)
-      backward(y)
-
+      out = forward(x, true)
+      loss_value = @loss.forward(out, y) + @loss.regularize(get_all_layers)
+      dout = @loss.backward(y)
+      backward(dout, true)
+      @loss.d_regularize(get_all_layers)
       update
       loss_value
     end
 
     def accurate(x, y, batch_size = 100, &batch_proc)
+      check_xy_type(x, y)
       input_data_shape_check(x, y)
       batch_size = batch_size >= x.shape[0] ? x.shape[0] : batch_size
       correct = 0
```
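`train_on_batch` now makes the loss object an explicit participant in the step: `forward` returns the raw output, the loss object produces the scalar value (plus lasso/ridge regularization over `Connection` layers) and the initial gradient, and `backward` propagates that gradient. A usage sketch, assuming `model` is already compiled (the shapes are made up):

```ruby
# Hypothetical shapes: 32 samples of 784 features, 10 classes.
x_batch = Xumo::SFloat.new(32, 784).rand
y_batch = Xumo::SFloat.zeros(32, 10)

loss_value = model.train_on_batch(x_batch, y_batch)
puts format("batch loss: %.8f", loss_value)
```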
```diff
@@ -183,7 +223,7 @@ module DNN
         x_batch, y_batch = batch_proc.call(x_batch, y_batch) if batch_proc
         out = forward(x_batch, false)
         batch_size.times do |j|
-          if @layers
+          if @layers.last.output_shape == [1]
             correct += 1 if out[j, 0].round == y_batch[j, 0].round
           else
             correct += 1 if out[j, true].max_index == y_batch[j, true].max_index
@@ -194,11 +234,13 @@ module DNN
    end
 
     def predict(x)
+      check_xy_type(x)
       input_data_shape_check(x)
       forward(x, false)
     end
 
     def predict1(x)
+      check_xy_type(x)
       predict(Xumo::SFloat.cast([x]))[0, false]
     end
 
@@ -222,37 +264,36 @@ module DNN
       }.flatten
     end
 
-    def forward(x,
-      @training = training
+    def forward(x, learning_phase)
       @layers.each do |layer|
-        x = if layer.is_a?(Layers::
+        x = if layer.is_a?(Layers::Dropout) || layer.is_a?(Layers::BatchNormalization) || layer.is_a?(Model)
+          layer.forward(x, learning_phase)
+        else
           layer.forward(x)
-        elsif layer.is_a?(Model)
-          layer.forward(x, training)
         end
       end
       x
     end
-
-    def loss(y)
-      @layers[-1].loss(y)
-    end
-
-    def dloss
-      @layers[-1].dloss
-    end
 
-    def backward(
-      dout = y
+    def backward(dout, learning_phase)
       @layers.reverse.each do |layer|
-
+        if layer.is_a?(Layers::Dropout) || layer.is_a?(Layers::BatchNormalization) || layer.is_a?(Model)
+          dout = layer.backward(dout, learning_phase)
+        else
+          dout = layer.backward(dout)
+        end
       end
       dout
     end
 
     def update
+      return unless @trainable
       @layers.each do |layer|
-
+        if layer.is_a?(Layers::HasParamLayer)
+          layer.update(@optimizer)
+        elsif layer.is_a?(Model)
+          layer.update
+        end
       end
     end
 
```
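`forward` and `backward` take an explicit `learning_phase` flag in place of the removed `@training` state, and only `Dropout`, `BatchNormalization`, and nested `Model` layers receive it. A sketch of the practical effect, assuming `model` contains a `Dropout` layer:

```ruby
x = Xumo::SFloat.new(8, 64).rand      # made-up input batch

# predict calls forward(x, false); train_on_batch calls forward(x, true).
train_out = model.forward(x, true)    # learning phase: dropout masks units
infer_out = model.forward(x, false)   # inference: dropout passes through
```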
```diff
@@ -270,33 +311,35 @@ module DNN
       if prev_layer.is_a?(Layers::Layer)
         prev_layer
       elsif prev_layer.is_a?(Model)
-        prev_layer.layers
+        prev_layer.layers.last
       end
     end
 
+    def to_hash
+      hash_layers = @layers.map { |layer| layer.to_hash }
+      {class: Model.name, layers: hash_layers, optimizer: @optimizer.to_hash, loss: @loss.to_hash}
+    end
+
     private
 
     def layers_check
       unless @layers.first.is_a?(Layers::InputLayer)
         raise TypeError.new("The first layer is not an InputLayer.")
       end
-      unless @layers.last.is_a?(Layers::OutputLayer)
-        raise TypeError.new("The last layer is not an OutputLayer.")
-      end
     end
 
     def input_data_shape_check(x, y = nil)
-      unless @layers.first.
-        raise DNN_ShapeError.new("The shape of x does not match the input shape. x shape is #{x.shape[1..-1]}, but input shape is #{@layers.first.
+      unless @layers.first.input_shape == x.shape[1..-1]
+        raise DNN_ShapeError.new("The shape of x does not match the input shape. x shape is #{x.shape[1..-1]}, but input shape is #{@layers.first.input_shape}.")
       end
-      if y && @layers.last.
-        raise DNN_ShapeError.new("The shape of y does not match the input shape. y shape is #{y.shape[1..-1]}, but output shape is #{@layers.last.
+      if y && @layers.last.output_shape != y.shape[1..-1]
+        raise DNN_ShapeError.new("The shape of y does not match the input shape. y shape is #{y.shape[1..-1]}, but output shape is #{@layers.last.output_shape}.")
       end
     end
 
     def layers_shape_check
       @layers.each.with_index do |layer, i|
-        prev_shape = layer.
+        prev_shape = layer.input_shape
         if layer.is_a?(Layers::Dense)
           if prev_shape.length != 1
             raise DNN_ShapeError.new("layer index(#{i}) Dense: The shape of the previous layer is #{prev_shape}. The shape of the previous layer must be 1 dimensional.")
```
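Since `to_hash` now embeds the optimizer and loss, `Model.load_json` can hand back an already-compiled model; weights still travel separately through `params_to_json`/`load_json_params`. A round-trip sketch, assuming `model` is compiled:

```ruby
json = model.to_json                # structure: :version, :layers, :optimizer, :loss
params_json = model.params_to_json  # weights, Base64-encoded per layer

restored = DNN::Model.load_json(json)   # rebuilt and compiled in one call
restored.load_json_params(params_json)  # weights restored afterwards
```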
```diff
@@ -313,6 +356,21 @@ module DNN
        end
      end
    end
+
+    def check_xy_type(x, y = nil)
+      unless x.is_a?(Xumo::SFloat)
+        raise TypeError.new("x:#{x.class.name} is not an instance of #{Xumo::SFloat.name} class.")
+      end
+      if y && !y.is_a?(Xumo::SFloat)
+        raise TypeError.new("y:#{y.class.name} is not an instance of #{Xumo::SFloat.name} class.")
+      end
+    end
+
+    def type_check(var_name, var, type)
+      unless var.is_a?(type)
+        raise TypeError.new("#{var_name}:#{var.class} is not an instance of #{type} class.")
+      end
+    end
   end
 
 end
```
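With `check_xy_type` in place, `train`/`train_on_batch`/`accurate`/`predict` reject anything that is not an `Xumo::SFloat` up front instead of failing inside a layer. Casting input data first avoids the `TypeError`; a sketch, where `raw_x`/`raw_y` and the `batch_size:` keyword are assumptions (the keyword arguments of `train` are truncated in the hunk above):

```ruby
# raw_x / raw_y: hypothetical integer arrays, e.g. parsed from CSV.
x = Xumo::SFloat.cast(raw_x)  # the same cast predict1 applies internally
y = Xumo::SFloat.cast(raw_y)
model.train(x, y, 10, batch_size: 100)  # batch_size keyword assumed
```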