red-chainer 0.3.2 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +2 -2
- data/.travis.yml +8 -3
- data/.yardopts +1 -0
- data/Gemfile +6 -1
- data/README.md +34 -3
- data/examples/cifar/train_cifar.rb +13 -2
- data/examples/iris/iris.rb +9 -5
- data/examples/mnist/mnist.rb +16 -4
- data/lib/chainer.rb +17 -1
- data/lib/chainer/backend.rb +27 -0
- data/lib/chainer/cuda.rb +37 -15
- data/lib/chainer/dataset/convert.rb +20 -16
- data/lib/chainer/datasets/cifar.rb +8 -6
- data/lib/chainer/datasets/mnist.rb +14 -55
- data/lib/chainer/device.rb +88 -0
- data/lib/chainer/function.rb +103 -41
- data/lib/chainer/function_node.rb +454 -0
- data/lib/chainer/functions/activation/leaky_relu.rb +38 -13
- data/lib/chainer/functions/activation/log_softmax.rb +46 -9
- data/lib/chainer/functions/activation/relu.rb +8 -8
- data/lib/chainer/functions/activation/relu_grad2.rb +34 -0
- data/lib/chainer/functions/activation/sigmoid.rb +13 -11
- data/lib/chainer/functions/activation/sigmoid_grad.rb +25 -0
- data/lib/chainer/functions/activation/tanh.rb +48 -11
- data/lib/chainer/functions/array/broadcast_to.rb +56 -0
- data/lib/chainer/functions/array/cast.rb +41 -0
- data/lib/chainer/functions/array/reshape.rb +28 -0
- data/lib/chainer/functions/array/rollaxis.rb +57 -0
- data/lib/chainer/functions/array/select_item.rb +72 -0
- data/lib/chainer/functions/array/squeeze.rb +78 -0
- data/lib/chainer/functions/array/transpose.rb +44 -0
- data/lib/chainer/functions/connection/convolution_2d.rb +43 -26
- data/lib/chainer/functions/connection/convolution_2d_grad_w.rb +48 -0
- data/lib/chainer/functions/connection/deconvolution_2d.rb +159 -0
- data/lib/chainer/functions/connection/linear.rb +29 -22
- data/lib/chainer/functions/evaluation/accuracy.rb +5 -5
- data/lib/chainer/functions/loss/mean_squared_error.rb +21 -12
- data/lib/chainer/functions/loss/softmax_cross_entropy.rb +98 -71
- data/lib/chainer/functions/math/basic_math.rb +36 -30
- data/lib/chainer/functions/math/exp.rb +28 -0
- data/lib/chainer/functions/math/identity.rb +4 -3
- data/lib/chainer/functions/math/sum.rb +52 -0
- data/lib/chainer/functions/noise/dropout.rb +20 -4
- data/lib/chainer/functions/normalization/batch_normalization.rb +257 -104
- data/lib/chainer/functions/pooling/average_pooling_2d.rb +29 -6
- data/lib/chainer/functions/pooling/max_pooling_2d.rb +67 -12
- data/lib/chainer/functions/pooling/pooling_2d.rb +6 -4
- data/lib/chainer/gradient_check.rb +157 -73
- data/lib/chainer/gradient_method.rb +3 -2
- data/lib/chainer/initializers/init.rb +5 -5
- data/lib/chainer/initializers/normal.rb +4 -2
- data/lib/chainer/initializers/uniform.rb +15 -0
- data/lib/chainer/iterators/serial_iterator.rb +5 -3
- data/lib/chainer/link.rb +4 -2
- data/lib/chainer/links/connection/convolution_2d.rb +2 -2
- data/lib/chainer/links/model/classifier.rb +24 -5
- data/lib/chainer/links/normalization/batch_normalization.rb +7 -10
- data/lib/chainer/optimizer.rb +42 -11
- data/lib/chainer/optimizers/adam.rb +3 -2
- data/lib/chainer/optimizers/momentum_sgd.rb +1 -1
- data/lib/chainer/parameter.rb +7 -6
- data/lib/chainer/serializer.rb +4 -4
- data/lib/chainer/serializers/marshal.rb +10 -8
- data/lib/chainer/testing/array.rb +1 -1
- data/lib/chainer/training/extensions/evaluator.rb +2 -3
- data/lib/chainer/training/extensions/exponential_shift.rb +1 -1
- data/lib/chainer/training/extensions/progress_bar.rb +1 -0
- data/lib/chainer/training/trainer.rb +4 -9
- data/lib/chainer/training/triggers/interval.rb +7 -2
- data/lib/chainer/utils/array.rb +80 -1
- data/lib/chainer/utils/conv.rb +10 -2
- data/lib/chainer/utils/initializer.rb +2 -2
- data/lib/chainer/variable.rb +159 -69
- data/lib/chainer/variable_node.rb +64 -10
- data/lib/chainer/version.rb +1 -1
- data/red-chainer.gemspec +4 -3
- data/templates/default/layout/html/layout.erb +40 -0
- data/templates/default/onefile/html/layout.erb +33 -0
- metadata +44 -11
- data/lib/chainer/dataset/download.rb +0 -56
data/lib/chainer/datasets/cifar.rb
CHANGED
@@ -11,7 +11,7 @@ module Chainer
      get_cifar(100, with_label, ndim, scale)
    end

-    def self.get_cifar(n_classes, with_label, ndim, scale)
+    def self.get_cifar(n_classes, with_label, ndim, scale, device: Chainer::Device.default)
      train_table = ::Datasets::CIFAR.new(n_classes: n_classes, type: :train).to_table
      test_table = ::Datasets::CIFAR.new(n_classes: n_classes, type: :test).to_table

@@ -25,13 +25,14 @@ module Chainer
        test_labels = test_table[:fine_label]
      end

+      xm = device.xm
      [
-        preprocess_cifar(Numo::UInt8[*train_data], Numo::UInt8[*train_labels], with_label, ndim, scale),
-        preprocess_cifar(Numo::UInt8[*test_data], Numo::UInt8[*test_labels], with_label, ndim, scale)
+        preprocess_cifar(xm::UInt8[*train_data], xm::UInt8[*train_labels], with_label, ndim, scale),
+        preprocess_cifar(xm::UInt8[*test_data], xm::UInt8[*test_labels], with_label, ndim, scale)
      ]
    end

-    def self.preprocess_cifar(images, labels, withlabel, ndim, scale)
+    def self.preprocess_cifar(images, labels, withlabel, ndim, scale, device: Chainer::Device.default)
      if ndim == 1
        images = images.reshape(images.shape[0], 3072)
      elsif ndim == 3
@@ -39,11 +40,12 @@ module Chainer
      else
        raise 'invalid ndim for CIFAR dataset'
      end
-      images = images.cast_to(Numo::SFloat)
+      xm = device.xm
+      images = images.cast_to(xm::SFloat)
      images *= scale / 255.0

      if withlabel
-        labels = labels.cast_to(Numo::Int32)
+        labels = labels.cast_to(xm::Int32)
        TupleDataset.new(images, labels)
      else
        images
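For orientation, here is a hedged usage sketch (not part of the diff): it assumes `Chainer::Datasets::CIFAR.get_cifar10`/`get_cifar100` are the public wrappers around the `get_cifar(...)` call visible in the hunk above, which the hunk itself does not show.

```ruby
# Hedged sketch only. With the default CpuDevice, device.xm resolves to Numo,
# so preprocess_cifar hands back Numo::SFloat images scaled to [0, 1] and
# Numo::Int32 labels, exactly as the casts above describe.
require 'chainer'

train, test = Chainer::Datasets::CIFAR.get_cifar10   # wrapper name assumed
```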
data/lib/chainer/datasets/mnist.rb
CHANGED
@@ -1,13 +1,17 @@
-require 'zlib'
+require 'datasets'

 module Chainer
   module Datasets
-    module Mnist
-      def self.get_mnist(withlabel: true, ndim: 1, scale: 1.0, dtype: Numo::SFloat, label_dtype: Numo::Int32)
-        train_raw = retrieve_mnist_training
+    module MNIST
+      def self.get_mnist(withlabel: true, ndim: 1, scale: 1.0, dtype: nil, label_dtype: nil)
+        xm = Chainer::Device.default.xm
+        dtype ||= xm::SFloat
+        label_dtype ||= xm::Int32
+
+        train_raw = retrieve_mnist(type: :train)
         train = preprocess_mnist(train_raw, withlabel, ndim, scale, dtype, label_dtype)

-        test_raw = retrieve_mnist_test
+        test_raw = retrieve_mnist(type: :test)
         test = preprocess_mnist(test_raw, withlabel, ndim, scale, dtype, label_dtype)
         [train, test]
       end
@@ -24,7 +28,7 @@ module Chainer

         images = images.cast_to(image_dtype)
         images *= scale / 255.0
-
+
         if withlabel
           labels = raw[:y].cast_to(label_dtype)
           TupleDataset.new(images, labels)
@@ -33,56 +37,11 @@ module Chainer
        end
      end

-      def self.retrieve_mnist_training
-        urls = ['http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz',
-                'http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz']
-        retrieve_mnist('train.npz', urls)
-      end
-
-      def self.retrieve_mnist_test
-        urls = ['http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz',
-                'http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz']
-        retrieve_mnist('test.npz', urls)
-      end
-
-      def self.retrieve_mnist(name, urls)
-        root = Chainer::Dataset::Download.get_dataset_directory('pfnet/chainer/mnist')
-        path = File.expand_path(name, root)
-        Chainer::Dataset::Download.cache_or_load_file(path) do
-          make_npz(path, urls)
-        end
-      end
-
-      def self.make_npz(path, urls)
-        x_url, y_url = urls
-        x_path = Chainer::Dataset::Download.cached_download(x_url)
-        y_path = Chainer::Dataset::Download.cached_download(y_url)
-
-        x = nil
-        y = nil
-
-        Zlib::GzipReader.open(x_path) do |fx|
-          Zlib::GzipReader.open(y_path) do |fy|
-            fx.read(4)
-            fy.read(4)
-
-            n = fx.read(4).unpack('i>')[0]
-            fy.read(4)
-            fx.read(8)
-
-            x = Numo::UInt8.new(n, 784).rand(n)
-            y = Numo::UInt8.new(n).rand(n)
-
-            n.times do |i|
-              y[i] = fy.read(1).ord
-              784.times do |j|
-                x[i, j] = fx.read(1).ord
-              end
-            end
-          end
-        end
+      def self.retrieve_mnist(type:)
+        train_table = ::Datasets::MNIST.new(type: type).to_table

-        { x: x, y: y }
+        xm = Chainer::Device.default.xm
+        { x: xm::UInt8[*train_table[:pixels]], y: xm::UInt8[*train_table[:label]] }
      end
    end
  end
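A short sketch of what the new defaults mean for callers: with no explicit `dtype`, the arrays follow the default device's array module. The GPU variant assumes a working Cumo/CUDA install, which is not exercised by this diff.

```ruby
# Hedged sketch. On the default CpuDevice, dtype ||= xm::SFloat resolves to
# Numo::SFloat and label_dtype to Numo::Int32, so the call behaves as before.
require 'chainer'

train, test = Chainer::Datasets::MNIST.get_mnist(ndim: 1)

# Switching the default device first (GPU-only, illustrative) would make the
# same call return Cumo arrays instead, because xm resolves to Cumo:
#   Chainer::Device.change_default(0)
#   train_gpu, _ = Chainer::Datasets::MNIST.get_mnist(ndim: 1)
```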
data/lib/chainer/device.rb
@@ -0,0 +1,88 @@
+module Chainer
+  module Device
+    # Creates device
+    #
+    # @param [Integer or Chainer::AbstractDevice] device_spec Device specifier.
+    #   Negative integer indicates CPU. 0 or positive integer indicates GPU.
+    #   If a device object is given, itself is returned.
+    # @return [Chainer::AbstractDevice] device object
+    def create(device_spec)
+      return device_spec if device_spec.kind_of?(AbstractDevice)
+      if device_spec.kind_of?(Integer)
+        return CpuDevice.new if device_spec < 0
+        return GpuDevice.new(device_spec)
+      end
+      raise "Invalid device_spec: #{device_spec}"
+    end
+    module_function :create
+
+    # Changes default device
+    #
+    # @param [Object] device_spec
+    # @see Chainer::Device.create
+    def change_default(device_spec)
+      @default = create(device_spec)
+      @default.use
+    end
+    module_function :change_default
+
+    # Gets default device
+    #
+    # @return [Chainer::AbstractDevice] the default device.
+    def default
+      @default ||= CpuDevice.new
+    end
+    module_function :default
+
+    # TODO(sonots): Add Device.from_array after Cumo provides an API
+    # to return GPU device ID from Cumo::NArray.
+  end
+
+  class AbstractDevice
+    def xm
+      raise NotImplementedError
+    end
+
+    def use
+    end
+  end
+
+  class CpuDevice < AbstractDevice
+    def xm
+      Numo
+    end
+
+    def ==(other)
+      return false unless other.is_a?(CpuDevice)
+      true
+    end
+  end
+
+  class GpuDevice < AbstractDevice
+    attr_reader :id
+
+    # @param [Integer] id GPU Device ID. If not given, CUDA current device id is used.
+    def initialize(id = nil)
+      Chainer::CUDA.check_available
+      id ||= Cumo::CUDA::Runtime.cudaGetDevice
+      if id < 0
+        raise 'GPU Device ID must not be negative'
+      end
+      @id = id
+    end
+
+    def xm
+      Cumo
+    end
+
+    def ==(other)
+      return false unless other.is_a?(GpuDevice)
+      id == other.id
+    end
+
+    # Sets CUDA current device with owned GPU Device ID
+    def use
+      Cumo::CUDA::Runtime.cudaSetDevice(@id)
+    end
+  end
+end
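A minimal sketch of the device API this new file introduces, CPU path only (the GPU branch additionally needs CUDA and the cumo gem):

```ruby
require 'chainer'

device = Chainer::Device.create(-1)      # negative integer => CpuDevice
Chainer::Device.change_default(device)   # also accepts the integer spec directly

xm = Chainer::Device.default.xm          # => Numo on CPU, Cumo on a GpuDevice
x  = xm::SFloat.new(2, 3).rand           # backend-agnostic array construction
```

This `device.xm` indirection is what the dataset and function changes elsewhere in the release rely on to stay backend-agnostic.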
data/lib/chainer/function.rb
CHANGED
@@ -1,70 +1,89 @@
+require 'chainer/function_node'
 module Chainer
   class Function

     attr_reader :rank, :inputs, :outputs, :retain_after_backward
-    attr_accessor :output_data
+    attr_accessor :output_data, :owned_node

     def initialize
       @rank = 0
     end

     def call(*inputs)
-
-      if x.kind_of?(Chainer::Variable)
-        x
-      else
-        Variable.new(x, requires_grad: false)
-      end
-    end
+      node = self.node

-
-
+      node.function = self
+      node.weak_function = nil
+      @node = WeakRef.new(node)
+      @owned_node = nil

-
-      @output_indexes_to_retain = nil
-      outputs = forward(in_data)
-      raise if !outputs.is_a? Array
+      ret = node.apply(inputs)

-      ret
-
-    end
+      ret.size == 1 ? ret[0] : ret
+    end

-
-
+    def inputs
+      @node.inputs
+    end

-
+    def outputs
+      @node.outputs
+    end

-
-
+    def node
+      noderef = @node
+      nd = noderef ? noderef.__getobj__ : @owned_node
+      return nd if nd

-
-
-
-
-      remove_instance_variable(:@input_indexes_to_retain)
+      nd = FunctionAdapter.new(self)
+      @owned_node = nd
+      nd
+    end

-
-
-
-    end
-      remove_instance_variable(:@output_indexes_to_retain)
-    end
-  end
+    def output_data
+      node.output_data
+    end

-
+    def rank
+      @node.rank
+    end
+
+    def label
+      self.class.to_s
     end

     def forward(inputs)
-
-
+      xm = Chainer.get_array_module(*inputs)
+      if xm == Cumo
+        forward_gpu(inputs)
+      else
+        forward_cpu(inputs)
+      end
     end

     def forward_cpu(inputs)
       raise NotImplementedError
     end

+    def forward_gpu(inputs)
+      raise NotImplementedError
+    end
+
     def backward(inputs, grad_outputs)
-
+      xm = Chainer.get_array_module(*(inputs + grad_outputs))
+      if xm == Cumo
+        backward_gpu(inputs, grad_outputs)
+      else
+        backward_cpu(inputs, grad_outputs)
+      end
+    end
+
+    def backward_cpu(inputs, grad_outputs)
+      return [nil] * inputs.size
+    end
+
+    def backward_gpu(inputs, grad_outputs)
+      return [nil] * inputs.size
     end

     def retain_inputs(indexes)
@@ -72,10 +91,53 @@ module Chainer
     end

     def retain_outputs(indexes, retain_after_backward: false)
-
-
-
+      node.retain_outputs(indexes)
+    end
+  end
+
+  class FunctionAdapter < ::Chainer::FunctionNode
+    attr_accessor :function, :weak_function
+
+    def initialize(function)
+      super()
+      @weak_function = WeakRef.new(function)
+      function.owned_node = self
+    end
+
+    def function
+      func = @function
+      return func if func
+
+      weak_func = @weak_function
+      weak_func.__getobj__
+    end
+
+    def label
+      @function.label
+    end
+
+    def forward(inputs)
+      retain_inputs(inputs.size.times.to_a)
+      @function.forward(inputs)
+    end
+
+    def backward(target_input_indexes, grad_outputs)
+      in_data = @inputs.map { |input| input.data }
+      grad_out_data = grad_outputs.map { |grad| grad.nil? ? nil : grad.data }
+
+      gxs = @function.backward(in_data, grad_out_data)
+      ret = []
+      target_input_indexes.each do |i|
+        if gxs[i].nil?
+          g = nil
+        else
+          g = Chainer::Variable.new(gxs[i])
+          g.node.old_style_grad_generator = @function.label
+        end
+        ret << g
       end
+
+      ret
     end
   end
 end
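To make the reworked base class concrete, here is an illustrative sketch: `Square` is a hypothetical Function subclass (not part of red-chainer). User code keeps overriding `forward_cpu`/`backward_cpu` (and optionally the `*_gpu` variants), while `Function#call` now wraps everything in a `FunctionAdapter`, the `FunctionNode` shown in the second hunk, and delegates graph bookkeeping to `apply`.

```ruby
# Illustrative only; assumes the usual red-chainer Variable API (grad=, backward).
require 'chainer'

class Square < Chainer::Function
  def forward_cpu(inputs)
    x, = inputs
    [x * x]                     # outputs must be returned as an Array
  end

  def backward_cpu(inputs, grad_outputs)
    x,  = inputs                # FunctionAdapter#forward retains all inputs
    gy, = grad_outputs
    [x * 2 * gy]                # d/dx x^2 = 2x
  end
end

x = Chainer::Variable.new(Numo::SFloat[1, 2, 3])
y = Square.new.(x)              # Function#call -> node.apply(inputs)
y.grad = Numo::SFloat.ones(3)
y.backward
p x.grad                        # => 2, 4, 6 (Numo::SFloat), computed via backward_cpu
```

Because `Chainer.get_array_module` picks the backend from the inputs, the same subclass would route through `forward_gpu`/`backward_gpu` when fed Cumo arrays.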
data/lib/chainer/function_node.rb
@@ -0,0 +1,454 @@
+# Function node of the computational graph.
+# FunctionNode is a class representing a node in a computational graph.
+# The node corresponds to an application of a differentiable function to input variables.
+# When a differentiable function is applied to `Chainer::Variable` objects,
+# it creates an instance of FunctionNode implementation and calls its `apply` method.
+# The `apply` method basically does the following three things.
+#   1. Adding an edge from the function node to the variable node corresponding to each input.
+#      The node of each input is extracted by `Chainer::`Variable.node`.
+#   2. Computing the output arrays of the function.
+#   3. Creating a :class:`Variable` object for each output array and
+#      adding an edge from the node of the variable to the function node.
+# The output variables are then returned.
+module Chainer
+  class FunctionNode
+    attr_accessor :rank, :inputs, :outputs
+
+    def initialize
+      @rank = 0
+      @inputs = nil
+      @outputs = nil
+
+      @retained_output_data = nil
+      @input_indexes_to_retain = nil
+      @output_indexes_to_retain = nil
+    end
+
+    # Short text that represents the function.
+    #
+    # The default implementation returns its type name.
+    # Each function should override it to give more information.
+    def label
+      self.class.name
+    end
+
+    # A tuple of the retained output arrays.
+    # This property is mainly used by $Function$. Users basically do
+    # not have to use this property; use $get_retained_outputs$ instead.
+    def output_data
+      raise RuntimeError, 'retained output data is gone' if @retained_output_data.nil?
+      out_data = [nil] * @outputs.size
+      @output_indexes_to_retain.zip(@retained_output_data).each do |index, data|
+        out_data[index] = data
+      end
+      out_data
+    end
+
+    # Computes output variables and grows the computational graph.
+    #
+    # Basic behavior is expressed in the documentation of `FunctionNode`.
+    # @param [Chainer::Variable, Numo::NArray] inputs If the element is an Numo::NArray,
+    #   it is automatically wrapped with `Chainer::Variable`.
+    # @return [Array<Chainer::Variable>] A tuple of output `Chainer::Variable` objectts.
+    def apply(inputs)
+      input_vars = inputs.map { |x| Chainer::Variable.as_variable(x) }
+      in_data = input_vars.map(&:data)
+      requires_grad = input_vars.map(&:requires_grad).any?
+
+      # Forward propagation
+      @input_indexes_to_retain = nil
+      @output_indexes_to_retain = nil
+      outputs = forward(in_data)
+      raise TypeError, "#{outputs.class} not Array" unless outputs.is_a?(Array)
+
+      ret = outputs.map { |y| Chainer::Variable.new(y, requires_grad: requires_grad) }
+
+      if Chainer.configuration.enable_backprop
+        # Topological ordering
+        @rank = input_vars.size > 0 ? input_vars.map(&:rank).max : 0
+
+        # Add backward edges
+        ret.each { |y| y.creator_node = self }
+        @inputs = input_vars.map(&:node)
+        # Add forward edges (must be weak references)
+        @outputs = ret.map { |y| WeakRef.new(y.node) }
+
+        unless @input_indexes_to_retain.nil?
+          @input_indexes_to_retain.each do |index|
+            input_vars[index].retain_data
+          end
+        end
+
+        unless @output_indexes_to_retain.nil?
+          retained_data = []
+          @output_indexes_to_retain.each do |index|
+            ret[index].retain_data
+            retained_data << outputs[index]
+          end
+          @retained_output_data = Array(retained_data)
+        end
+      end
+
+      ret
+    end
+
+    # Computes the output arrays from the input arrays.
+    #
+    # @param [Array] inputs input array(s)
+    # @return [Array] output array(s)
+    def forward(inputs)
+      raise TypeError, "mustt inputs > 0, inputs size is #{inputs.size}" if inputs.size.zero?
+      # TODO GPU
+      forward_cpu(inputs)
+    end
+
+    # Computes the output arrays from the input Numo::NArray.
+    #
+    # @param [Array<Numo::NArray>] inputs Numo::NArray objects.
+    # @return [Array<Numo::NArray>] Array of output arrays.
+    def forward_cpu(inputs)
+      raise NotImplementedError
+    end
+
+    # Lets specified input variable nodes keep data arrays.
+    #
+    # By calling this method from `forward`, the function node can specify which inputs are required for backprop.
+    # The input variables with retained arrays can be obtained by `get_retained_inputs` from `backward`.
+    #
+    # Note that **this method must not be called from the outside of forward method.**
+    # @param [Integer, Array] indexes Indexes of input variables that the function does not require for backprop.
+    def retain_inputs(indexes)
+      @input_indexes_to_retain = indexes
+    end
+
+    # Lets specified output variable nodes keep data arrays.
+    #
+    # By calling this method from `forward`, the function node can specify which outputs are required for backprop.
+    # If this method is not called, any output variables are not marked to keep the data array at the point of returning from `apply`.
+    # The output variables with retained arrays can be obtained by `get_retained_outputs` from `backward`.
+    # Note that **this method must not be called from the outside of forward method.**
+    # @param [Integer, Array] indexes Indexes of input variables that the function does not require for backprop.
+    def retain_outputs(indexes)
+      @output_indexes_to_retain = indexes
+    end
+
+    # Computes gradients w.r.t. specified inputs given output gradients.
+    #
+    # This method is used to compute one step of the backpropagation corresponding to the forward computation of this function node.
+    # Given the gradients w.r.t. output variables, this method computes the gradients w.r.t. specified input variables.
+    # Note that this method does not need to compute any input gradients not specified by `target_input_indexes`
+    # It enables the function node to return the input gradients with the full computational history,
+    # in which case it supports *differentiable backpropagation* or *higher-order differentiation*.
+    #
+    # @param [Array<Integer>] target_indexes Indices of the input variables w.r.t. which the gradients are required.
+    #   It is guaranteed that this tuple contains at least one element.
+    # @param [Array<Chainer::Variable>] grad_outputs Gradients w.r.t. the output variables.
+    #   If the gradient w.r.t. an output variable is not given, the corresponding element is `None`.
+    # @return [Array<Chainer::Variable>] Array of Chainer::Variable that represent the gradients.
+    def backward(target_indexes, grad_outputs)
+      [nil] * target_indexes.size
+    end
+
+    # Computes gradients w.r.t. specified inputs and accumulates them.
+    #
+    # This method provides a way to fuse the backward computation and the gradient accumulations
+    # in the case that the multiple functions are applied to the same variable.
+    # Users have to override either of this method or `backward`.
+    # It is often simpler to implement `backward` and is recommended if you do not need to provide efficient gradient accumulation.
+    #
+    # @param [Array<Integer>] target_input_indexes Indices of the input variables w.r.t. which the gradients are required.
+    #   It is guaranteed that this tuple contains at least one element.
+    # @param [Array<Chainer::Variable>] grad_outputs Gradients w.r.t. the output variables.
+    #   If the gradient w.r.t. an output variable is not given, the corresponding element is `None`.
+    # @param [Array<Chainer::Variable>] grad_inputs Gradients w.r.t. the input variables specified by `target_input_indexes`.
+    #   These values are computed by other computation paths.
+    #   If there is no gradient value existing for the variable, the corresponding element is ``None``.
+    # @return [Array<Chainer::Variable>] Array of variables that represent the gradients w.r.t. specified input variables.
+    def backward_accumulate(target_input_indexes, grad_outputs, grad_inputs)
+      gxs = backward(target_input_indexes, grad_outputs)
+
+      len_gxs = gxs.size
+      if len_gxs == @inputs.size
+        gxs = target_input_indexes.map { |i| gxs[i] }
+      elsif len_gxs != target_input_indexes.size
+        raise ArgumentError, "number of gradients returned by #{impl_name} (#{label}) is incorrect."
+      end
+
+      gxs.zip(grad_inputs).map do |gx, g_input|
+        if g_input.nil?
+          gx
+        elsif gx.nil?
+          g_input
+        else
+          gx + g_input
+        end
+      end
+    end
+
+    # Returns a Array of retained input variables.
+    #
+    # This method is used to retrieve the input variables retained in `forward`.
+    #
+    # @return [Array] a Array of retained input variables.
+    def get_retained_inputs
+      @input_indexes_to_retain.map { |index| @inputs[index].get_variable }
+    end
+
+    # Returns a Array of retained output variables.
+    #
+    # This method is used to retrieve the input variables retained in `forward`.
+    #
+    # @return [Array] a Array of retained input variables.
+    def get_retained_outputs
+      ret = []
+      outputs = @outputs
+
+      new_outputs = outputs.dup
+      outputs_modified = false
+
+      @output_indexes_to_retain.zip(@retained_output_data) do |index, data|
+        output = outputs[index].__getobj__
+        if output.nil?
+          output_var = Chainer::Variable.new(data)
+          output_var.creator_node = self
+          new_outputs[index] = WeakRef.new(output_var)
+          outputs_modified = true
+        else
+          output_var = output.get_variable
+        end
+
+        ret << output_var
+      end
+
+      if outputs_modified
+        @outputs = Array(new_outputs)
+      end
+
+      ret
+    end
+
+    # Purges in/out nodes and this function node itself from the graph.
+    def unchain
+      @outputs.each do |y|
+        y_ref = y.()
+        unless y_ref.nil?
+          y_ref.unchain
+        end
+      end
+      @inputs = nil
+    end
+
+    private
+
+    def impl_name
+      self.class.name
+    end
+  end
+
+  def self.grad(outputs, inputs, grad_outputs: nil, grad_inputs: nil, set_grad: false, retain_grad: false, enable_double_backprop: false)
+    # The implementation consists of three steps.
+
+    if !outputs.is_a?(Array)
+      raise TypeError, "outputs must be Array, not #{outputs.class}"
+    end
+    if !inputs.is_a?(Array)
+      raise TypeError, "inputs must be Array, not #{inputs.class}"
+    end
+    if !grad_outputs.nil? && !grad_outputs.is_a?(Array)
+      raise TypeError, "grad_outputs must be Array, not #{grad_outputs.class}"
+    end
+    if !grad_inputs.nil? && !grad_inputs.is_a?(Array)
+      raise TypeError, "grad_inputs must be Array, not #{grad_inputs.class}"
+    end
+
+    # 1. Backward enumeration: all the nodes reachable backward from the output
+    #    nodes are enumerated. The forward direction links are collected in
+    #    this step. Note that the variable nodes whose requires_grad is false
+    #    are ignored and their creators are not searched.
+    candidate_funcs = outputs.map(&:creator_node).compact
+    visited_funcs = Set.new
+    forward_graph = {}
+
+    while func = candidate_funcs.pop
+      next if visited_funcs.include?(func)
+      visited_funcs.add(func)
+
+      func.inputs.each do |x|
+        next unless x.requires_grad
+        forward_graph[x] = [] if forward_graph[x].nil?
+        forward_graph[x] << func
+        creator = x.creator_node
+        if creator && !visited_funcs.include?(creator)
+          candidate_funcs << creator
+        end
+      end
+    end
+
+    # 2. Forward enumeration: all the nodes in the subgraph reachable from the
+    #    input nodes are enumerated. The extracted (sub-)subgraph is the union
+    #    of all paths that backpropagation will visit.
+    candidate_vars = inputs.map(&:node)
+    visited_funcs = Set.new
+    grad_required = Set.new
+    while x = candidate_vars.pop
+      grad_required.add(x)
+      forward_graph[x].each do |func|
+        next if visited_funcs.include?(func)
+        visited_funcs.add(func)
+        func.outputs.each do |y_ref|
+          y = y_ref.__getobj__
+          if y && forward_graph[y]
+            candidate_vars << y
+          end
+        end
+      end
+    end
+
+    # 3. Backpropagation: the backpropagation is executed along the
+    #    (sub-)subgraph. It uses the topological order of the subgraph which is
+    #    induced by the reversed order of function applications ("rank").
+    grads = {} # mapping from variable nodes to their gradients
+
+    # Initialize the gradient mapping.
+    grad_outputs = [nil] * outputs.size if grad_outputs.nil?
+    outputs.zip(grad_outputs).each do |y, gy|
+      if gy.nil?
+        gy_data = y.data.new_ones
+        gy = Chainer::Variable.new(gy_data, requires_grad: false)
+      end
+
+      grads[y.node] = gy
+    end
+
+    unless grad_inputs.nil?
+      inputs.zip(grad_inputs).each do |x, gx|
+        grads[x.node] = gx unless gx.nil?
+      end
+    end
+
+    # Backprop implementation. It edits grads which will only contain the
+    #   gradients w.r.t. the inputs.
+    old_enable_backprop = Chainer.configuration.enable_backprop
+    Chainer.configuration.enable_backprop = enable_double_backprop
+    backprop(outputs, inputs, grad_required, retain_grad, grads)
+    Chainer.configuration.enable_backprop = old_enable_backprop
+
+    # Extract the gradients w.r.t. the inputs and return them.
+    ret = inputs.map { |x| grads[x.node] }
+    if set_grad
+      inputs.zip(ret).each do |x, gx|
+        x.grad_var = gx
+      end
+    end
+
+    ret
+  end
+
+  def self.backprop(outputs, inputs, grad_required, retain_grad, grads)
+    candidate_funcs = []
+    visited_funcs = Set.new
+
+    push_candidate = -> (func) do
+      return if visited_funcs.include?(func)
+
+      # Negate since heapq is min-heap
+      # The second element is used to make each item unique
+      visited_funcs.add(func)
+      candidate_funcs.unshift(func)
+      candidate_funcs.sort_by! { |f| f.rank }
+    end
+
+    pop_candidate = -> () do
+      candidate_funcs.pop
+    end
+
+    outputs.each do |y|
+      creator = y.creator_node
+      next if creator.nil?
+      push_candidate.(creator)
+    end
+
+    input_nodes = Set.new(inputs.map(&:node))
+
+    while func = pop_candidate.()
+      # Collect the gradients w.r.t. the outputs
+      gys = []
+
+      func.outputs.each do |y_ref|
+        y = y_ref.__getobj__
+        if y.nil?
+          gys << nil
+          next
+        end
+        gys << grads[y]
+      end
+
+      # Collect the gradients w.r.t. the inputs
+      #
+      # Note (Tokui): when the same variable is passed multiple times as
+      # inputs in the same function (e.g. an expression like f(x, x)), the
+      # current implementation passes None as the current gradient w.r.t.
+      # such an input except for the first one (i.e., it builds gxs like
+      # (gx, None) where gx is the current gradient w.r.t. x).
+      gxs = []
+      input_indexes = []
+      selected_inputs = Set.new
+      func.inputs.each_with_index do |x, i|
+        next unless grad_required.include?(x)
+
+        input_indexes << i
+        if selected_inputs.include?(x)
+          gxs << nil
+        else
+          gxs << grads[x]
+          selected_inputs.add(x)
+        end
+      end
+
+      next if input_indexes.empty?
+
+      # Do backward
+      new_gxs = func.backward_accumulate(input_indexes, gys, gxs)
+
+      # Delete output gradients that are not required to return
+      func.outputs.each do |y_ref|
+        y = y_ref.__getobj__
+        if y && grads[y] && !input_nodes.include?(y)
+          grads.delete(y)
+        end
+      end
+
+      # Update grads
+      selected_inputs = Set.new
+      input_indexes.zip(new_gxs).each do |i, g|
+        next if g.nil?
+
+        node = func.inputs[i]
+        if selected_inputs.include?(node)
+          # Accumulate the duplicated gradients here
+          cur_gx = grads[node]
+          if cur_gx
+            g = g + cur_gx
+          end
+        else
+          selected_inputs.add(node)
+        end
+
+        grads[node] = g
+
+        if retain_grad
+          v = node.get_variable
+          if v
+            v.grad_var = g
+          end
+        end
+
+        creator = node.creator_node
+        if creator
+          push_candidate.(creator)
+        end
+      end
+    end
+  end
+  private_class_method :backprop
+end
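A hedged sketch of the graph API this file adds: `FunctionNode#apply` records backward edges while computing, and `Chainer.grad` (defined above) walks them to return input gradients without touching `x.grad` unless `set_grad: true` is passed. It assumes Variable arithmetic (basic_math.rb, also updated in this release) builds its graph through `FunctionNode#apply`.

```ruby
require 'chainer'

x = Chainer::Variable.new(Numo::SFloat[1.0, 2.0, 3.0])
y = x * x                      # graph edge: multiplication node -> x

gx, = Chainer.grad([y], [x])   # gy defaults to ones (y.data.new_ones)
p gx.data                      # => 2x, i.e. 2.0, 4.0, 6.0
```

Passing `enable_double_backprop: true` keeps backprop enabled during the walk, so the returned gradients carry their own history for higher-order differentiation.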