red-chainer 0.3.2 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (81)
  1. checksums.yaml +4 -4
  2. data/.gitignore +2 -2
  3. data/.travis.yml +8 -3
  4. data/.yardopts +1 -0
  5. data/Gemfile +6 -1
  6. data/README.md +34 -3
  7. data/examples/cifar/train_cifar.rb +13 -2
  8. data/examples/iris/iris.rb +9 -5
  9. data/examples/mnist/mnist.rb +16 -4
  10. data/lib/chainer.rb +17 -1
  11. data/lib/chainer/backend.rb +27 -0
  12. data/lib/chainer/cuda.rb +37 -15
  13. data/lib/chainer/dataset/convert.rb +20 -16
  14. data/lib/chainer/datasets/cifar.rb +8 -6
  15. data/lib/chainer/datasets/mnist.rb +14 -55
  16. data/lib/chainer/device.rb +88 -0
  17. data/lib/chainer/function.rb +103 -41
  18. data/lib/chainer/function_node.rb +454 -0
  19. data/lib/chainer/functions/activation/leaky_relu.rb +38 -13
  20. data/lib/chainer/functions/activation/log_softmax.rb +46 -9
  21. data/lib/chainer/functions/activation/relu.rb +8 -8
  22. data/lib/chainer/functions/activation/relu_grad2.rb +34 -0
  23. data/lib/chainer/functions/activation/sigmoid.rb +13 -11
  24. data/lib/chainer/functions/activation/sigmoid_grad.rb +25 -0
  25. data/lib/chainer/functions/activation/tanh.rb +48 -11
  26. data/lib/chainer/functions/array/broadcast_to.rb +56 -0
  27. data/lib/chainer/functions/array/cast.rb +41 -0
  28. data/lib/chainer/functions/array/reshape.rb +28 -0
  29. data/lib/chainer/functions/array/rollaxis.rb +57 -0
  30. data/lib/chainer/functions/array/select_item.rb +72 -0
  31. data/lib/chainer/functions/array/squeeze.rb +78 -0
  32. data/lib/chainer/functions/array/transpose.rb +44 -0
  33. data/lib/chainer/functions/connection/convolution_2d.rb +43 -26
  34. data/lib/chainer/functions/connection/convolution_2d_grad_w.rb +48 -0
  35. data/lib/chainer/functions/connection/deconvolution_2d.rb +159 -0
  36. data/lib/chainer/functions/connection/linear.rb +29 -22
  37. data/lib/chainer/functions/evaluation/accuracy.rb +5 -5
  38. data/lib/chainer/functions/loss/mean_squared_error.rb +21 -12
  39. data/lib/chainer/functions/loss/softmax_cross_entropy.rb +98 -71
  40. data/lib/chainer/functions/math/basic_math.rb +36 -30
  41. data/lib/chainer/functions/math/exp.rb +28 -0
  42. data/lib/chainer/functions/math/identity.rb +4 -3
  43. data/lib/chainer/functions/math/sum.rb +52 -0
  44. data/lib/chainer/functions/noise/dropout.rb +20 -4
  45. data/lib/chainer/functions/normalization/batch_normalization.rb +257 -104
  46. data/lib/chainer/functions/pooling/average_pooling_2d.rb +29 -6
  47. data/lib/chainer/functions/pooling/max_pooling_2d.rb +67 -12
  48. data/lib/chainer/functions/pooling/pooling_2d.rb +6 -4
  49. data/lib/chainer/gradient_check.rb +157 -73
  50. data/lib/chainer/gradient_method.rb +3 -2
  51. data/lib/chainer/initializers/init.rb +5 -5
  52. data/lib/chainer/initializers/normal.rb +4 -2
  53. data/lib/chainer/initializers/uniform.rb +15 -0
  54. data/lib/chainer/iterators/serial_iterator.rb +5 -3
  55. data/lib/chainer/link.rb +4 -2
  56. data/lib/chainer/links/connection/convolution_2d.rb +2 -2
  57. data/lib/chainer/links/model/classifier.rb +24 -5
  58. data/lib/chainer/links/normalization/batch_normalization.rb +7 -10
  59. data/lib/chainer/optimizer.rb +42 -11
  60. data/lib/chainer/optimizers/adam.rb +3 -2
  61. data/lib/chainer/optimizers/momentum_sgd.rb +1 -1
  62. data/lib/chainer/parameter.rb +7 -6
  63. data/lib/chainer/serializer.rb +4 -4
  64. data/lib/chainer/serializers/marshal.rb +10 -8
  65. data/lib/chainer/testing/array.rb +1 -1
  66. data/lib/chainer/training/extensions/evaluator.rb +2 -3
  67. data/lib/chainer/training/extensions/exponential_shift.rb +1 -1
  68. data/lib/chainer/training/extensions/progress_bar.rb +1 -0
  69. data/lib/chainer/training/trainer.rb +4 -9
  70. data/lib/chainer/training/triggers/interval.rb +7 -2
  71. data/lib/chainer/utils/array.rb +80 -1
  72. data/lib/chainer/utils/conv.rb +10 -2
  73. data/lib/chainer/utils/initializer.rb +2 -2
  74. data/lib/chainer/variable.rb +159 -69
  75. data/lib/chainer/variable_node.rb +64 -10
  76. data/lib/chainer/version.rb +1 -1
  77. data/red-chainer.gemspec +4 -3
  78. data/templates/default/layout/html/layout.erb +40 -0
  79. data/templates/default/onefile/html/layout.erb +33 -0
  80. metadata +44 -11
  81. data/lib/chainer/dataset/download.rb +0 -56
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 33a95bf098a08c334e6a9d29ff791350e6ac0bd9de843054f3ed14f2a005b79b
4
- data.tar.gz: 6f4e53b84e93d01e26363b5d43dba73ec4fc515ecbebbd1574ac6a864f52fb83
3
+ metadata.gz: e7ed2df404bfc36275381f523c0439f2e73debcf36f3b5edb063e985502d7a70
4
+ data.tar.gz: 357c983134aae985808568113d3f4f82bacebf6d25e5cf7c4f9197b1825455dc
5
5
  SHA512:
6
- metadata.gz: 40054365541bb8956c4a8211fbd489e75d1557a9e5c23bcb49f2cc2b393f0d96574d18259bad8e147525a3b720a5329f904be18c7c4f0891f1d886241b72a65d
7
- data.tar.gz: fcb8e641d0efc1ffacc2014c2954d1c5a1e5f947fdcc18306f8946fb307c659e37bb3ccf08b9661d17e13184463b0282ae3594a6c252813d23a53fa0c6182a67
6
+ metadata.gz: 40eb83d14d6efd140a4cb9748f04f50cfa325c9831d8020890a20fe88fc1485547f4dcab48cdcadfda317b46b3f4a6bc936eb8204ae39a876e053878caa7359f
7
+ data.tar.gz: af4133b975c5b4b5ca6e2ce9fb05eddd2b1de5a8a30df9c776531a5acdcf5bc4d8322dc7d6875c49800587a4d98031d0eb62054dbd87ced964093c501da32c95
data/.gitignore CHANGED
@@ -1,13 +1,13 @@
1
1
  /.bundle/
2
- /.yardoc
2
+ /.yardoc/
3
3
  /Gemfile.lock
4
- /_yardoc/
5
4
  /coverage/
6
5
  /doc/
7
6
  /pkg/
8
7
  /spec/reports/
9
8
  /tmp/
10
9
  result
10
+ Gemfile.local
11
11
 
12
12
  # rspec failure tracking
13
13
  .rspec_status
data/.travis.yml CHANGED
@@ -1,8 +1,13 @@
1
+ notifications:
2
+ webhooks:
3
+ - https://webhook.commit-email.info/
1
4
  sudo: false
2
5
  language: ruby
3
6
  rvm:
4
- - 2.3.6
5
7
  - 2.4.3
6
8
  - 2.5.0
7
- before_install: gem install bundler -v 1.15.1
8
- script: ruby test/run_test.rb
9
+ - 2.6.0
10
+ before_install: gem install bundler
11
+ script:
12
+ - ruby test/run_test.rb
13
+ - yardoc --fail-on-warning
data/.yardopts ADDED
@@ -0,0 +1 @@
1
+ -p templates
data/Gemfile CHANGED
@@ -1,4 +1,9 @@
1
1
  source "https://rubygems.org"
2
2
 
3
- # Specify your gem's dependencies in red-chainer.gemspec
4
3
  gemspec
4
+
5
+ local_gemfile = File.join(File.dirname(__FILE__), "Gemfile.local")
6
+ if File.exist?(local_gemfile)
7
+ puts "Loading Gemfile.local ..." if $DEBUG # `ruby -d` or `bundle -v`
8
+ instance_eval File.read(local_gemfile)
9
+ end
data/README.md CHANGED
@@ -8,7 +8,7 @@ It ported python's [Chainer](https://github.com/chainer/chainer) with Ruby.
8
8
 
9
9
  ## Requirements
10
10
 
11
- * Ruby 2.3 or later
11
+ * Ruby 2.4 or later
12
12
 
13
13
  ## Installation
14
14
 
@@ -31,7 +31,10 @@ $ gem install red-chainer
31
31
  ```
32
32
 
33
33
  ## Usage
34
- mnist sample program is [here](./examples/mnist/mnist.rb)
34
+
35
+ ### Run MNIST example
36
+
37
+ MNIST sample program is [here](./examples/mnist/mnist.rb)
35
38
 
36
39
  ```bash
37
40
  # when install Gemfile
@@ -40,6 +43,34 @@ $ bundle exec ruby examples/mnist/mnist.rb
40
43
  $ ruby examples/mnist/mnist.rb
41
44
  ```
42
45
 
46
+ ### Run MNIST example with GPU
47
+
48
+ On GPU machine, add `gem 'cumo'` on Gemfile and do `bundle install`.
49
+
50
+ Run the example with `--gpu` option whose value indicates GPU device ID such as:
51
+
52
+ ```
53
+ $ bundle exec ruby examples/mnist/mnist.rb --gpu 0
54
+ ```
55
+
56
+ ## Development
57
+
58
+ ### Run tests
59
+
60
+ ```
61
+ $ bundle exec ruby test/run_test.rb
62
+ ```
63
+
64
+ ### Run tests with Cumo
65
+
66
+ On GPU machine, add `gem 'cumo'` on Gemfile and do `bundle install`.
67
+
68
+ Run tests with `RED_CHAINER_GPU` environment variable whose value indicates GPU device ID such as:
69
+
70
+ ```
71
+ $ bundle exec env RED_CHAINER_GPU=0 ruby test/run_test.rb
72
+ ```
73
+
43
74
  ## License
44
75
 
45
76
  The MIT license. See [LICENSE.txt](./LICENSE.txt) for details.
@@ -54,4 +85,4 @@ The MIT license. See [LICENSE.txt](./LICENSE.txt) for details.
54
85
  | [connection](https://github.com/red-data-tools/red-chainer/tree/master/lib/chainer/functions/connection) | 12 | 2 | Linear, Convolution2D |
55
86
  | [pooling](https://github.com/red-data-tools/red-chainer/tree/master/lib/chainer/functions/pooling) | 14 | 3 | Pooling2D, MaxPooling2D, AveragePooling2D |
56
87
  | [example](https://github.com/red-data-tools/red-chainer/tree/master/examples) | 31 | 3 | MNIST, Iris, CIFAR |
57
- | GPU | use cupy | ToDo | want to support [Cumo](https://github.com/sonots/cumo) |
88
+ | GPU | use CuPy | use [Cumo](https://github.com/sonots/cumo) ||
@@ -9,6 +9,7 @@ args = {
9
9
  batchsize: 64,
10
10
  learnrate: 0.05,
11
11
  epoch: 300,
12
+ gpu: Integer(ENV['RED_CHAINER_GPU'] || -1),
12
13
  out: 'result',
13
14
  resume: nil,
14
15
  model: 'vgg',
@@ -21,11 +22,21 @@ opt.on('-b', '--batchsize VALUE', "Number of images in each mini-batch (default:
21
22
  opt.on('-f', '--frequency VALUE', "Frequency of taking a snapshot (default: #{args[:frequency]})") { |v| args[:frequency] = v.to_i }
22
23
  opt.on('-l', '--learnrate VALUE', "Learning rate for SGD (default: #{args[:learnrate]})") { |v| args[:learnrate] = v.to_f }
23
24
  opt.on('-e', '--epoch VALUE', "Number of sweeps over the dataset to train (default: #{args[:epoch]})") { |v| args[:epoch] = v.to_i }
25
+ opt.on('-g', '--gpu VALUE', "GPU ID (negative value indicates CPU) (default: #{args[:gpu]})") { |v| args[:gpu] = v.to_i }
24
26
  opt.on('-o', '--out VALUE', "Directory to output the result (default: #{args[:out]})") { |v| args[:out] = v }
25
27
  opt.on('-r', '--resume VALUE', "Resume the training from snapshot") { |v| args[:resume] = v }
26
28
  opt.on('-m', '--model VALUE', "Use model") { |v| args[:model] = v }
27
29
  opt.parse!(ARGV)
28
30
 
31
+ puts "GPU: #{args[:gpu]}"
32
+ puts "# unit: #{args[:unit]}"
33
+ puts "# Minibatch-size: #{args[:batchsize]}"
34
+ puts "# epoch: #{args[:epoch]}"
35
+ puts
36
+
37
+ device = Chainer::Device.create(args[:gpu])
38
+ Chainer::Device.change_default(device)
39
+
29
40
  # Set up a neural network to train.
30
41
  # Classifier reports softmax cross entropy loss and accuracy at every
31
42
  # iteration, which will be used by the PrintReport extension below.
@@ -57,10 +68,10 @@ optimizer.setup(model)
57
68
  train_iter = Chainer::Iterators::SerialIterator.new(train, args[:batchsize])
58
69
  test_iter = Chainer::Iterators::SerialIterator.new(test, args[:batchsize], repeat: false, shuffle: false)
59
70
 
60
- updater = Chainer::Training::StandardUpdater.new(train_iter, optimizer, device: -1)
71
+ updater = Chainer::Training::StandardUpdater.new(train_iter, optimizer, device: device)
61
72
  trainer = Chainer::Training::Trainer.new(updater, stop_trigger: [args[:epoch], 'epoch'], out: args[:out])
62
73
 
63
- trainer.extend(Chainer::Training::Extensions::Evaluator.new(test_iter, model, device: -1))
74
+ trainer.extend(Chainer::Training::Extensions::Evaluator.new(test_iter, model, device: device))
64
75
 
65
76
  trainer.extend(Chainer::Training::Extensions::ExponentialShift.new('lr', 0.5), trigger: [25, 'epoch'])
66
77
 
@@ -25,6 +25,10 @@ class IrisChain < Chainer::Chain
25
25
  end
26
26
  end
27
27
 
28
+ device = Chainer::Device.create(Integer(ENV['RED_CHAINER_GPU'] || -1))
29
+ Chainer::Device.change_default(device)
30
+ xm = device.xm
31
+
28
32
  model = IrisChain.new(6,3)
29
33
 
30
34
  optimizer = Chainer::Optimizers::Adam.new
@@ -35,7 +39,7 @@ iris_table = iris.to_table
35
39
  x = iris_table.fetch_values(:sepal_length, :sepal_width, :petal_length, :petal_width).transpose
36
40
 
37
41
  # target
38
- y_class = iris_table[:class]
42
+ y_class = iris_table[:label]
39
43
 
40
44
  # class index array
41
45
  # ["Iris-setosa", "Iris-versicolor", "Iris-virginica"]
@@ -46,7 +50,7 @@ y = y_class.map{|s|
46
50
  }
47
51
 
48
52
  # y_onehot => One-hot [[1.0, 0.0, 0.0], [1.0, 0.0, 0.0],,, [0.0, 1.0, 0.0], ,, [0.0, 0.0, 1.0]]
49
- y_onehot = Numo::SFloat.eye(class_name.size)[y,false]
53
+ y_onehot = xm::SFloat.eye(class_name.size)[y, false]
50
54
 
51
55
  puts "Iris Datasets"
52
56
  puts "No. [sepal_length, sepal_width, petal_length, petal_width] one-hot #=> class"
@@ -57,9 +61,9 @@ x.each_with_index{|r, i|
57
61
  # [7.0, 3.2, 4.7, 1.4, "Iris-versicolor"] => 50 data
58
62
  # [6.3, 3.3, 6.0, 2.5, "Iris-virginica"] => 50 data
59
63
 
60
- x = Numo::SFloat.cast(x)
61
- y = Numo::SFloat.cast(y)
62
- y_onehot = Numo::SFloat.cast(y_onehot)
64
+ x = xm::SFloat.cast(x)
65
+ y = xm::SFloat.cast(y)
66
+ y_onehot = xm::SFloat.cast(y_onehot)
63
67
 
64
68
  x_train = x[(1..-1).step(2), true] #=> 75 data (Iris-setosa : 25, Iris-versicolor : 25, Iris-virginica : 25)
65
69
  y_train = y_onehot[(1..-1).step(2), true] #=> 75 data (Iris-setosa : 25, Iris-versicolor : 25, Iris-virginica : 25)
@@ -27,6 +27,7 @@ args = {
27
27
  batchsize: 100,
28
28
  frequency: -1,
29
29
  epoch: 20,
30
+ gpu: Integer(ENV['RED_CHAINER_GPU'] || -1),
30
31
  resume: nil,
31
32
  unit: 1000,
32
33
  out: 'result'
@@ -35,25 +36,36 @@ args = {
35
36
  opt = OptionParser.new
36
37
  opt.on('-b', '--batchsize VALUE', "Number of images in each mini-batch (default: #{args[:batchsize]})") { |v| args[:batchsize] = v.to_i }
37
38
  opt.on('-e', '--epoch VALUE', "Number of sweeps over the dataset to train (default: #{args[:epoch]})") { |v| args[:epoch] = v.to_i }
39
+ opt.on('-g', '--gpu VALUE', "GPU ID (negative value indicates CPU) (default: #{args[:gpu]})") { |v| args[:gpu] = v.to_i }
38
40
  opt.on('-f', '--frequency VALUE', "Frequency of taking a snapshot (default: #{args[:frequency]})") { |v| args[:frequency] = v.to_i }
39
41
  opt.on('-o', '--out VALUE', "Directory to output the result (default: #{args[:out]})") { |v| args[:out] = v }
40
42
  opt.on('-r', '--resume VALUE', "Resume the training from snapshot") { |v| args[:resume] = v }
41
43
  opt.on('-u', '--unit VALUE', "Number of units (default: #{args[:unit]})") { |v| args[:unit] = v.to_i }
42
44
  opt.parse!(ARGV)
43
45
 
44
- model = Chainer::Links::Model::Classifier.new(MLP.new(args[:unit], 10))
46
+ puts "GPU: #{args[:gpu]}"
47
+ puts "# unit: #{args[:unit]}"
48
+ puts "# Minibatch-size: #{args[:batchsize]}"
49
+ puts "# epoch: #{args[:epoch]}"
50
+ puts
51
+
52
+ device = Chainer::Device.create(args[:gpu])
53
+ Chainer::Device.change_default(device)
54
+
55
+ lossfun = -> (x, t) { Chainer::Functions::Loss::SoftmaxCrossEntropy.new(ignore_label: nil).(x, t) }
56
+ model = Chainer::Links::Model::Classifier.new(MLP.new(args[:unit], 10), lossfun)
45
57
 
46
58
  optimizer = Chainer::Optimizers::Adam.new
47
59
  optimizer.setup(model)
48
- train, test = Chainer::Datasets::Mnist.get_mnist
60
+ train, test = Chainer::Datasets::MNIST.get_mnist
49
61
 
50
62
  train_iter = Chainer::Iterators::SerialIterator.new(train, args[:batchsize])
51
63
  test_iter = Chainer::Iterators::SerialIterator.new(test, args[:batchsize], repeat: false, shuffle: false)
52
64
 
53
- updater = Chainer::Training::StandardUpdater.new(train_iter, optimizer, device: -1)
65
+ updater = Chainer::Training::StandardUpdater.new(train_iter, optimizer, device: device)
54
66
  trainer = Chainer::Training::Trainer.new(updater, stop_trigger: [args[:epoch], 'epoch'], out: args[:out])
55
67
 
56
- trainer.extend(Chainer::Training::Extensions::Evaluator.new(test_iter, model, device: -1))
68
+ trainer.extend(Chainer::Training::Extensions::Evaluator.new(test_iter, model, device: args[:gpu]))
57
69
 
58
70
  # Take a snapshot for each specified epoch
59
71
  frequency = args[:frequency] == -1 ? args[:epoch] : [1, args[:frequency]].max
data/lib/chainer.rb CHANGED
@@ -3,8 +3,11 @@ require "weakref"
3
3
  require "chainer/version"
4
4
 
5
5
  require 'chainer/cuda'
6
+ require 'chainer/backend'
6
7
  require 'chainer/configuration'
8
+ require 'chainer/device'
7
9
  require 'chainer/function'
10
+ require 'chainer/function_node'
8
11
  require 'chainer/optimizer'
9
12
  require 'chainer/gradient_method'
10
13
  require 'chainer/gradient_check'
@@ -15,6 +18,7 @@ require 'chainer/initializer'
15
18
  require 'chainer/initializers/init'
16
19
  require 'chainer/initializers/constant'
17
20
  require 'chainer/initializers/normal'
21
+ require 'chainer/initializers/uniform'
18
22
  require 'chainer/iterators/serial_iterator'
19
23
  require 'chainer/link'
20
24
  require 'chainer/links/connection/convolution_2d'
@@ -30,15 +34,28 @@ require 'chainer/utils/variable'
30
34
  require 'chainer/utils/array'
31
35
  require 'chainer/functions/activation/leaky_relu'
32
36
  require 'chainer/functions/activation/relu'
37
+ require 'chainer/functions/activation/relu_grad2'
33
38
  require 'chainer/functions/activation/sigmoid'
39
+ require 'chainer/functions/activation/sigmoid_grad'
34
40
  require 'chainer/functions/activation/tanh'
35
41
  require 'chainer/functions/activation/log_softmax'
42
+ require 'chainer/functions/array/broadcast_to'
43
+ require 'chainer/functions/array/cast'
44
+ require 'chainer/functions/array/reshape'
45
+ require 'chainer/functions/array/rollaxis'
46
+ require 'chainer/functions/array/select_item'
47
+ require 'chainer/functions/array/squeeze'
48
+ require 'chainer/functions/array/transpose'
36
49
  require 'chainer/functions/evaluation/accuracy'
37
50
  require 'chainer/functions/math/basic_math'
38
51
  require 'chainer/functions/math/identity'
52
+ require 'chainer/functions/math/sum'
53
+ require 'chainer/functions/math/exp'
39
54
  require 'chainer/functions/loss/mean_squared_error'
40
55
  require 'chainer/functions/loss/softmax_cross_entropy'
41
56
  require 'chainer/functions/connection/convolution_2d'
57
+ require 'chainer/functions/connection/deconvolution_2d'
58
+ require 'chainer/functions/connection/convolution_2d_grad_w'
42
59
  require 'chainer/functions/connection/linear'
43
60
  require 'chainer/functions/noise/dropout'
44
61
  require 'chainer/functions/normalization/batch_normalization'
@@ -61,7 +78,6 @@ require 'chainer/training/triggers/interval'
61
78
  require 'chainer/parameter'
62
79
  require 'chainer/optimizers/adam'
63
80
  require 'chainer/optimizers/momentum_sgd'
64
- require 'chainer/dataset/download'
65
81
  require 'chainer/datasets/mnist'
66
82
  require 'chainer/datasets/cifar'
67
83
  require 'chainer/datasets/tuple_dataset'
@@ -0,0 +1,27 @@
1
+ module Chainer
2
+ # Gets an appropriate one from +Numo::NArray+ or +Cumo::NArray+ from given arrays.
3
+ #
4
+ # @param [Array<Chainer::Variable> or Array<Numo::NArray> or Array<Cumo::NArray>] args Values to determine whether Numo or Cumo should be used.
5
+ # @return [Class] +Cumo::NArray+ or +Numo::NArray+ is returned based on the types of the arguments.
6
+ def get_array_module(*args)
7
+ arrays = args.map {|v| v.kind_of?(Chainer::Variable) ? v.data : v }
8
+ if CUDA.available?
9
+ return Cumo if arrays.any? {|a| a.kind_of?(Cumo::NArray) }
10
+ end
11
+ return Numo
12
+ end
13
+ module_function :get_array_module
14
+
15
+ # Returns true if the argument is either of +Numo::NArray+ or +Cumo::NArray+.
16
+ #
17
+ # @param [Object] obj
18
+ # @return [Boolean]
19
+ def array?(obj)
20
+ if CUDA.available?
21
+ return true if obj.kind_of?(Cumo::NArray)
22
+ end
23
+ return true if obj.kind_of?(Numo::NArray)
24
+ false
25
+ end
26
+ module_function :array?
27
+ end
data/lib/chainer/cuda.rb CHANGED
@@ -1,18 +1,40 @@
1
+ begin
2
+ require 'cumo'
3
+ $chainer_cuda_available = true
4
+ rescue LoadError => e
5
+ $chainer_cuda_available = false
6
+ # A trick to make Cumo::NArray always exists
7
+ module Cumo
8
+ class NArray; end
9
+ class NMath; end
10
+ class Bit; end
11
+ end
12
+ end
13
+
1
14
  module Chainer
2
- # Gets an appropriate one from +Numo::NArray+ or +Cumo::NArray+.
3
- #
4
- # This is almost equivalent to +Chainer::get_array_module+. The differences
5
- # are that this function can be used even if CUDA is not available and that
6
- # it will return their data arrays' array module for
7
- # +Chainer::Variable+ arguments.
8
- #
9
- # @param [Array<Chainer::Variable> or Array<Numo::NArray> or Array<Cumo::NArray>] args Values to determine whether Numo or Cumo should be used.
10
- # @return [Numo::NArray] +Cumo::NArray+ or +Numo::NArray+ is returned based on the types of
11
- # the arguments.
12
- # @todo CUDA is not supported, yet.
13
- #
14
- def get_array_module(*args)
15
- return Numo::NArray
15
+ module CUDA
16
+ # Returns whether CUDA is available.
17
+ #
18
+ # @param [Integer or nil] id If a non negative integer is given, check availability of GPU ID.
19
+ # @return [Boolean]
20
+ def available?(id = nil)
21
+ return false unless $chainer_cuda_available
22
+ if id
23
+ raise 'id must be non negative' if id < 0
24
+ @device_count ||= Cumo::CUDA::Runtime.cudaGetDeviceCount
25
+ return @device_count > id
26
+ end
27
+ true
28
+ end
29
+ module_function :available?
30
+
31
+ # Checks if CUDA is available.
32
+ #
33
+ # @param [Integer or nil] id If a non negative integer is given, check availability of GPU ID.
34
+ # @raise [RuntimeError] if not available
35
+ def check_available(id = nil)
36
+ raise 'CUDA is not available' unless available?(id)
37
+ end
38
+ module_function :check_available
16
39
  end
17
- module_function :get_array_module
18
40
  end
@@ -2,12 +2,13 @@ module Chainer
2
2
  module Dataset
3
3
  module Convert
4
4
  def self.to_device(device, x)
5
- # TODO: support cuda
5
+ # TODO(sonots): Implement after Cumo supports transferring between devices
6
6
  x
7
7
  end
8
8
 
9
9
  def self.concat_examples(batch, device: nil, padding: nil)
10
10
  raise "batch is empty" if batch.size == 0
11
+ device = device ? Chainer::Device.create(device) : Chainer::Device.default # takes care of int and nil
11
12
  first_elem = batch[0]
12
13
 
13
14
  if first_elem.kind_of?(Array)
@@ -17,28 +18,29 @@ module Chainer
17
18
  end
18
19
 
19
20
  first_elem.size.times do |i|
20
- x = concat_arrays(batch.map { |b| b[i] }, padding[i])
21
+ x = _concat_arrays(batch.map { |b| b[i] }, padding[i], device)
21
22
  result.push(to_device(device, x))
22
23
  end
23
24
 
24
25
  return result
25
26
  else
26
- return to_device(device, concat_arrays(batch, padding))
27
+ return _concat_arrays(batch, padding, device)
27
28
  end
28
29
  end
29
30
 
30
- def self.concat_arrays(arrays, padding)
31
- unless arrays[0].kind_of?(Numo::NArray)
31
+ def self._concat_arrays(arrays, padding, device)
32
+ xm = device.xm
33
+ unless arrays[0].kind_of?(xm::NArray)
32
34
  # [1, 2, 3, 4] => Numo::Int32[1, 2, 3, 4]
33
- arrays = Numo::NArray.cast(arrays)
35
+ arrays = xm::NArray.cast(arrays)
34
36
  if padding
35
- return concat_arrays_with_padding(arrays, padding)
37
+ return _concat_arrays_with_padding(arrays, padding, device)
36
38
  end
37
39
  return arrays
38
40
  end
39
41
 
40
42
  if padding
41
- return concat_arrays_with_padding(arrays, padding)
43
+ return _concat_arrays_with_padding(arrays, padding, device)
42
44
  end
43
45
 
44
46
  # [Numo::SFloat[1, 2], Numo::SFloat[3, 4]]
@@ -48,12 +50,14 @@ module Chainer
48
50
  a[0].concatenate(*a[1..-1])
49
51
  end
50
52
 
51
- def self.concat_arrays_with_padding(arrays, padding)
52
- if arrays[0].is_a? Numo::NArray
53
- shape = Numo::Int32.cast(arrays[0].shape)
53
+ def self._concat_arrays_with_padding(arrays, padding, device)
54
+ xm = device.xm
55
+ if Chainer.array?(arrays[0]) and arrays[0].ndim > 0
56
+ xm = Chainer.get_array_module(arrays[0])
57
+ shape = xm::Int32.cast(arrays[0].shape)
54
58
  arrays[1..-1].each do |array|
55
- if Numo::Bit.[](shape != array.shape).any?
56
- shape = Numo::Int32.maximum(shape, array.shape)
59
+ if xm::Bit.[](shape != array.shape).any?
60
+ shape = xm::Int32.maximum(shape, array.shape)
57
61
  end
58
62
  end
59
63
  else # Integer
@@ -61,15 +65,15 @@ module Chainer
61
65
  end
62
66
 
63
67
  shape = shape.insert(0, arrays.size).to_a
64
- if arrays[0].is_a? Numo::NArray
68
+ if Chainer.array?(arrays[0]) and arrays[0].ndim > 0
65
69
  result = arrays[0].class.new(shape).fill(padding)
66
70
  else # Integer
67
- result = Numo::Int32.new(shape).fill(padding)
71
+ result = xm::Int32.new(shape).fill(padding)
68
72
  end
69
73
 
70
74
  arrays.size.times do |i|
71
75
  src = arrays[i]
72
- if src.is_a? Numo::NArray
76
+ if Chainer.array?(src) and src.ndim > 0
73
77
  result[i, 0...src.shape[0], 0...src.shape[1]] = src
74
78
  else # Integer
75
79
  result[i] = src