torch-rb 0.3.0 → 0.3.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 33636e58063f25c2b9f122d29332e4136bb6a4de0fd227349f75d65a9db94931
-  data.tar.gz: 9349dd0b050a4c9e0714d92bb451bdd916e55fb47a5c4d90a74720d53564a1d6
+  metadata.gz: 93271ffd62be6e35c6ea3a2219a7bc3dccbe8489d6f4aca1a1f00f99bab1a4bb
+  data.tar.gz: df2755ac3e6221502430d780d116a1145c461f97857e7b1b2b809095afaad9e5
 SHA512:
-  metadata.gz: 692e8dc3531426377413fc9325c2b03dd7fcbbbce0c05cbd5d7c3182a08bbe733bb9a6b0aa62a56fb27917073e1f1f5859aa0dd3f6f40e74043bba242ede6267
-  data.tar.gz: f57d0411c18c7c4753f5edc82e48b666ad3154c72bf189a8ec2c4dceb08cd1f37a9421b9a6eae3d20e10c4c9236a1136d76559a31989ce22868a9f44ef3e0e66
+  metadata.gz: 9e02de90a7a83e5d4421941a0ceea69c6367f42be2e97e4229812f35c27f83475fbace86f42285128da724343dcfd85050b7846d81d43fce100749be0072ad4c
+  data.tar.gz: 884873c3c965f16b0a833087909019ebc6f228511a9b0ecbf4c436cc546e28012e63899651aeab6befddbe7b057676b170cd3eb858b997f42289c103252a2834
@@ -1,3 +1,30 @@
+## 0.3.5 (2020-09-04)
+
+- Fixed error with data loader (due to `dtype` of `randperm`)
+
+## 0.3.4 (2020-08-26)
+
+- Added `Torch.clamp` method
+
+## 0.3.3 (2020-08-25)
+
+- Added spectral ops
+- Fixed tensor indexing
+
+## 0.3.2 (2020-08-24)
+
+- Added `enable_grad` method
+- Added `random_split` method
+- Added `collate_fn` option to `DataLoader`
+- Added `grad=` method to `Tensor`
+- Fixed error with `grad` method when empty
+- Fixed `EmbeddingBag`
+
+## 0.3.1 (2020-08-17)
+
+- Added `create_graph` and `retain_graph` options to `backward` method
+- Fixed error when `set` not required
+
 ## 0.3.0 (2020-07-29)
 
 - Updated LibTorch to 1.6.0
data/README.md CHANGED
@@ -2,7 +2,11 @@
 
 :fire: Deep learning for Ruby, powered by [LibTorch](https://pytorch.org)
 
-For computer vision tasks, also check out [TorchVision](https://github.com/ankane/torchvision)
+Check out:
+
+- [TorchVision](https://github.com/ankane/torchvision) for computer vision tasks
+- [TorchText](https://github.com/ankane/torchtext) for text and NLP tasks
+- [TorchAudio](https://github.com/ankane/torchaudio) for audio tasks
 
 [![Build Status](https://travis-ci.org/ankane/torch.rb.svg?branch=master)](https://travis-ci.org/ankane/torch.rb)
 
@@ -411,7 +415,7 @@ Here’s the list of compatible versions.
 
 Torch.rb | LibTorch
 --- | ---
-0.3.0 | 1.6.0
+0.3.0-0.3.4 | 1.6.0
 0.2.0-0.2.7 | 1.5.0-1.5.1
 0.1.8 | 1.4.0
 0.1.0-0.1.7 | 1.3.1
@@ -16,6 +16,7 @@
 #include "nn_functions.hpp"
 
 using namespace Rice;
+using torch::indexing::TensorIndex;
 
 // need to make a distinction between parameters and tensors
 class Parameter: public torch::autograd::Variable {
@@ -28,6 +29,15 @@ void handle_error(torch::Error const & ex)
   throw Exception(rb_eRuntimeError, ex.what_without_backtrace());
 }
 
+std::vector<TensorIndex> index_vector(Array a) {
+  auto indices = std::vector<TensorIndex>();
+  indices.reserve(a.size());
+  for (size_t i = 0; i < a.size(); i++) {
+    indices.push_back(from_ruby<TensorIndex>(a[i]));
+  }
+  return indices;
+}
+
 extern "C"
 void Init_ext()
 {
@@ -58,6 +68,13 @@
       return generator.seed();
     });
 
+  Class rb_cTensorIndex = define_class_under<TensorIndex>(rb_mTorch, "TensorIndex")
+    .define_singleton_method("boolean", *[](bool value) { return TensorIndex(value); })
+    .define_singleton_method("integer", *[](int64_t value) { return TensorIndex(value); })
+    .define_singleton_method("tensor", *[](torch::Tensor& value) { return TensorIndex(value); })
+    .define_singleton_method("slice", *[](torch::optional<int64_t> start_index, torch::optional<int64_t> stop_index) { return TensorIndex(torch::indexing::Slice(start_index, stop_index)); })
+    .define_singleton_method("none", *[]() { return TensorIndex(torch::indexing::None); });
+
   // https://pytorch.org/cppdocs/api/structc10_1_1_i_value.html
   Class rb_cIValue = define_class_under<torch::IValue>(rb_mTorch, "IValue")
     .add_handler<torch::Error>(handle_error)
@@ -330,6 +347,18 @@
     .define_method("numel", &torch::Tensor::numel)
     .define_method("element_size", &torch::Tensor::element_size)
     .define_method("requires_grad", &torch::Tensor::requires_grad)
+    .define_method(
+      "_index",
+      *[](Tensor& self, Array indices) {
+        auto vec = index_vector(indices);
+        return self.index(vec);
+      })
+    .define_method(
+      "_index_put_custom",
+      *[](Tensor& self, Array indices, torch::Tensor& value) {
+        auto vec = index_vector(indices);
+        return self.index_put_(vec, value);
+      })
     .define_method(
       "contiguous?",
       *[](Tensor& self) {
@@ -352,13 +381,19 @@
       })
     .define_method(
       "_backward",
-      *[](Tensor& self, Object gradient) {
-        return gradient.is_nil() ? self.backward() : self.backward(from_ruby<torch::Tensor>(gradient));
+      *[](Tensor& self, OptionalTensor gradient, bool create_graph, bool retain_graph) {
+        return self.backward(gradient, create_graph, retain_graph);
       })
     .define_method(
       "grad",
       *[](Tensor& self) {
-        return self.grad();
+        auto grad = self.grad();
+        return grad.defined() ? to_ruby<torch::Tensor>(grad) : Nil;
+      })
+    .define_method(
+      "grad=",
+      *[](Tensor& self, torch::Tensor& grad) {
+        self.grad() = grad;
       })
     .define_method(
       "_dtype",
@@ -502,6 +537,7 @@
     });
 
   Module rb_mInit = define_module_under(rb_mNN, "Init")
+    .add_handler<torch::Error>(handle_error)
     .define_singleton_method(
       "_calculate_gain",
       *[](NonlinearityType nonlinearity, double param) {
@@ -580,11 +616,16 @@
       *[](Parameter& self) {
         auto grad = self.grad();
         return grad.defined() ? to_ruby<torch::Tensor>(grad) : Nil;
+      })
+    .define_method(
+      "grad=",
+      *[](Parameter& self, torch::Tensor& grad) {
+        self.grad() = grad;
       });
 
   Class rb_cDevice = define_class_under<torch::Device>(rb_mTorch, "Device")
-    .define_constructor(Constructor<torch::Device, std::string>())
     .add_handler<torch::Error>(handle_error)
+    .define_constructor(Constructor<torch::Device, std::string>())
     .define_method("index", &torch::Device::index)
     .define_method("index?", &torch::Device::has_index)
     .define_method(
@@ -7,17 +7,16 @@ $CXXFLAGS += " -std=c++14"
 # change to 0 for Linux pre-cxx11 ABI version
 $CXXFLAGS += " -D_GLIBCXX_USE_CXX11_ABI=1"
 
-# TODO check compiler name
-clang = RbConfig::CONFIG["host_os"] =~ /darwin/i
+apple_clang = RbConfig::CONFIG["CC_VERSION_MESSAGE"] =~ /apple clang/i
 
 # check omp first
 if have_library("omp") || have_library("gomp")
   $CXXFLAGS += " -DAT_PARALLEL_OPENMP=1"
-  $CXXFLAGS += " -Xclang" if clang
+  $CXXFLAGS += " -Xclang" if apple_clang
   $CXXFLAGS += " -fopenmp"
 end
 
-if clang
+if apple_clang
   # silence ruby/intern.h warning
   $CXXFLAGS += " -Wno-deprecated-register"
 
@@ -9,6 +9,10 @@
 
 using namespace Rice;
 
+using torch::Device;
+using torch::ScalarType;
+using torch::Tensor;
+
 // need to wrap torch::IntArrayRef() since
 // it doesn't own underlying data
 class IntArrayRef {
@@ -174,8 +178,6 @@ MyReduction from_ruby<MyReduction>(Object x)
   return MyReduction(x);
 }
 
-typedef torch::Tensor Tensor;
-
 class OptionalTensor {
   Object value;
   public:
@@ -197,47 +199,28 @@ OptionalTensor from_ruby<OptionalTensor>(Object x)
   return OptionalTensor(x);
 }
 
-class ScalarType {
-  Object value;
-  public:
-    ScalarType(Object o) {
-      value = o;
-    }
-    operator at::ScalarType() {
-      throw std::runtime_error("ScalarType arguments not implemented yet");
-    }
-};
-
 template<>
 inline
-ScalarType from_ruby<ScalarType>(Object x)
+torch::optional<torch::ScalarType> from_ruby<torch::optional<torch::ScalarType>>(Object x)
 {
-  return ScalarType(x);
+  if (x.is_nil()) {
+    return torch::nullopt;
+  } else {
+    return torch::optional<torch::ScalarType>{from_ruby<torch::ScalarType>(x)};
+  }
 }
 
-class OptionalScalarType {
-  Object value;
-  public:
-    OptionalScalarType(Object o) {
-      value = o;
-    }
-    operator c10::optional<at::ScalarType>() {
-      if (value.is_nil()) {
-        return c10::nullopt;
-      }
-      return ScalarType(value);
-    }
-};
-
 template<>
 inline
-OptionalScalarType from_ruby<OptionalScalarType>(Object x)
+torch::optional<int64_t> from_ruby<torch::optional<int64_t>>(Object x)
 {
-  return OptionalScalarType(x);
+  if (x.is_nil()) {
+    return torch::nullopt;
+  } else {
+    return torch::optional<int64_t>{from_ruby<int64_t>(x)};
+  }
 }
 
-typedef torch::Device Device;
-
 Object wrap(std::tuple<torch::Tensor, torch::Tensor> x);
 Object wrap(std::tuple<torch::Tensor, torch::Tensor, torch::Tensor> x);
 Object wrap(std::tuple<torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor> x);
@@ -4,6 +4,7 @@ require "torch/ext"
 # stdlib
 require "fileutils"
 require "net/http"
+require "set"
 require "tmpdir"
 
 # native functions
@@ -178,8 +179,10 @@ require "torch/nn/functional"
 require "torch/nn/init"
 
 # utils
+require "torch/utils/data"
 require "torch/utils/data/data_loader"
 require "torch/utils/data/dataset"
+require "torch/utils/data/subset"
 require "torch/utils/data/tensor_dataset"
 
 # hub
@@ -315,6 +318,16 @@ module Torch
       end
     end
 
+    def enable_grad
+      previous_value = grad_enabled?
+      begin
+        _set_grad_enabled(true)
+        yield
+      ensure
+        _set_grad_enabled(previous_value)
+      end
+    end
+
     def device(str)
      Device.new(str)
    end
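
The `enable_grad` helper added above is the counterpart to `Torch.no_grad`: it turns gradient tracking on for the duration of a block and restores the previous mode in an `ensure`. A minimal usage sketch (it assumes `Torch.no_grad`, which torch-rb already provides; the printed values are illustrative):

```ruby
require "torch"

x = Torch.tensor([1.0, 2.0, 3.0], requires_grad: true)

Torch.no_grad do
  # gradient tracking is disabled here...
  Torch.enable_grad do
    # ...and re-enabled only inside this block
    y = (x * 2).sum
    y.backward
  end
end

p x.grad.to_a # => [2.0, 2.0, 2.0]
```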
@@ -375,6 +388,10 @@ module Torch
     end
 
     def randperm(n, **options)
+      # dtype hack in Python
+      # https://github.com/pytorch/pytorch/blob/v1.6.0/tools/autograd/gen_python_functions.py#L1307-L1311
+      options[:dtype] ||= :int64
+
       _randperm(n, tensor_options(**options))
     end
 
@@ -447,6 +464,22 @@ module Torch
       zeros(input.size, **like_options(input, options))
     end
 
+    def stft(input, n_fft, hop_length: nil, win_length: nil, window: nil, center: true, pad_mode: "reflect", normalized: false, onesided: true)
+      if center
+        signal_dim = input.dim
+        extended_shape = [1] * (3 - signal_dim) + input.size
+        pad = n_fft.div(2).to_i
+        input = NN::F.pad(input.view(extended_shape), [pad, pad], mode: pad_mode)
+        input = input.view(input.shape[-signal_dim..-1])
+      end
+      _stft(input, n_fft, hop_length, win_length, window, normalized, onesided)
+    end
+
+    def clamp(tensor, min, max)
+      tensor = _clamp_min(tensor, min)
+      _clamp_max(tensor, max)
+    end
+
     private
 
     def to_ivalue(obj)
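
The new `Torch.clamp` simply chains the generated `_clamp_min` and `_clamp_max` bindings, and `Torch.stft` pads the signal before delegating to `_stft`. A small hedged sketch of `clamp` (values illustrative; `stft` output is omitted because its layout depends on the LibTorch build):

```ruby
require "torch"

t = Torch.tensor([-1.5, 0.2, 3.7])
p Torch.clamp(t, 0, 1).to_a # => [0.0, 0.2, 1.0]

# the in-place tensor variant from earlier releases still exists
t.clamp!(0, 1)
p t.to_a # => [0.0, 0.2, 1.0]
```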
@@ -7,25 +7,26 @@ module Torch
 
       def download_url_to_file(url, dst)
         uri = URI(url)
-        tmp = "#{Dir.tmpdir}/#{Time.now.to_f}" # TODO better name
+        tmp = nil
         location = nil
 
+        puts "Downloading #{url}..."
         Net::HTTP.start(uri.host, uri.port, use_ssl: uri.scheme == "https") do |http|
           request = Net::HTTP::Get.new(uri)
 
-          puts "Downloading #{url}..."
-          File.open(tmp, "wb") do |f|
-            http.request(request) do |response|
-              case response
-              when Net::HTTPRedirection
-                location = response["location"]
-              when Net::HTTPSuccess
+          http.request(request) do |response|
+            case response
+            when Net::HTTPRedirection
+              location = response["location"]
+            when Net::HTTPSuccess
+              tmp = "#{Dir.tmpdir}/#{Time.now.to_f}" # TODO better name
+              File.open(tmp, "wb") do |f|
                 response.read_body do |chunk|
                   f.write(chunk)
                 end
-            else
-              raise Error, "Bad response"
               end
+            else
+              raise Error, "Bad response"
             end
           end
         end
@@ -1,10 +1,14 @@
 module Torch
   module Native
     class Function
-      attr_reader :function
+      attr_reader :function, :tensor_options
 
       def initialize(function)
         @function = function
+
+        tensor_options_str = ", *, ScalarType? dtype=None, Layout? layout=None, Device? device=None, bool? pin_memory=None)"
+        @tensor_options = @function["func"].include?(tensor_options_str)
+        @function["func"].sub!(tensor_options_str, ")")
       end
 
      def func
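
The constructor change above detects native schemas that end with the shared TensorOptions parameters and strips them, so the generator can append a single `options` argument instead. A standalone sketch of that string handling (the `arange` schema below is an illustrative example of the format, not parsed from native_functions.yaml):

```ruby
tensor_options_str = ", *, ScalarType? dtype=None, Layout? layout=None, Device? device=None, bool? pin_memory=None)"

func = "arange(Scalar end, *, ScalarType? dtype=None, Layout? layout=None, Device? device=None, bool? pin_memory=None) -> Tensor"

tensor_options = func.include?(tensor_options_str) # does the schema take TensorOptions?
func = func.sub(tensor_options_str, ")")           # strip them from the parsed signature

p tensor_options # => true
p func           # => "arange(Scalar end) -> Tensor"
```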
@@ -33,30 +33,14 @@ module Torch
         f.args.any? do |a|
           a[:type].include?("?") && !["Tensor?", "Generator?", "int?", "ScalarType?", "Tensor?[]"].include?(a[:type]) ||
             skip_args.any? { |sa| a[:type].include?(sa) } ||
+            # call to 'range' is ambiguous
+            f.cpp_name == "_range" ||
             # native_functions.yaml is missing size argument for normal
             # https://pytorch.org/cppdocs/api/function_namespacetorch_1a80253fe5a3ded4716ec929a348adb4b9.html
             (f.base_name == "normal" && !f.out?)
         end
       end
 
-      # generate additional functions for optional arguments
-      # there may be a better way to do this
-      optional_functions, functions = functions.partition { |f| f.args.any? { |a| a[:type] == "int?" } }
-      optional_functions.each do |f|
-        next if f.ruby_name == "cross"
-        next if f.ruby_name.start_with?("avg_pool") && f.out?
-
-        opt_args = f.args.select { |a| a[:type] == "int?" }
-        if opt_args.size == 1
-          sep = f.name.include?(".") ? "_" : "."
-          f1 = Function.new(f.function.merge("func" => f.func.sub("(", "#{sep}#{opt_args.first[:name]}(").gsub("int?", "int")))
-          # TODO only remove some arguments
-          f2 = Function.new(f.function.merge("func" => f.func.sub(/, int\?.+\) ->/, ") ->")))
-          functions << f1
-          functions << f2
-        end
-      end
-
       # todo_functions.each do |f|
       #   puts f.func
       #   puts
@@ -97,7 +81,8 @@ void add_%{type}_functions(Module m) {
 
     cpp_defs = []
     functions.sort_by(&:cpp_name).each do |func|
-      fargs = func.args #.select { |a| a[:type] != "Generator?" }
+      fargs = func.args.dup #.select { |a| a[:type] != "Generator?" }
+      fargs << {name: "options", type: "TensorOptions"} if func.tensor_options
 
       cpp_args = []
       fargs.each do |a|
@@ -109,7 +94,7 @@ void add_%{type}_functions(Module m) {
           # TODO better signature
           "OptionalTensor"
         when "ScalarType?"
-          "OptionalScalarType"
+          "torch::optional<ScalarType>"
         when "Tensor[]"
           "TensorList"
         when "Tensor?[]"
@@ -117,6 +102,8 @@ void add_%{type}_functions(Module m) {
           "TensorList"
         when "int"
           "int64_t"
+        when "int?"
+          "torch::optional<int64_t>"
         when "float"
           "double"
         when /\Aint\[/
@@ -125,6 +112,8 @@ void add_%{type}_functions(Module m) {
           "Tensor &"
         when "str"
           "std::string"
+        when "TensorOptions"
+          "const torch::TensorOptions &"
         else
           a[:type]
         end
@@ -83,6 +83,8 @@ module Torch
           else
             v.is_a?(Integer)
           end
+        when "int?"
+          v.is_a?(Integer) || v.nil?
         when "float"
           v.is_a?(Numeric)
         when /int\[.*\]/
@@ -126,9 +128,11 @@ module Torch
       end
 
       func = candidates.first
+      args = func.args.map { |a| final_values[a[:name]] }
+      args << TensorOptions.new.dtype(6) if func.tensor_options
       {
         name: func.cpp_name,
-        args: func.args.map { |a| final_values[a[:name]] }
+        args: args
       }
     end
   end
@@ -373,7 +373,8 @@ module Torch
       end
 
       # weight and input swapped
-      Torch.embedding_bag(weight, input, offsets, scale_grad_by_freq, mode_enum, sparse, per_sample_weights)
+      ret, _, _, _ = Torch.embedding_bag(weight, input, offsets, scale_grad_by_freq, mode_enum, sparse, per_sample_weights)
+      ret
     end
 
     # distance functions
@@ -426,6 +427,9 @@ module Torch
     end
 
     def mse_loss(input, target, reduction: "mean")
+      if target.size != input.size
+        warn "Using a target size (#{target.size}) that is different to the input size (#{input.size}). This will likely lead to incorrect results due to broadcasting. Please ensure they have the same size."
+      end
       NN.mse_loss(input, target, reduction)
     end
 
@@ -103,8 +103,9 @@ module Torch
       Torch.empty(0, dtype: dtype)
     end
 
-    def backward(gradient = nil)
-      _backward(gradient)
+    def backward(gradient = nil, retain_graph: nil, create_graph: false)
+      retain_graph = create_graph if retain_graph.nil?
+      _backward(gradient, retain_graph, create_graph)
     end
 
     # TODO read directly from memory
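
With the wrapper above, `backward` now forwards `retain_graph` and `create_graph` to the C++ binding, and `retain_graph` defaults to `create_graph`, matching PyTorch. A hedged sketch that backpropagates twice through the same graph and then resets the gradient with the new `grad=` writer (values illustrative):

```ruby
require "torch"

x = Torch.tensor([3.0], requires_grad: true)
y = x * x

# keep the graph alive so backward can run a second time
y.backward(Torch.ones_like(y), retain_graph: true)
y.backward(Torch.ones_like(y))
p x.grad.to_a # => [12.0] (two accumulated passes of dy/dx = 2x)

# the new grad= writer can overwrite the accumulated gradient
x.grad = Torch.zeros(1)
p x.grad.to_a # => [0.0]
```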
@@ -187,49 +188,15 @@ module Torch
     # based on python_variable_indexing.cpp and
     # https://pytorch.org/cppdocs/notes/tensor_indexing.html
     def [](*indexes)
-      result = self
-      dim = 0
-      indexes.each do |index|
-        if index.is_a?(Numeric)
-          result = result._select_int(dim, index)
-        elsif index.is_a?(Range)
-          finish = index.end
-          finish += 1 unless index.exclude_end?
-          result = result._slice_tensor(dim, index.begin, finish, 1)
-          dim += 1
-        elsif index.is_a?(Tensor)
-          result = result.index([index])
-        elsif index.nil?
-          result = result.unsqueeze(dim)
-          dim += 1
-        elsif index == true
-          result = result.unsqueeze(dim)
-          # TODO handle false
-        else
-          raise Error, "Unsupported index type: #{index.class.name}"
-        end
-      end
-      result
+      _index(tensor_indexes(indexes))
     end
 
     # based on python_variable_indexing.cpp and
     # https://pytorch.org/cppdocs/notes/tensor_indexing.html
-    def []=(index, value)
+    def []=(*indexes, value)
       raise ArgumentError, "Tensor does not support deleting items" if value.nil?
-
       value = Torch.tensor(value, dtype: dtype) unless value.is_a?(Tensor)
-
-      if index.is_a?(Numeric)
-        index_put!([Torch.tensor(index)], value)
-      elsif index.is_a?(Range)
-        finish = index.end
-        finish += 1 unless index.exclude_end?
-        _slice_tensor(0, index.begin, finish, 1).copy!(value)
-      elsif index.is_a?(Tensor)
-        index_put!([index], value)
-      else
-        raise Error, "Unsupported index type: #{index.class.name}"
-      end
+      _index_put_custom(tensor_indexes(indexes), value)
     end
 
     # native functions that need manually defined
@@ -243,13 +210,13 @@ module Torch
       end
     end
 
-    # native functions overlap, so need to handle manually
+    # parser can't handle overlap, so need to handle manually
    def random!(*args)
      case args.size
      when 1
        _random__to(*args)
      when 2
-        _random__from_to(*args)
+        _random__from(*args)
      else
        _random_(*args)
      end
@@ -259,5 +226,32 @@ module Torch
       _clamp_min_(min)
       _clamp_max_(max)
     end
+
+    private
+
+    def tensor_indexes(indexes)
+      indexes.map do |index|
+        case index
+        when Integer
+          TensorIndex.integer(index)
+        when Range
+          finish = index.end
+          if finish == -1 && !index.exclude_end?
+            finish = nil
+          else
+            finish += 1 unless index.exclude_end?
+          end
+          TensorIndex.slice(index.begin, finish)
+        when Tensor
+          TensorIndex.tensor(index)
+        when nil
+          TensorIndex.none
+        when true, false
+          TensorIndex.boolean(index)
+        else
+          raise Error, "Unsupported index type: #{index.class.name}"
+        end
+      end
+    end
   end
 end
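
The `[]` and `[]=` rewrite above now routes every index through `tensor_indexes` and the C++ `TensorIndex` API instead of chaining `_select_int`/`_slice_tensor`. A short hedged sketch of the supported index types (output values illustrative):

```ruby
require "torch"

t = Torch.arange(12).reshape([3, 4])

p t[0].to_a       # an Integer index selects a row
p t[0, 1..2].to_a # Ranges become slices
p t[nil, 0].shape # nil inserts a new axis, like None in Python
p t[0, -1].item   # negative indexes count from the end

t[0, 0] = 99      # []= now accepts the same multi-index form
p t[0, 0].item    # prints 99 (as a float for a float tensor)
```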
@@ -0,0 +1,23 @@
+module Torch
+  module Utils
+    module Data
+      class << self
+        def random_split(dataset, lengths)
+          if lengths.sum != dataset.length
+            raise ArgumentError, "Sum of input lengths does not equal the length of the input dataset!"
+          end
+
+          indices = Torch.randperm(lengths.sum).to_a
+          _accumulate(lengths).zip(lengths).map { |offset, length| Subset.new(dataset, indices[(offset - length)...offset]) }
+        end
+
+        private
+
+        def _accumulate(iterable)
+          sum = 0
+          iterable.map { |x| sum += x }
+        end
+      end
+    end
+  end
+end
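
`random_split` shuffles indices with `Torch.randperm` (which is also why 0.3.5 pins randperm's default dtype to `:int64`) and wraps each partition in a `Subset`. A hedged sketch with a tiny hand-rolled dataset (the `ToyDataset` class is illustrative; any object responding to `[]` and `length` should work):

```ruby
require "torch"

# minimal in-memory dataset for illustration
class ToyDataset
  def initialize(tensor)
    @tensor = tensor
  end

  def [](i)
    @tensor[i]
  end

  def length
    @tensor.shape[0]
  end
end

dataset = ToyDataset.new(Torch.arange(10))
train_set, test_set = Torch::Utils::Data.random_split(dataset, [8, 2])

p train_set.length          # => 8
p test_set.to_a.map(&:item) # two randomly chosen elements
```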
@@ -6,10 +6,22 @@ module Torch
 
       attr_reader :dataset
 
-      def initialize(dataset, batch_size: 1, shuffle: false)
+      def initialize(dataset, batch_size: 1, shuffle: false, collate_fn: nil)
         @dataset = dataset
         @batch_size = batch_size
         @shuffle = shuffle
+
+        @batch_sampler = nil
+
+        if collate_fn.nil?
+          if auto_collation?
+            collate_fn = method(:default_collate)
+          else
+            collate_fn = method(:default_convert)
+          end
+        end
+
+        @collate_fn = collate_fn
       end
 
       def each
@@ -25,8 +37,8 @@ module Torch
         end
 
         indexes.each_slice(@batch_size) do |idx|
-          batch = idx.map { |i| @dataset[i] }
-          yield collate(batch)
+          # TODO improve performance
+          yield @collate_fn.call(idx.map { |i| @dataset[i] })
         end
       end
 
@@ -36,7 +48,7 @@ module Torch
 
       private
 
-      def collate(batch)
+      def default_convert(batch)
         elem = batch[0]
         case elem
         when Tensor
@@ -44,11 +56,15 @@ module Torch
         when Integer
           Torch.tensor(batch)
         when Array
-          batch.transpose.map { |v| collate(v) }
+          batch.transpose.map { |v| default_convert(v) }
         else
-          raise NotImpelmentYet
+          raise NotImplementedYet
         end
       end
+
+      def auto_collation?
+        !@batch_sampler.nil?
+      end
     end
   end
 end
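
With the change above, `DataLoader` accepts any callable as `collate_fn` and falls back to `default_convert` when none is given. A hedged sketch that stacks only the feature tensors of each batch (shapes and values are illustrative):

```ruby
require "torch"

x = Torch.randn(6, 2)
y = Torch.tensor([0, 1, 0, 1, 0, 1])
dataset = Torch::Utils::Data::TensorDataset.new(x, y)

# the collate_fn receives the raw array of samples for one batch
stack_features = ->(batch) { Torch.stack(batch.map { |xb, _yb| xb }) }

loader = Torch::Utils::Data::DataLoader.new(dataset, batch_size: 2, collate_fn: stack_features)
loader.each do |batch|
  p batch.shape # => [2, 2]
end
```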
@@ -0,0 +1,25 @@
+module Torch
+  module Utils
+    module Data
+      class Subset < Dataset
+        def initialize(dataset, indices)
+          @dataset = dataset
+          @indices = indices
+        end
+
+        def [](idx)
+          @dataset[@indices[idx]]
+        end
+
+        def length
+          @indices.length
+        end
+        alias_method :size, :length
+
+        def to_a
+          @indices.map { |i| @dataset[i] }
+        end
+      end
+    end
+  end
+end
@@ -1,3 +1,3 @@
 module Torch
-  VERSION = "0.3.0"
+  VERSION = "0.3.5"
 end
metadata CHANGED
@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: torch-rb
 version: !ruby/object:Gem::Version
-  version: 0.3.0
+  version: 0.3.5
 platform: ruby
 authors:
 - Andrew Kane
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2020-07-29 00:00:00.000000000 Z
+date: 2020-09-04 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: rice
@@ -259,8 +259,10 @@ files:
 - lib/torch/optim/rprop.rb
 - lib/torch/optim/sgd.rb
 - lib/torch/tensor.rb
+- lib/torch/utils/data.rb
 - lib/torch/utils/data/data_loader.rb
 - lib/torch/utils/data/dataset.rb
+- lib/torch/utils/data/subset.rb
 - lib/torch/utils/data/tensor_dataset.rb
 - lib/torch/version.rb
 homepage: https://github.com/ankane/torch.rb