torch-rb 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (142)
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +35 -0
  3. data/LICENSE.txt +46 -22
  4. data/README.md +18 -6
  5. data/ext/torch/ext.cpp +148 -369
  6. data/ext/torch/extconf.rb +6 -0
  7. data/ext/torch/nn_functions.cpp +615 -0
  8. data/ext/torch/nn_functions.hpp +6 -0
  9. data/ext/torch/templates.cpp +55 -0
  10. data/ext/torch/templates.hpp +242 -0
  11. data/ext/torch/tensor_functions.cpp +1920 -0
  12. data/ext/torch/tensor_functions.hpp +6 -0
  13. data/ext/torch/torch_functions.cpp +2975 -0
  14. data/ext/torch/torch_functions.hpp +6 -0
  15. data/lib/torch.rb +240 -131
  16. data/lib/torch/ext.bundle +0 -0
  17. data/lib/torch/inspector.rb +27 -22
  18. data/lib/torch/native/dispatcher.rb +48 -0
  19. data/lib/torch/native/function.rb +109 -0
  20. data/lib/torch/native/generator.rb +168 -0
  21. data/lib/torch/native/native_functions.yaml +6837 -0
  22. data/lib/torch/native/parser.rb +134 -0
  23. data/lib/torch/nn/alpha_dropout.rb +9 -0
  24. data/lib/torch/nn/avg_pool1d.rb +18 -0
  25. data/lib/torch/nn/avg_pool2d.rb +19 -0
  26. data/lib/torch/nn/avg_pool3d.rb +19 -0
  27. data/lib/torch/nn/avg_poolnd.rb +9 -0
  28. data/lib/torch/nn/batch_norm.rb +75 -0
  29. data/lib/torch/nn/batch_norm1d.rb +11 -0
  30. data/lib/torch/nn/batch_norm2d.rb +11 -0
  31. data/lib/torch/nn/batch_norm3d.rb +11 -0
  32. data/lib/torch/nn/bce_loss.rb +13 -0
  33. data/lib/torch/nn/bce_with_logits_loss.rb +15 -0
  34. data/lib/torch/nn/bilinear.rb +38 -0
  35. data/lib/torch/nn/constant_pad1d.rb +10 -0
  36. data/lib/torch/nn/constant_pad2d.rb +10 -0
  37. data/lib/torch/nn/constant_pad3d.rb +10 -0
  38. data/lib/torch/nn/constant_padnd.rb +18 -0
  39. data/lib/torch/nn/conv1d.rb +22 -0
  40. data/lib/torch/nn/conv2d.rb +16 -38
  41. data/lib/torch/nn/conv3d.rb +22 -0
  42. data/lib/torch/nn/convnd.rb +41 -0
  43. data/lib/torch/nn/cosine_embedding_loss.rb +14 -0
  44. data/lib/torch/nn/cosine_similarity.rb +15 -0
  45. data/lib/torch/nn/cross_entropy_loss.rb +14 -0
  46. data/lib/torch/nn/ctc_loss.rb +15 -0
  47. data/lib/torch/nn/dropout.rb +9 -0
  48. data/lib/torch/nn/dropout2d.rb +9 -0
  49. data/lib/torch/nn/dropout3d.rb +9 -0
  50. data/lib/torch/nn/dropoutnd.rb +15 -0
  51. data/lib/torch/nn/embedding.rb +52 -0
  52. data/lib/torch/nn/embedding_bag.rb +34 -0
  53. data/lib/torch/nn/feature_alpha_dropout.rb +9 -0
  54. data/lib/torch/nn/fold.rb +20 -0
  55. data/lib/torch/nn/functional.rb +411 -22
  56. data/lib/torch/nn/group_norm.rb +36 -0
  57. data/lib/torch/nn/gru.rb +49 -0
  58. data/lib/torch/nn/hardshrink.rb +18 -0
  59. data/lib/torch/nn/hinge_embedding_loss.rb +14 -0
  60. data/lib/torch/nn/identity.rb +14 -0
  61. data/lib/torch/nn/init.rb +58 -1
  62. data/lib/torch/nn/instance_norm.rb +20 -0
  63. data/lib/torch/nn/instance_norm1d.rb +18 -0
  64. data/lib/torch/nn/instance_norm2d.rb +11 -0
  65. data/lib/torch/nn/instance_norm3d.rb +11 -0
  66. data/lib/torch/nn/kl_div_loss.rb +13 -0
  67. data/lib/torch/nn/l1_loss.rb +13 -0
  68. data/lib/torch/nn/layer_norm.rb +35 -0
  69. data/lib/torch/nn/leaky_relu.rb +20 -0
  70. data/lib/torch/nn/linear.rb +12 -11
  71. data/lib/torch/nn/local_response_norm.rb +21 -0
  72. data/lib/torch/nn/log_sigmoid.rb +9 -0
  73. data/lib/torch/nn/log_softmax.rb +14 -0
  74. data/lib/torch/nn/loss.rb +10 -0
  75. data/lib/torch/nn/lp_pool1d.rb +9 -0
  76. data/lib/torch/nn/lp_pool2d.rb +9 -0
  77. data/lib/torch/nn/lp_poolnd.rb +22 -0
  78. data/lib/torch/nn/lstm.rb +66 -0
  79. data/lib/torch/nn/margin_ranking_loss.rb +14 -0
  80. data/lib/torch/nn/max_pool1d.rb +9 -0
  81. data/lib/torch/nn/max_pool2d.rb +9 -0
  82. data/lib/torch/nn/max_pool3d.rb +9 -0
  83. data/lib/torch/nn/max_poolnd.rb +19 -0
  84. data/lib/torch/nn/max_unpool1d.rb +16 -0
  85. data/lib/torch/nn/max_unpool2d.rb +16 -0
  86. data/lib/torch/nn/max_unpool3d.rb +16 -0
  87. data/lib/torch/nn/max_unpoolnd.rb +9 -0
  88. data/lib/torch/nn/module.rb +201 -20
  89. data/lib/torch/nn/mse_loss.rb +2 -2
  90. data/lib/torch/nn/multi_label_margin_loss.rb +13 -0
  91. data/lib/torch/nn/multi_label_soft_margin_loss.rb +13 -0
  92. data/lib/torch/nn/multi_margin_loss.rb +17 -0
  93. data/lib/torch/nn/nll_loss.rb +14 -0
  94. data/lib/torch/nn/pairwise_distance.rb +16 -0
  95. data/lib/torch/nn/parameter.rb +2 -2
  96. data/lib/torch/nn/poisson_nll_loss.rb +16 -0
  97. data/lib/torch/nn/prelu.rb +19 -0
  98. data/lib/torch/nn/reflection_pad1d.rb +10 -0
  99. data/lib/torch/nn/reflection_pad2d.rb +10 -0
  100. data/lib/torch/nn/reflection_padnd.rb +13 -0
  101. data/lib/torch/nn/relu.rb +8 -3
  102. data/lib/torch/nn/replication_pad1d.rb +10 -0
  103. data/lib/torch/nn/replication_pad2d.rb +10 -0
  104. data/lib/torch/nn/replication_pad3d.rb +10 -0
  105. data/lib/torch/nn/replication_padnd.rb +13 -0
  106. data/lib/torch/nn/rnn.rb +22 -0
  107. data/lib/torch/nn/rnn_base.rb +198 -0
  108. data/lib/torch/nn/sequential.rb +1 -10
  109. data/lib/torch/nn/sigmoid.rb +9 -0
  110. data/lib/torch/nn/smooth_l1_loss.rb +13 -0
  111. data/lib/torch/nn/soft_margin_loss.rb +13 -0
  112. data/lib/torch/nn/softmax.rb +18 -0
  113. data/lib/torch/nn/softmax2d.rb +10 -0
  114. data/lib/torch/nn/softmin.rb +14 -0
  115. data/lib/torch/nn/softplus.rb +19 -0
  116. data/lib/torch/nn/softshrink.rb +18 -0
  117. data/lib/torch/nn/softsign.rb +9 -0
  118. data/lib/torch/nn/tanh.rb +9 -0
  119. data/lib/torch/nn/tanhshrink.rb +9 -0
  120. data/lib/torch/nn/triplet_margin_loss.rb +18 -0
  121. data/lib/torch/nn/unfold.rb +19 -0
  122. data/lib/torch/nn/utils.rb +25 -0
  123. data/lib/torch/nn/weighted_loss.rb +10 -0
  124. data/lib/torch/nn/zero_pad2d.rb +9 -0
  125. data/lib/torch/optim/adadelta.rb +57 -0
  126. data/lib/torch/optim/adagrad.rb +71 -0
  127. data/lib/torch/optim/adam.rb +81 -0
  128. data/lib/torch/optim/adamax.rb +68 -0
  129. data/lib/torch/optim/adamw.rb +82 -0
  130. data/lib/torch/optim/asgd.rb +65 -0
  131. data/lib/torch/optim/lr_scheduler/lr_scheduler.rb +33 -0
  132. data/lib/torch/optim/lr_scheduler/step_lr.rb +17 -0
  133. data/lib/torch/optim/optimizer.rb +56 -0
  134. data/lib/torch/optim/rmsprop.rb +76 -0
  135. data/lib/torch/optim/rprop.rb +68 -0
  136. data/lib/torch/optim/sgd.rb +48 -16
  137. data/lib/torch/random.rb +10 -0
  138. data/lib/torch/tensor.rb +71 -30
  139. data/lib/torch/utils/data/data_loader.rb +10 -4
  140. data/lib/torch/utils/data/tensor_dataset.rb +3 -0
  141. data/lib/torch/version.rb +1 -1
  142. metadata +123 -6
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 30089078de4039df111087e5c27e0cb10d6f36398c0e8d5cc774e9b642a8e133
-  data.tar.gz: 89eb9e183b395dd67cd9cf228749cf26402993bb561de973f1ba7438bc372b04
+  metadata.gz: 51bcc56112e13ba206402857b379aee0df4c7695f75af354e833760adec67756
+  data.tar.gz: b2ff24940e4c219d88c5a001d4e8b4e44d0e55a35fc266989f0196e696d15bc8
 SHA512:
-  metadata.gz: 027a069b00ac1329c007ddaf471a21b57a82a823ad974a937f832d17720b8e26474c64c79e9a29ec71bac433abb3d74d6a7cf407f0a983bb3c0cafb5b5c7532f
-  data.tar.gz: 6d7ef10b53db0df39eda13d07aa9b52b4afac0965674919b5cc517e7b53f59a9010cb647e50d62bc06154f7d8f3ef632d5897e4f7774372d7ab1b44b2cb6ca82
+  metadata.gz: 95506016db5598333f0cb99a435d29951342af91f75ae4b1f01ef11df81891738888b90c7d27317071ad00bd9b81714cf41c0ea635c2578fd756c388b5e1da7f
+  data.tar.gz: 053c9c75e66fe54902f07413687deb6996afc7ae88217bd5dcc852ca59d535c663bb9fb3aed28b20dba953a42e714410867dbd6ecd747f96fe8e8dfd81da8d6c
data/CHANGELOG.md CHANGED
@@ -1,3 +1,38 @@
+## 0.1.7 (2020-01-10)
+
+- Fixed installation error with Ruby 2.7
+
+## 0.1.6 (2019-12-09)
+
+- Added recurrent layers
+- Added more pooling layers
+- Added normalization layers
+
+## 0.1.5 (2019-12-06)
+
+- Added many more functions
+- Added tensor classes - `FloatTensor`, `LongTensor`, etc
+- Improved modules
+
+## 0.1.4 (2019-12-01)
+
+- Added distance functions
+- Added more activations
+- Added more linear layers
+- Added more loss functions
+- Added more init methods
+- Added support for tensor assignment
+
+## 0.1.3 (2019-11-30)
+
+- Changed to BSD 3-Clause license to match PyTorch
+- Added many optimizers
+- Added `StepLR` learning rate scheduler
+- Added dropout
+- Added embedding
+- Added support for `bool` type
+- Improved performance of `from_numo`
+
 ## 0.1.2 (2019-11-27)
 
 - Added SGD optimizer
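Several of these entries are new API surface. As a rough sketch of how the optimizers and the `StepLR` scheduler added in 0.1.3 fit together — assuming PyTorch-style signatures; the model, data, and hyperparameters below are illustrative, not taken from the package:

```ruby
require "torch"

# Hypothetical training loop; model and data are placeholders.
model = Torch::NN::Linear.new(10, 1)
optimizer = Torch::Optim::SGD.new(model.parameters, lr: 0.1)
# StepLR decays the learning rate by gamma every step_size epochs.
scheduler = Torch::Optim::LRScheduler::StepLR.new(optimizer, step_size: 5, gamma: 0.1)

x = Torch.rand(8, 10)
y = Torch.rand(8, 1)

10.times do
  optimizer.zero_grad
  loss = Torch::NN::Functional.mse_loss(model.call(x), y)
  loss.backward
  optimizer.step   # update parameters from the accumulated gradients
  scheduler.step   # advance the learning-rate schedule once per epoch
end
```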
data/LICENSE.txt CHANGED
@@ -1,22 +1,46 @@
-Copyright (c) 2019 Andrew Kane
-
-MIT License
-
-Permission is hereby granted, free of charge, to any person obtaining
-a copy of this software and associated documentation files (the
-"Software"), to deal in the Software without restriction, including
-without limitation the rights to use, copy, modify, merge, publish,
-distribute, sublicense, and/or sell copies of the Software, and to
-permit persons to whom the Software is furnished to do so, subject to
-the following conditions:
-
-The above copyright notice and this permission notice shall be
-included in all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
-EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
-MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
-NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
-LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
-OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
-WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+BSD 3-Clause License
+
+From Torch-rb:
+
+Copyright (c) 2019- Andrew Kane
+
+From PyTorch (for ported code):
+
+Copyright (c) 2016- Facebook, Inc (Adam Paszke)
+Copyright (c) 2014- Facebook, Inc (Soumith Chintala)
+Copyright (c) 2011-2014 Idiap Research Institute (Ronan Collobert)
+Copyright (c) 2012-2014 Deepmind Technologies (Koray Kavukcuoglu)
+Copyright (c) 2011-2012 NEC Laboratories America (Koray Kavukcuoglu)
+Copyright (c) 2011-2013 NYU (Clement Farabet)
+Copyright (c) 2006-2010 NEC Laboratories America (Ronan Collobert, Leon Bottou, Iain Melvin, Jason Weston)
+Copyright (c) 2006 Idiap Research Institute (Samy Bengio)
+Copyright (c) 2001-2004 Idiap Research Institute (Ronan Collobert, Samy Bengio, Johnny Mariethoz)
+
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright
+   notice, this list of conditions and the following disclaimer.
+
+2. Redistributions in binary form must reproduce the above copyright
+   notice, this list of conditions and the following disclaimer in the
+   documentation and/or other materials provided with the distribution.
+
+3. Neither the names of Facebook, Deepmind Technologies, NYU, NEC Laboratories America
+   and IDIAP Research Institute nor the names of its contributors may be
+   used to endorse or promote products derived from this software without
+   specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+POSSIBILITY OF SUCH DAMAGE.
data/README.md CHANGED
@@ -20,6 +20,8 @@ Add this line to your application’s Gemfile:
 gem 'torch-rb'
 ```
 
+It can take a few minutes to compile the extension.
+
 ## Getting Started
 
 This library follows the [PyTorch API](https://pytorch.org/docs/stable/torch.html). There are a few changes to make it more Ruby-like:
@@ -28,9 +30,11 @@ This library follows the [PyTorch API](https://pytorch.org/docs/stable/torch.htm
 - Methods that return booleans use `?` instead of `is_` (`tensor?` instead of `is_tensor`)
 - Numo is used instead of NumPy (`x.numo` instead of `x.numpy()`)
 
-Many methods and options are missing at the moment. PRs welcome!
+Some methods and options are missing at the moment. PRs welcome!
+
+## Tutorial
 
-Some examples below are from [Deep Learning with PyTorch: A 60 Minutes Blitz](https://pytorch.org/tutorials/beginner/deep_learning_60min_blitz.html).
+Some examples below are from [Deep Learning with PyTorch: A 60 Minutes Blitz](https://pytorch.org/tutorials/beginner/deep_learning_60min_blitz.html)
 
 ### Tensors
 
@@ -145,7 +149,7 @@ Convert a Numo array to a tensor
 
 ```ruby
 b = Numo::NArray.cast([1, 2, 3])
-Torch.from_numpy(b)
+Torch.from_numo(b)
 ```
 
 ### Autograd
@@ -180,10 +184,10 @@ Stop autograd from tracking history
 
 ```ruby
 x.requires_grad # true
-(x ** 2).requires_grad # true
+(x**2).requires_grad # true
 
 Torch.no_grad do
-  (x ** 2).requires_grad # false
+  (x**2).requires_grad # false
 end
 ```
 
@@ -359,6 +363,14 @@ Here’s a list of functions to create tensors (descriptions from the [C++ docs]
 Torch.zeros(3) # tensor([0, 0, 0])
 ```
 
+## Examples
+
+Here are a few full examples:
+
+- [Image classification with MNIST](examples/mnist) ([日本語版](https://qiita.com/kojix2/items/c19c36dc1bf73ea93409))
+- [Collaborative filtering with MovieLens](examples/movielens)
+- [Sequence models and word embeddings](examples/nlp)
+
 ## LibTorch Installation
 
 [Download LibTorch](https://pytorch.org/). For Linux, use the `cxx11 ABI` version. Then run:
@@ -405,7 +417,7 @@ To get started with development:
 git clone https://github.com/ankane/torch-rb.git
 cd torch-rb
 bundle install
-bundle exec rake compile
+bundle exec rake compile -- --with-torch-dir=/path/to/libtorch
 bundle exec rake test
 ```
 
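Two of the README fixes above are behavioral: `Torch.from_numpy` was corrected to `Torch.from_numo`, and the compile step now takes the LibTorch path. A quick sketch of the Numo round trip, assuming the numo-narray gem is installed alongside torch-rb:

```ruby
require "torch"
require "numo/narray"

b = Numo::NArray.cast([1, 2, 3])
t = Torch.from_numo(b)  # was documented as from_numpy; the actual method is from_numo
t.numo                  # convert the tensor back to a Numo array
```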
data/ext/torch/ext.cpp CHANGED
@@ -6,95 +6,29 @@
 #include <rice/Class.hpp>
 #include <rice/Constructor.hpp>
 
-using namespace Rice;
-
-template<>
-inline
-long long from_ruby<long long>(Object x)
-{
-  return NUM2LL(x);
-}
+#include "templates.hpp"
 
-template<>
-inline
-Object to_ruby<long long>(long long const & x)
-{
-  return LL2NUM(x);
-}
+// generated with:
+// rake generate:functions
+#include "torch_functions.hpp"
+#include "tensor_functions.hpp"
+#include "nn_functions.hpp"
 
-template<>
-inline
-unsigned long long from_ruby<unsigned long long>(Object x)
-{
-  return NUM2ULL(x);
-}
-
-template<>
-inline
-Object to_ruby<unsigned long long>(unsigned long long const & x)
-{
-  return ULL2NUM(x);
-}
-
-template<>
-inline
-short from_ruby<short>(Object x)
-{
-  return NUM2SHORT(x);
-}
-
-template<>
-inline
-Object to_ruby<short>(short const & x)
-{
-  return INT2NUM(x);
-}
-
-template<>
-inline
-unsigned short from_ruby<unsigned short>(Object x)
-{
-  return NUM2USHORT(x);
-}
+using namespace Rice;
 
-template<>
-inline
-Object to_ruby<unsigned short>(unsigned short const & x)
+extern "C"
+void Init_ext()
 {
-  return UINT2NUM(x);
-}
+  Module rb_mTorch = define_module("Torch");
+  add_torch_functions(rb_mTorch);
 
-// need to wrap torch::IntArrayRef() since
-// it doesn't own underlying data
-class IntArrayRef {
-  std::vector<int64_t> vec;
-  public:
-    IntArrayRef(Object o) {
-      Array a = Array(o);
-      for (size_t i = 0; i < a.size(); i++) {
-        vec.push_back(from_ruby<int64_t>(a[i]));
-      }
-    }
-    operator torch::IntArrayRef() {
-      return torch::IntArrayRef(vec);
-    }
-};
+  Class rb_cTensor = define_class_under<torch::Tensor>(rb_mTorch, "Tensor");
+  add_tensor_functions(rb_cTensor);
 
-template<>
-inline
-IntArrayRef from_ruby<IntArrayRef>(Object x)
-{
-  return IntArrayRef(x);
-}
+  Module rb_mNN = define_module_under(rb_mTorch, "NN");
+  add_nn_functions(rb_mNN);
 
-// for now
-typedef float Scalar;
-
-extern "C"
-void Init_ext()
-{
-  Module rb_mTorch = define_module("Torch")
-    .define_singleton_method(
+  rb_mTorch.define_singleton_method(
       "grad_enabled?",
       *[]() {
        return torch::GradMode::is_enabled();
@@ -104,11 +38,6 @@ void Init_ext()
       *[](bool enabled) {
        torch::GradMode::set_enabled(enabled);
       })
-    .define_singleton_method(
-      "floating_point?",
-      *[](torch::Tensor& input) {
-        return torch::is_floating_point(input);
-      })
     .define_singleton_method(
       "manual_seed",
       *[](uint64_t seed) {
@@ -177,321 +106,100 @@ void Init_ext()
       })
     // begin operations
     .define_singleton_method(
-      "_mean",
-      *[](torch::Tensor& input) {
-        return torch::mean(input);
-      })
-    .define_singleton_method(
-      "_mean_dim",
-      *[](torch::Tensor& input, int64_t dim, bool keepdim) {
-        return torch::mean(input, dim, keepdim);
-      })
-    .define_singleton_method(
-      "_sum",
-      *[](torch::Tensor& input) {
-        return torch::sum(input);
-      })
-    .define_singleton_method(
-      "_sum_dim",
-      *[](torch::Tensor& input, int64_t dim, bool keepdim) {
-        return torch::sum(input, dim, keepdim);
-      })
-    .define_singleton_method(
-      "_argmax",
-      *[](torch::Tensor& input) {
-        return torch::argmax(input);
-      })
-    .define_singleton_method(
-      "_argmax_dim",
-      *[](torch::Tensor& input, int64_t dim, bool keepdim) {
-        return torch::argmax(input, dim, keepdim);
-      })
-    .define_singleton_method(
-      "_norm",
-      *[](torch::Tensor& input) {
-        return torch::norm(input);
-      })
-    .define_singleton_method(
-      "_min",
-      *[](torch::Tensor& input) {
-        return torch::min(input);
-      })
-    .define_singleton_method(
-      "_max",
-      *[](torch::Tensor& input) {
-        return torch::max(input);
-      })
-    .define_singleton_method(
-      "_exp",
-      *[](torch::Tensor& input) {
-        return torch::exp(input);
-      })
-    .define_singleton_method(
-      "_log",
-      *[](torch::Tensor& input) {
-        return torch::log(input);
-      })
-    .define_singleton_method(
-      "_unsqueeze",
-      *[](torch::Tensor& input, int64_t dim) {
-        return torch::unsqueeze(input, dim);
-      })
-    .define_singleton_method(
-      "_dot",
-      *[](torch::Tensor& input, torch::Tensor& tensor) {
-        return torch::dot(input, tensor);
-      })
-    .define_singleton_method(
-      "_matmul",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::matmul(input, other);
-      })
-    .define_singleton_method(
-      "_eq",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::eq(input, other);
-      })
-    .define_singleton_method(
-      "_add",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::add(input, other);
-      })
-    .define_singleton_method(
-      "_add_scalar",
-      *[](torch::Tensor& input, float other) {
-        return torch::add(input, other);
-      })
-    .define_singleton_method(
-      "_add_out",
-      *[](torch::Tensor& out, torch::Tensor& input, torch::Tensor& other) {
-        return torch::add_out(out, input, other);
-      })
-    .define_singleton_method(
-      "_sub",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::sub(input, other);
-      })
-    .define_singleton_method(
-      "_sub_scalar",
-      *[](torch::Tensor& input, float other) {
-        return torch::sub(input, other);
-      })
-    .define_singleton_method(
-      "_mul",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::mul(input, other);
-      })
-    .define_singleton_method(
-      "_mul_scalar",
-      *[](torch::Tensor& input, float other) {
-        return torch::mul(input, other);
-      })
-    .define_singleton_method(
-      "_div",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::div(input, other);
-      })
-    .define_singleton_method(
-      "_div_scalar",
-      *[](torch::Tensor& input, float other) {
-        return torch::div(input, other);
-      })
-    .define_singleton_method(
-      "_remainder",
-      *[](torch::Tensor& input, torch::Tensor& other) {
-        return torch::remainder(input, other);
+      "_save",
+      *[](const Tensor &value) {
+        auto v = torch::pickle_save(value);
+        std::string str(v.begin(), v.end());
+        return str;
       })
     .define_singleton_method(
-      "_remainder_scalar",
-      *[](torch::Tensor& input, float other) {
-        return torch::remainder(input, other);
+      "_binary_cross_entropy_with_logits",
+      *[](const Tensor &input, const Tensor &target, OptionalTensor weight, OptionalTensor pos_weight, MyReduction reduction) {
+        return torch::binary_cross_entropy_with_logits(input, target, weight, pos_weight, reduction);
       })
     .define_singleton_method(
-      "_pow",
-      *[](torch::Tensor& input, Scalar exponent) {
-        return torch::pow(input, exponent);
-      })
-    .define_singleton_method(
-      "_neg",
-      *[](torch::Tensor& input) {
-        return torch::neg(input);
-      })
-    .define_singleton_method(
-      "_reshape",
-      *[](torch::Tensor& input, IntArrayRef shape) {
-        return torch::reshape(input, shape);
-      })
-    .define_singleton_method(
-      "relu",
-      *[](torch::Tensor& input) {
-        return torch::relu(input);
-      })
-    .define_singleton_method(
-      "prelu",
-      *[](torch::Tensor& input, torch::Tensor& weight) {
-        return torch::prelu(input, weight);
-      })
-    .define_singleton_method(
-      "leaky_relu",
-      *[](torch::Tensor& input, Scalar negative_slope = 0.01) {
-        return torch::leaky_relu(input, negative_slope);
-      })
-    .define_singleton_method(
-      "conv2d",
-      *[](torch::Tensor& input, torch::Tensor& weight, torch::Tensor& bias, IntArrayRef stride, IntArrayRef padding) {
-        return torch::conv2d(input, weight, bias, stride, padding);
-      })
-    .define_singleton_method(
-      "linear",
-      *[](torch::Tensor& input, torch::Tensor& weight, torch::Tensor& bias) {
-        return torch::linear(input, weight, bias);
-      })
-    .define_singleton_method(
-      "max_pool2d",
-      *[](torch::Tensor& input, IntArrayRef kernel_size) {
-        return torch::max_pool2d(input, kernel_size);
-      })
-    .define_singleton_method(
-      "avg_pool2d",
-      *[](torch::Tensor& input, IntArrayRef kernel_size) {
-        return torch::avg_pool2d(input, kernel_size);
-      })
-    .define_singleton_method(
-      "mse_loss",
-      *[](torch::Tensor& input, torch::Tensor& target, std::string reduction) {
-        auto red = reduction == "mean" ? Reduction::Mean : Reduction::Sum;
-        return torch::mse_loss(input, target, red);
-      })
-    .define_singleton_method(
-      "nll_loss",
-      *[](torch::Tensor& input, torch::Tensor& target) {
-        return torch::nll_loss(input, target);
+      "_from_blob",
+      *[](String s, IntArrayRef size, const torch::TensorOptions &options) {
+        void *data = const_cast<char *>(s.c_str());
+        return torch::from_blob(data, size, options);
       })
     .define_singleton_method(
       "_tensor",
       *[](Object o, IntArrayRef size, const torch::TensorOptions &options) {
        Array a = Array(o);
-        std::vector<float> vec;
-        for (size_t i = 0; i < a.size(); i++) {
-          vec.push_back(from_ruby<float>(a[i]));
+        auto dtype = options.dtype();
+        torch::Tensor t;
+        if (dtype == torch::kBool) {
+          throw std::runtime_error("Cannot create bool from tensor method yet");
+        } else {
+          std::vector<float> vec;
+          for (size_t i = 0; i < a.size(); i++) {
+            vec.push_back(from_ruby<float>(a[i]));
+          }
+          t = torch::tensor(vec, options);
        }
-        return torch::tensor(vec, options).reshape(size);
+        return t.reshape(size);
       });
 
-  Class rb_cTensor = define_class_under<torch::Tensor>(rb_mTorch, "Tensor")
+  rb_cTensor
     .define_method("cuda?", &torch::Tensor::is_cuda)
-    .define_method("distributed?", &torch::Tensor::is_distributed)
-    .define_method("complex?", &torch::Tensor::is_complex)
-    .define_method("floating_point?", &torch::Tensor::is_floating_point)
-    .define_method("signed?", &torch::Tensor::is_signed)
     .define_method("sparse?", &torch::Tensor::is_sparse)
     .define_method("quantized?", &torch::Tensor::is_quantized)
     .define_method("dim", &torch::Tensor::dim)
-    .define_method("numel", &torch::Tensor::numel)
     .define_method("element_size", &torch::Tensor::element_size)
     .define_method("requires_grad", &torch::Tensor::requires_grad)
     .define_method(
-      "zero!",
-      *[](torch::Tensor& self) {
-        return self.zero_();
-      })
-    .define_method(
-      "detach!",
-      *[](torch::Tensor& self) {
-        return self.detach_();
+      "addcmul!",
+      *[](Tensor& self, Scalar value, const Tensor & tensor1, const Tensor & tensor2) {
+        return self.addcmul_(tensor1, tensor2, value);
       })
     .define_method(
-      "_select",
-      *[](torch::Tensor& self, int64_t dim, int64_t index) {
-        return self.select(dim, index);
-      })
-    .define_method(
-      "_slice",
-      *[](torch::Tensor& self, int64_t dim, int64_t start, int64_t end, int64_t step) {
-        return self.slice(dim, start, end, step);
+      "addcdiv!",
+      *[](Tensor& self, Scalar value, const Tensor & tensor1, const Tensor & tensor2) {
+        return self.addcdiv_(tensor1, tensor2, value);
       })
     .define_method(
       "_requires_grad!",
-      *[](torch::Tensor& self, bool requires_grad) {
+      *[](Tensor& self, bool requires_grad) {
        return self.set_requires_grad(requires_grad);
       })
     .define_method(
       "_backward",
-      *[](torch::Tensor& self) {
-        return self.backward();
-      })
-    .define_method(
-      "_backward_gradient",
-      *[](torch::Tensor& self, const torch::Tensor& gradient) {
-        return self.backward(gradient);
+      *[](Tensor& self, Object gradient) {
+        return gradient.is_nil() ? self.backward() : self.backward(from_ruby<torch::Tensor>(gradient));
       })
     .define_method(
       "grad",
-      *[](torch::Tensor& self) {
+      *[](Tensor& self) {
        return self.grad();
       })
     .define_method(
       "_dtype",
-      *[](torch::Tensor& self) {
+      *[](Tensor& self) {
        return (int) at::typeMetaToScalarType(self.dtype());
       })
     .define_method(
       "_type",
-      *[](torch::Tensor& self, int dtype) {
+      *[](Tensor& self, int dtype) {
        return self.toType((torch::ScalarType) dtype);
       })
     .define_method(
       "_layout",
-      *[](torch::Tensor& self) {
+      *[](Tensor& self) {
        std::stringstream s;
        s << self.layout();
        return s.str();
       })
     .define_method(
       "device",
-      *[](torch::Tensor& self) {
+      *[](Tensor& self) {
        std::stringstream s;
        s << self.device();
        return s.str();
       })
     .define_method(
-      "_view",
-      *[](torch::Tensor& self, IntArrayRef size) {
-        return self.view(size);
-      })
-    .define_method(
-      "add!",
-      *[](torch::Tensor& self, torch::Tensor& other) {
-        self.add_(other);
-      })
-    .define_method(
-      "sub!",
-      *[](torch::Tensor& self, torch::Tensor& other) {
-        self.sub_(other);
-      })
-    .define_method(
-      "mul!",
-      *[](torch::Tensor& self, torch::Tensor& other) {
-        self.mul_(other);
-      })
-    .define_method(
-      "div!",
-      *[](torch::Tensor& self, torch::Tensor& other) {
-        self.div_(other);
-      })
-    .define_method(
-      "log_softmax",
-      *[](torch::Tensor& self, int64_t dim) {
-        return self.log_softmax(dim);
-      })
-    .define_method(
-      "data",
-      *[](torch::Tensor& self) {
-        return self.data();
-      })
-    .define_method(
-      "_data",
-      *[](torch::Tensor& self) {
+      "_flat_data",
+      *[](Tensor& self) {
        Array a;
        auto dtype = self.dtype();
 
@@ -532,21 +240,23 @@
            a.push(data[i]);
          }
        } else if (dtype == torch::kBool) {
-          // bool
-          throw std::runtime_error("Type not supported yet");
+          bool* data = self.data_ptr<bool>();
+          for (int i = 0; i < self.numel(); i++) {
+            a.push(data[i] ? True : False);
+          }
        } else {
          throw std::runtime_error("Unsupported type");
        }
        return a;
       })
     .define_method(
-      "_size",
-      *[](torch::Tensor& self, int i) {
-        return self.size(i);
+      "_to",
+      *[](Tensor& self, torch::Device device, int dtype, bool non_blocking, bool copy) {
+        return self.to(device, (torch::ScalarType) dtype, non_blocking, copy);
       })
     .define_singleton_method(
       "_make_subclass",
-      *[](torch::Tensor& rd, bool requires_grad) {
+      *[](Tensor& rd, bool requires_grad) {
        auto data = torch::autograd::as_variable_ref(rd).detach();
        data.unsafeGetTensorImpl()->set_allow_tensor_metadata_change(true);
        auto var = data.set_requires_grad(requires_grad);
@@ -593,30 +303,99 @@ void Init_ext()
        return self.requires_grad(requires_grad);
       });
 
-  Module rb_mNN = define_module_under(rb_mTorch, "NN");
-
   Module rb_mInit = define_module_under(rb_mNN, "Init")
     .define_singleton_method(
-      "kaiming_uniform_",
-      *[](torch::Tensor& input, double a) {
-        return torch::nn::init::kaiming_uniform_(input, a);
+      "_calculate_gain",
+      *[](NonlinearityType nonlinearity, double param) {
+        return torch::nn::init::calculate_gain(nonlinearity, param);
+      })
+    .define_singleton_method(
+      "_uniform!",
+      *[](Tensor tensor, double low, double high) {
+        return torch::nn::init::uniform_(tensor, low, high);
+      })
+    .define_singleton_method(
+      "_normal!",
+      *[](Tensor tensor, double mean, double std) {
+        return torch::nn::init::normal_(tensor, mean, std);
+      })
+    .define_singleton_method(
+      "_constant!",
+      *[](Tensor tensor, Scalar value) {
+        return torch::nn::init::constant_(tensor, value);
+      })
+    .define_singleton_method(
+      "_ones!",
+      *[](Tensor tensor) {
+        return torch::nn::init::ones_(tensor);
+      })
+    .define_singleton_method(
+      "_zeros!",
+      *[](Tensor tensor) {
+        return torch::nn::init::zeros_(tensor);
+      })
+    .define_singleton_method(
+      "_eye!",
+      *[](Tensor tensor) {
+        return torch::nn::init::eye_(tensor);
+      })
+    .define_singleton_method(
+      "_dirac!",
+      *[](Tensor tensor) {
+        return torch::nn::init::dirac_(tensor);
+      })
+    .define_singleton_method(
+      "_xavier_uniform!",
+      *[](Tensor tensor, double gain) {
+        return torch::nn::init::xavier_uniform_(tensor, gain);
+      })
+    .define_singleton_method(
+      "_xavier_normal!",
+      *[](Tensor tensor, double gain) {
+        return torch::nn::init::xavier_normal_(tensor, gain);
+      })
+    .define_singleton_method(
+      "_kaiming_uniform!",
+      *[](Tensor tensor, double a, FanModeType mode, NonlinearityType nonlinearity) {
+        return torch::nn::init::kaiming_uniform_(tensor, a, mode, nonlinearity);
+      })
+    .define_singleton_method(
+      "_kaiming_normal!",
+      *[](Tensor tensor, double a, FanModeType mode, NonlinearityType nonlinearity) {
+        return torch::nn::init::kaiming_normal_(tensor, a, mode, nonlinearity);
+      })
+    .define_singleton_method(
+      "_orthogonal!",
+      *[](Tensor tensor, double gain) {
+        return torch::nn::init::orthogonal_(tensor, gain);
       })
     .define_singleton_method(
-      "uniform_",
-      *[](torch::Tensor& input, double to, double from) {
-        return torch::nn::init::uniform_(input, to, from);
+      "_sparse!",
+      *[](Tensor tensor, double sparsity, double std) {
+        return torch::nn::init::sparse_(tensor, sparsity, std);
       });
 
   Class rb_cParameter = define_class_under<torch::autograd::Variable, torch::Tensor>(rb_mNN, "Parameter")
-    // TODO return grad or nil to remove need for 2nd function
     .define_method(
-      "_grad",
+      "grad",
       *[](torch::autograd::Variable& self) {
-        return self.grad();
-      })
+        auto grad = self.grad();
+        return grad.defined() ? to_ruby<torch::Tensor>(grad) : Nil;
+      });
+
+  Class rb_cDevice = define_class_under<torch::Device>(rb_mTorch, "Device")
+    .define_constructor(Constructor<torch::Device, std::string>())
+    .define_method("index", &torch::Device::index)
+    .define_method("index?", &torch::Device::has_index)
     .define_method(
-      "_grad_defined",
-      *[](torch::autograd::Variable& self) {
-        return self.grad().defined();
+      "type",
+      *[](torch::Device& self) {
+        std::stringstream s;
+        s << self.type();
+        return s.str();
       });
+
+  Module rb_mCUDA = define_module_under(rb_mTorch, "CUDA")
+    .define_singleton_method("available?", &torch::cuda::is_available)
+    .define_singleton_method("device_count", &torch::cuda::device_count);
 }
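The final hunk registers `Torch::Device` and `Torch::CUDA`. Based on the bindings above, the Ruby-side surface looks roughly like this (a sketch; return values depend on the machine and LibTorch build):

```ruby
require "torch"

# Pick CUDA when LibTorch reports a GPU, otherwise fall back to the CPU.
device = Torch::Device.new(Torch::CUDA.available? ? "cuda" : "cpu")
device.type               # => "cuda" or "cpu"
device.index?             # => true only if an index like "cuda:0" was given
Torch::CUDA.device_count  # => number of visible GPUs (0 on a CPU-only build)
```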