pnmatrix 1.2.4

Sign up to get free protection for your applications and to get access to all the features.
Files changed (111) hide show
  1. checksums.yaml +7 -0
  2. data/ext/nmatrix/binary_format.txt +53 -0
  3. data/ext/nmatrix/data/complex.h +388 -0
  4. data/ext/nmatrix/data/data.cpp +274 -0
  5. data/ext/nmatrix/data/data.h +651 -0
  6. data/ext/nmatrix/data/meta.h +64 -0
  7. data/ext/nmatrix/data/ruby_object.h +386 -0
  8. data/ext/nmatrix/extconf.rb +70 -0
  9. data/ext/nmatrix/math/asum.h +99 -0
  10. data/ext/nmatrix/math/cblas_enums.h +36 -0
  11. data/ext/nmatrix/math/cblas_templates_core.h +507 -0
  12. data/ext/nmatrix/math/gemm.h +241 -0
  13. data/ext/nmatrix/math/gemv.h +178 -0
  14. data/ext/nmatrix/math/getrf.h +255 -0
  15. data/ext/nmatrix/math/getrs.h +121 -0
  16. data/ext/nmatrix/math/imax.h +82 -0
  17. data/ext/nmatrix/math/laswp.h +165 -0
  18. data/ext/nmatrix/math/long_dtype.h +62 -0
  19. data/ext/nmatrix/math/magnitude.h +54 -0
  20. data/ext/nmatrix/math/math.h +751 -0
  21. data/ext/nmatrix/math/nrm2.h +165 -0
  22. data/ext/nmatrix/math/rot.h +117 -0
  23. data/ext/nmatrix/math/rotg.h +106 -0
  24. data/ext/nmatrix/math/scal.h +71 -0
  25. data/ext/nmatrix/math/trsm.h +336 -0
  26. data/ext/nmatrix/math/util.h +162 -0
  27. data/ext/nmatrix/math.cpp +1368 -0
  28. data/ext/nmatrix/nm_memory.h +60 -0
  29. data/ext/nmatrix/nmatrix.cpp +285 -0
  30. data/ext/nmatrix/nmatrix.h +476 -0
  31. data/ext/nmatrix/ruby_constants.cpp +151 -0
  32. data/ext/nmatrix/ruby_constants.h +106 -0
  33. data/ext/nmatrix/ruby_nmatrix.c +3130 -0
  34. data/ext/nmatrix/storage/common.cpp +77 -0
  35. data/ext/nmatrix/storage/common.h +183 -0
  36. data/ext/nmatrix/storage/dense/dense.cpp +1096 -0
  37. data/ext/nmatrix/storage/dense/dense.h +129 -0
  38. data/ext/nmatrix/storage/list/list.cpp +1628 -0
  39. data/ext/nmatrix/storage/list/list.h +138 -0
  40. data/ext/nmatrix/storage/storage.cpp +730 -0
  41. data/ext/nmatrix/storage/storage.h +99 -0
  42. data/ext/nmatrix/storage/yale/class.h +1139 -0
  43. data/ext/nmatrix/storage/yale/iterators/base.h +143 -0
  44. data/ext/nmatrix/storage/yale/iterators/iterator.h +131 -0
  45. data/ext/nmatrix/storage/yale/iterators/row.h +450 -0
  46. data/ext/nmatrix/storage/yale/iterators/row_stored.h +140 -0
  47. data/ext/nmatrix/storage/yale/iterators/row_stored_nd.h +169 -0
  48. data/ext/nmatrix/storage/yale/iterators/stored_diagonal.h +124 -0
  49. data/ext/nmatrix/storage/yale/math/transpose.h +110 -0
  50. data/ext/nmatrix/storage/yale/yale.cpp +2074 -0
  51. data/ext/nmatrix/storage/yale/yale.h +203 -0
  52. data/ext/nmatrix/types.h +55 -0
  53. data/ext/nmatrix/util/io.cpp +279 -0
  54. data/ext/nmatrix/util/io.h +115 -0
  55. data/ext/nmatrix/util/sl_list.cpp +627 -0
  56. data/ext/nmatrix/util/sl_list.h +144 -0
  57. data/ext/nmatrix/util/util.h +78 -0
  58. data/lib/nmatrix/blas.rb +378 -0
  59. data/lib/nmatrix/cruby/math.rb +744 -0
  60. data/lib/nmatrix/enumerate.rb +253 -0
  61. data/lib/nmatrix/homogeneous.rb +241 -0
  62. data/lib/nmatrix/io/fortran_format.rb +138 -0
  63. data/lib/nmatrix/io/harwell_boeing.rb +221 -0
  64. data/lib/nmatrix/io/market.rb +263 -0
  65. data/lib/nmatrix/io/point_cloud.rb +189 -0
  66. data/lib/nmatrix/jruby/decomposition.rb +24 -0
  67. data/lib/nmatrix/jruby/enumerable.rb +13 -0
  68. data/lib/nmatrix/jruby/error.rb +4 -0
  69. data/lib/nmatrix/jruby/math.rb +501 -0
  70. data/lib/nmatrix/jruby/nmatrix_java.rb +840 -0
  71. data/lib/nmatrix/jruby/operators.rb +283 -0
  72. data/lib/nmatrix/jruby/slice.rb +264 -0
  73. data/lib/nmatrix/lapack_core.rb +181 -0
  74. data/lib/nmatrix/lapack_plugin.rb +44 -0
  75. data/lib/nmatrix/math.rb +953 -0
  76. data/lib/nmatrix/mkmf.rb +100 -0
  77. data/lib/nmatrix/monkeys.rb +137 -0
  78. data/lib/nmatrix/nmatrix.rb +1172 -0
  79. data/lib/nmatrix/rspec.rb +75 -0
  80. data/lib/nmatrix/shortcuts.rb +1163 -0
  81. data/lib/nmatrix/version.rb +39 -0
  82. data/lib/nmatrix/yale_functions.rb +118 -0
  83. data/lib/nmatrix.rb +28 -0
  84. data/spec/00_nmatrix_spec.rb +892 -0
  85. data/spec/01_enum_spec.rb +196 -0
  86. data/spec/02_slice_spec.rb +407 -0
  87. data/spec/03_nmatrix_monkeys_spec.rb +80 -0
  88. data/spec/2x2_dense_double.mat +0 -0
  89. data/spec/4x4_sparse.mat +0 -0
  90. data/spec/4x5_dense.mat +0 -0
  91. data/spec/blas_spec.rb +215 -0
  92. data/spec/elementwise_spec.rb +311 -0
  93. data/spec/homogeneous_spec.rb +100 -0
  94. data/spec/io/fortran_format_spec.rb +88 -0
  95. data/spec/io/harwell_boeing_spec.rb +98 -0
  96. data/spec/io/test.rua +9 -0
  97. data/spec/io_spec.rb +159 -0
  98. data/spec/lapack_core_spec.rb +482 -0
  99. data/spec/leakcheck.rb +16 -0
  100. data/spec/math_spec.rb +1363 -0
  101. data/spec/nmatrix_yale_resize_test_associations.yaml +2802 -0
  102. data/spec/nmatrix_yale_spec.rb +286 -0
  103. data/spec/rspec_monkeys.rb +56 -0
  104. data/spec/rspec_spec.rb +35 -0
  105. data/spec/shortcuts_spec.rb +474 -0
  106. data/spec/slice_set_spec.rb +162 -0
  107. data/spec/spec_helper.rb +172 -0
  108. data/spec/stat_spec.rb +214 -0
  109. data/spec/test.pcd +20 -0
  110. data/spec/utm5940.mtx +83844 -0
  111. metadata +295 -0
@@ -0,0 +1,3130 @@
1
+ /////////////////////////////////////////////////////////////////////
2
+ // = NMatrix
3
+ //
4
+ // A linear algebra library for scientific computation in Ruby.
5
+ // NMatrix is part of SciRuby.
6
+ //
7
+ // NMatrix was originally inspired by and derived from NArray, by
8
+ // Masahiro Tanaka: http://narray.rubyforge.org
9
+ //
10
+ // == Copyright Information
11
+ //
12
+ // SciRuby is Copyright (c) 2010 - 2014, Ruby Science Foundation
13
+ // NMatrix is Copyright (c) 2012 - 2014, John Woods and the Ruby Science Foundation
14
+ //
15
+ // Please see LICENSE.txt for additional copyright notices.
16
+ //
17
+ // == Contributing
18
+ //
19
+ // By contributing source code to SciRuby, you agree to be bound by
20
+ // our Contributor Agreement:
21
+ //
22
+ // * https://github.com/SciRuby/sciruby/wiki/Contributor-Agreement
23
+ //
24
+ // == ruby_nmatrix.c
25
+ //
26
+ // Ruby-facing NMatrix C functions. Not compiled directly -- included
27
+ // into nmatrix.cpp.
28
+ //
29
+
30
/*
 * Forward Declarations
 */

// Construction, I/O, and basic attribute accessors.
static VALUE nm_init(int argc, VALUE* argv, VALUE nm);
static VALUE nm_init_copy(VALUE copy, VALUE original);
static VALUE nm_init_transposed(VALUE self);
static VALUE nm_read(int argc, VALUE* argv, VALUE self);
static VALUE nm_write(int argc, VALUE* argv, VALUE self);
static VALUE nm_init_yale_from_old_yale(VALUE shape, VALUE dtype, VALUE ia, VALUE ja, VALUE a, VALUE from_dtype, VALUE nm);
static VALUE nm_alloc(VALUE klass);
static VALUE nm_dtype(VALUE self);
static VALUE nm_stype(VALUE self);
static VALUE nm_default_value(VALUE self);
static size_t effective_dim(STORAGE* s);
static VALUE nm_effective_dim(VALUE self);
static VALUE nm_dim(VALUE self);
static VALUE nm_offset(VALUE self);
static VALUE nm_shape(VALUE self);
static VALUE nm_supershape(VALUE self);
static VALUE nm_capacity(VALUE self);

// Iteration entry points (dispatch to storage-specific implementations).
static VALUE nm_each_with_indices(VALUE nmatrix);
static VALUE nm_each_stored_with_indices(VALUE nmatrix);
static VALUE nm_each_ordered_stored_with_indices(VALUE nmatrix);
static VALUE nm_map_stored(VALUE nmatrix);

// Slicing and element access.
static void init_slice_no_alloc(SLICE* slice, size_t dim, int argc, VALUE* arg, size_t* shape);
static VALUE nm_xslice(int argc, VALUE* argv, void* (*slice_func)(const STORAGE*, SLICE*), void (*delete_func)(NMATRIX*), VALUE self);
static VALUE nm_mset(int argc, VALUE* argv, VALUE self);
static VALUE nm_mget(int argc, VALUE* argv, VALUE self);
static VALUE nm_mref(int argc, VALUE* argv, VALUE self);
static VALUE nm_is_ref(VALUE self);

// Shared implementation for symmetric?/hermitian?.
static VALUE is_symmetric(VALUE self, bool hermitian);

static VALUE nm_guess_dtype(VALUE self, VALUE v);
static VALUE nm_min_dtype(VALUE self, VALUE v);

static VALUE nm_data_pointer(VALUE self);

/*
 * Macro defines an element-wise accessor function for some operation.
 *
 * This is only responsible for the Ruby accessor! You still have to write the actual functions, obviously.
 */
#define DEF_ELEMENTWISE_RUBY_ACCESSOR(oper, name)                   \
static VALUE nm_ew_##name(VALUE left_val, VALUE right_val) {        \
  return elementwise_op(nm::EW_##oper, left_val, right_val);        \
}

#define DEF_UNARY_RUBY_ACCESSOR(oper, name)                         \
static VALUE nm_unary_##name(VALUE self) {                          \
  return unary_op(nm::UNARY_##oper, self);                          \
}

// Non-commutative ops take an optional second argument (the order flip flag)
// so that Ruby coercion can swap operand order.
#define DEF_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(oper, name)                            \
static VALUE nm_noncom_ew_##name(int argc, VALUE* argv, VALUE self) {               \
  if (argc > 1) {                                                                   \
    return noncom_elementwise_op(nm::NONCOM_EW_##oper, self, argv[0], argv[1]);     \
  } else {                                                                          \
    return noncom_elementwise_op(nm::NONCOM_EW_##oper, self, argv[0], Qfalse);      \
  }                                                                                 \
}


/*
 * Macro declares a corresponding accessor function prototype for some element-wise operation.
 */
#define DECL_ELEMENTWISE_RUBY_ACCESSOR(name) static VALUE nm_ew_##name(VALUE left_val, VALUE right_val);
#define DECL_UNARY_RUBY_ACCESSOR(name) static VALUE nm_unary_##name(VALUE self);
#define DECL_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(name) static VALUE nm_noncom_ew_##name(int argc, VALUE* argv, VALUE self);

DECL_ELEMENTWISE_RUBY_ACCESSOR(add)
DECL_ELEMENTWISE_RUBY_ACCESSOR(subtract)
DECL_ELEMENTWISE_RUBY_ACCESSOR(multiply)
DECL_ELEMENTWISE_RUBY_ACCESSOR(divide)
DECL_ELEMENTWISE_RUBY_ACCESSOR(power)
DECL_ELEMENTWISE_RUBY_ACCESSOR(mod)
DECL_ELEMENTWISE_RUBY_ACCESSOR(eqeq)
DECL_ELEMENTWISE_RUBY_ACCESSOR(neq)
DECL_ELEMENTWISE_RUBY_ACCESSOR(lt)
DECL_ELEMENTWISE_RUBY_ACCESSOR(gt)
DECL_ELEMENTWISE_RUBY_ACCESSOR(leq)
DECL_ELEMENTWISE_RUBY_ACCESSOR(geq)
DECL_UNARY_RUBY_ACCESSOR(sin)
DECL_UNARY_RUBY_ACCESSOR(cos)
DECL_UNARY_RUBY_ACCESSOR(tan)
DECL_UNARY_RUBY_ACCESSOR(asin)
DECL_UNARY_RUBY_ACCESSOR(acos)
DECL_UNARY_RUBY_ACCESSOR(atan)
DECL_UNARY_RUBY_ACCESSOR(sinh)
DECL_UNARY_RUBY_ACCESSOR(cosh)
DECL_UNARY_RUBY_ACCESSOR(tanh)
DECL_UNARY_RUBY_ACCESSOR(asinh)
DECL_UNARY_RUBY_ACCESSOR(acosh)
DECL_UNARY_RUBY_ACCESSOR(atanh)
DECL_UNARY_RUBY_ACCESSOR(exp)
DECL_UNARY_RUBY_ACCESSOR(log2)
DECL_UNARY_RUBY_ACCESSOR(log10)
DECL_UNARY_RUBY_ACCESSOR(sqrt)
DECL_UNARY_RUBY_ACCESSOR(erf)
DECL_UNARY_RUBY_ACCESSOR(erfc)
DECL_UNARY_RUBY_ACCESSOR(cbrt)
DECL_UNARY_RUBY_ACCESSOR(gamma)
DECL_UNARY_RUBY_ACCESSOR(negate)
DECL_UNARY_RUBY_ACCESSOR(floor)
DECL_UNARY_RUBY_ACCESSOR(ceil)
DECL_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(atan2)
DECL_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(ldexp)
DECL_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(hypot)

//log/round can be unary, but also take a base argument, as with Math.log
static VALUE nm_unary_log(int argc, VALUE* argv, VALUE self);
static VALUE nm_unary_round(int argc, VALUE* argv, VALUE self);

// Shared back-ends the accessor macros dispatch to.
static VALUE elementwise_op(nm::ewop_t op, VALUE left_val, VALUE right_val);
static VALUE unary_op(nm::unaryop_t op, VALUE self);
static VALUE noncom_elementwise_op(nm::noncom_ewop_t op, VALUE self, VALUE other, VALUE orderflip);

static VALUE nm_symmetric(VALUE self);
static VALUE nm_hermitian(VALUE self);

static VALUE nm_eqeq(VALUE left, VALUE right);

// Matrix math.
static VALUE matrix_multiply_scalar(NMATRIX* left, VALUE scalar);
static VALUE matrix_multiply(NMATRIX* left, NMATRIX* right);
static VALUE nm_multiply(VALUE left_v, VALUE right_v);
static VALUE nm_det_exact(VALUE self);
static VALUE nm_hessenberg(VALUE self, VALUE a);
static VALUE nm_inverse(VALUE self, VALUE inverse, VALUE bang);
static VALUE nm_inverse_exact(VALUE self, VALUE inverse, VALUE lda, VALUE ldb);
static VALUE nm_complex_conjugate_bang(VALUE self);
static VALUE nm_reshape_bang(VALUE self, VALUE arg);

// Helpers that translate Ruby argument values into C-side descriptors.
static nm::dtype_t interpret_dtype(int argc, VALUE* argv, nm::stype_t stype);
static void* interpret_initial_value(VALUE arg, nm::dtype_t dtype);
static size_t* interpret_shape(VALUE arg, size_t* dim);
static nm::stype_t interpret_stype(VALUE arg);

/* Singleton methods */
static VALUE nm_upcast(VALUE self, VALUE t1, VALUE t2);


#ifdef BENCHMARK
static double get_time(void);
#endif
176
+
177
+ ///////////////////
178
+ // Ruby Bindings //
179
+ ///////////////////
180
+
181
/*
 * Extension entry point: defines the NMatrix class, its exception classes,
 * and every Ruby-visible method, then initializes the sub-modules
 * (constants, Yale functions, BLAS, IO, data constructors).
 */
void Init_nmatrix() {


  ///////////////////////
  // Class Definitions //
  ///////////////////////

  cNMatrix = rb_define_class("NMatrix", rb_cObject);

  // Special exceptions

  /*
   * Exception raised when there's a problem with data.
   */
  nm_eDataTypeError = rb_define_class("DataTypeError", rb_eStandardError);

  /*
   * Exception raised when something goes wrong with the storage of a matrix.
   */
  nm_eStorageTypeError = rb_define_class("StorageTypeError", rb_eStandardError);

  /*
   * Exception raised when the matrix shape is not appropriate for a given operation.
   */
  nm_eShapeError = rb_define_class("ShapeError", rb_eStandardError);

  /*
   * Exception raised when an inverse is requested but the matrix is not invertible.
   */
  nm_eNotInvertibleError = rb_define_class("NotInvertibleError", rb_eStandardError);

  /*
   * :nodoc:
   * Class that holds values in use by the C code.
   */
  cNMatrix_GC_holder = rb_define_class("NMGCHolder", rb_cObject);


  ///////////////////
  // Class Methods //
  ///////////////////

  rb_define_alloc_func(cNMatrix, nm_alloc);

  ///////////////////////
  // Singleton Methods //
  ///////////////////////

  rb_define_singleton_method(cNMatrix, "upcast", (METHOD)nm_upcast, 2); /* in ext/nmatrix/nmatrix.cpp */
  rb_define_singleton_method(cNMatrix, "guess_dtype", (METHOD)nm_guess_dtype, 1);
  rb_define_singleton_method(cNMatrix, "min_dtype", (METHOD)nm_min_dtype, 1);

  //////////////////////
  // Instance Methods //
  //////////////////////

  rb_define_method(cNMatrix, "initialize", (METHOD)nm_init, -1);
  rb_define_method(cNMatrix, "initialize_copy", (METHOD)nm_init_copy, 1);
  rb_define_singleton_method(cNMatrix, "read", (METHOD)nm_read, -1);

  rb_define_method(cNMatrix, "write", (METHOD)nm_write, -1);

  // Technically, the following function is a copy constructor.
  rb_define_protected_method(cNMatrix, "clone_transpose", (METHOD)nm_init_transposed, 0);

  rb_define_method(cNMatrix, "dtype", (METHOD)nm_dtype, 0);
  rb_define_method(cNMatrix, "stype", (METHOD)nm_stype, 0);
  rb_define_method(cNMatrix, "cast_full", (METHOD)nm_cast, 3);
  rb_define_method(cNMatrix, "default_value", (METHOD)nm_default_value, 0);
  rb_define_protected_method(cNMatrix, "__list_default_value__", (METHOD)nm_list_default_value, 0);
  rb_define_protected_method(cNMatrix, "__yale_default_value__", (METHOD)nm_yale_default_value, 0);

  rb_define_method(cNMatrix, "[]", (METHOD)nm_mref, -1);
  rb_define_method(cNMatrix, "slice", (METHOD)nm_mget, -1);
  rb_define_method(cNMatrix, "[]=", (METHOD)nm_mset, -1);
  rb_define_method(cNMatrix, "is_ref?", (METHOD)nm_is_ref, 0);
  rb_define_method(cNMatrix, "dimensions", (METHOD)nm_dim, 0);
  rb_define_method(cNMatrix, "effective_dimensions", (METHOD)nm_effective_dim, 0);

  rb_define_protected_method(cNMatrix, "__list_to_hash__", (METHOD)nm_to_hash, 0); // handles list and dense, which are n-dimensional

  rb_define_method(cNMatrix, "shape", (METHOD)nm_shape, 0);
  rb_define_method(cNMatrix, "supershape", (METHOD)nm_supershape, 0);
  rb_define_method(cNMatrix, "offset", (METHOD)nm_offset, 0);
  rb_define_method(cNMatrix, "det_exact", (METHOD)nm_det_exact, 0);
  rb_define_method(cNMatrix, "complex_conjugate!", (METHOD)nm_complex_conjugate_bang, 0);

  rb_define_protected_method(cNMatrix, "reshape_bang", (METHOD)nm_reshape_bang, 1);

  // Iterators public methods
  rb_define_method(cNMatrix, "each_with_indices", (METHOD)nm_each_with_indices, 0);
  rb_define_method(cNMatrix, "each_stored_with_indices", (METHOD)nm_each_stored_with_indices, 0);
  rb_define_method(cNMatrix, "map_stored", (METHOD)nm_map_stored, 0);
  rb_define_method(cNMatrix, "each_ordered_stored_with_indices", (METHOD)nm_each_ordered_stored_with_indices, 0);

  // Iterators protected methods
  rb_define_protected_method(cNMatrix, "__dense_each__", (METHOD)nm_dense_each, 0);
  rb_define_protected_method(cNMatrix, "__dense_map__", (METHOD)nm_dense_map, 0);
  rb_define_protected_method(cNMatrix, "__dense_map_pair__", (METHOD)nm_dense_map_pair, 1);
  rb_define_protected_method(cNMatrix, "__list_map_merged_stored__", (METHOD)nm_list_map_merged_stored, 2);
  rb_define_protected_method(cNMatrix, "__list_map_stored__", (METHOD)nm_list_map_stored, 1);
  rb_define_protected_method(cNMatrix, "__yale_map_merged_stored__", (METHOD)nm_yale_map_merged_stored, 2);
  rb_define_protected_method(cNMatrix, "__yale_map_stored__", (METHOD)nm_yale_map_stored, 0);
  rb_define_protected_method(cNMatrix, "__yale_stored_diagonal_each_with_indices__", (METHOD)nm_yale_stored_diagonal_each_with_indices, 0);
  rb_define_protected_method(cNMatrix, "__yale_stored_nondiagonal_each_with_indices__", (METHOD)nm_yale_stored_nondiagonal_each_with_indices, 0);

  rb_define_method(cNMatrix, "==", (METHOD)nm_eqeq, 1);

  // Element-wise binary operators (defined via the accessor macros above).
  rb_define_method(cNMatrix, "+", (METHOD)nm_ew_add, 1);
  rb_define_method(cNMatrix, "-", (METHOD)nm_ew_subtract, 1);
  rb_define_method(cNMatrix, "*", (METHOD)nm_ew_multiply, 1);
  rb_define_method(cNMatrix, "/", (METHOD)nm_ew_divide, 1);
  rb_define_method(cNMatrix, "**", (METHOD)nm_ew_power, 1);
  rb_define_method(cNMatrix, "%", (METHOD)nm_ew_mod, 1);

  // Non-commutative element-wise ops; -1 arity allows the order-flip argument.
  rb_define_method(cNMatrix, "atan2", (METHOD)nm_noncom_ew_atan2, -1);
  rb_define_method(cNMatrix, "ldexp", (METHOD)nm_noncom_ew_ldexp, -1);
  rb_define_method(cNMatrix, "hypot", (METHOD)nm_noncom_ew_hypot, -1);

  // Unary math methods.
  rb_define_method(cNMatrix, "sin", (METHOD)nm_unary_sin, 0);
  rb_define_method(cNMatrix, "cos", (METHOD)nm_unary_cos, 0);
  rb_define_method(cNMatrix, "tan", (METHOD)nm_unary_tan, 0);
  rb_define_method(cNMatrix, "asin", (METHOD)nm_unary_asin, 0);
  rb_define_method(cNMatrix, "acos", (METHOD)nm_unary_acos, 0);
  rb_define_method(cNMatrix, "atan", (METHOD)nm_unary_atan, 0);
  rb_define_method(cNMatrix, "sinh", (METHOD)nm_unary_sinh, 0);
  rb_define_method(cNMatrix, "cosh", (METHOD)nm_unary_cosh, 0);
  rb_define_method(cNMatrix, "tanh", (METHOD)nm_unary_tanh, 0);
  rb_define_method(cNMatrix, "asinh", (METHOD)nm_unary_asinh, 0);
  rb_define_method(cNMatrix, "acosh", (METHOD)nm_unary_acosh, 0);
  rb_define_method(cNMatrix, "atanh", (METHOD)nm_unary_atanh, 0);
  rb_define_method(cNMatrix, "exp", (METHOD)nm_unary_exp, 0);
  rb_define_method(cNMatrix, "log2", (METHOD)nm_unary_log2, 0);
  rb_define_method(cNMatrix, "log10", (METHOD)nm_unary_log10, 0);
  rb_define_method(cNMatrix, "sqrt", (METHOD)nm_unary_sqrt, 0);
  rb_define_method(cNMatrix, "erf", (METHOD)nm_unary_erf, 0);
  rb_define_method(cNMatrix, "erfc", (METHOD)nm_unary_erfc, 0);
  rb_define_method(cNMatrix, "cbrt", (METHOD)nm_unary_cbrt, 0);
  rb_define_method(cNMatrix, "gamma", (METHOD)nm_unary_gamma, 0);
  rb_define_method(cNMatrix, "log", (METHOD)nm_unary_log, -1);     // optional base argument
  rb_define_method(cNMatrix, "-@", (METHOD)nm_unary_negate, 0);
  rb_define_method(cNMatrix, "floor", (METHOD)nm_unary_floor, 0);
  rb_define_method(cNMatrix, "ceil", (METHOD)nm_unary_ceil, 0);
  rb_define_method(cNMatrix, "round", (METHOD)nm_unary_round, -1); // optional digits argument


  // Element-wise comparisons (return matrices, hence =~ rather than ==).
  rb_define_method(cNMatrix, "=~", (METHOD)nm_ew_eqeq, 1);
  rb_define_method(cNMatrix, "!~", (METHOD)nm_ew_neq, 1);
  rb_define_method(cNMatrix, "<=", (METHOD)nm_ew_leq, 1);
  rb_define_method(cNMatrix, ">=", (METHOD)nm_ew_geq, 1);
  rb_define_method(cNMatrix, "<", (METHOD)nm_ew_lt, 1);
  rb_define_method(cNMatrix, ">", (METHOD)nm_ew_gt, 1);

  /////////////////////////////
  // Helper Instance Methods //
  /////////////////////////////
  rb_define_protected_method(cNMatrix, "__yale_vector_set__", (METHOD)nm_vector_set, -1);

  /////////////////////////
  // Matrix Math Methods //
  /////////////////////////
  rb_define_method(cNMatrix, "dot", (METHOD)nm_multiply, 1);
  rb_define_method(cNMatrix, "symmetric?", (METHOD)nm_symmetric, 0);
  rb_define_method(cNMatrix, "hermitian?", (METHOD)nm_hermitian, 0);
  rb_define_method(cNMatrix, "capacity", (METHOD)nm_capacity, 0);

  // protected methods
  rb_define_protected_method(cNMatrix, "__inverse__", (METHOD)nm_inverse, 2);
  rb_define_protected_method(cNMatrix, "__inverse_exact__", (METHOD)nm_inverse_exact, 3);

  // private methods
  rb_define_private_method(cNMatrix, "__hessenberg__", (METHOD)nm_hessenberg, 1);

  /////////////////
  // FFI Methods //
  /////////////////
  rb_define_method(cNMatrix, "data_pointer", (METHOD)nm_data_pointer, 0);

  /////////////
  // Aliases //
  /////////////

  rb_define_alias(cNMatrix, "dim", "dimensions");
  rb_define_alias(cNMatrix, "effective_dim", "effective_dimensions");
  rb_define_alias(cNMatrix, "equal?", "eql?");

  ////////////
  //Epsilons//
  ////////////
  rb_define_const(cNMatrix, "FLOAT64_EPSILON", rb_const_get(rb_cFloat, rb_intern("EPSILON")));
  rb_define_const(cNMatrix, "FLOAT32_EPSILON", DBL2NUM(FLT_EPSILON));

  ///////////////////////
  // Symbol Generation //
  ///////////////////////

  nm_init_ruby_constants();

  //////////////////////////
  // YaleFunctions module //
  //////////////////////////

  nm_init_yale_functions();

  /////////////////
  // BLAS module //
  /////////////////

  nm_math_init_blas();

  ///////////////
  // IO module //
  ///////////////
  nm_init_io();

  /////////////////////////////////////////////////
  // Force compilation of necessary constructors //
  /////////////////////////////////////////////////
  nm_init_data();
}
401
+
402
+
403
+ //////////////////
404
+ // Ruby Methods //
405
+ //////////////////
406
+
407
+ /*
408
+ * Allocator.
409
+ */
410
+ static VALUE nm_alloc(VALUE klass) {
411
+ NMATRIX* mat = NM_ALLOC(NMATRIX);
412
+ mat->storage = NULL;
413
+
414
+ // DO NOT MARK This STRUCT. It has no storage allocated, and no stype, so mark will do an invalid something.
415
+ return Data_Wrap_Struct(klass, NULL, nm_delete, mat);
416
+ }
417
+
418
/*
 * Find the capacity of an NMatrix. The capacity only differs from the size for
 * Yale matrices, which occasionally allocate more space than they need. For
 * list and dense, capacity gives the number of elements in the matrix.
 *
 * If you call this on a slice, it may behave unpredictably. Most likely it'll
 * just return the original matrix's capacity.
 */
static VALUE nm_capacity(VALUE self) {
  // Keep self visible to the GC while the storage helpers may allocate.
  NM_CONSERVATIVE(nm_register_value(&self));
  VALUE cap;

  switch(NM_STYPE(self)) {
  case nm::YALE_STORE:
    // Yale: report the capacity of the underlying (source) storage.
    cap = UINT2NUM(reinterpret_cast<YALE_STORAGE*>(NM_STORAGE_YALE(self)->src)->capacity);
    break;

  case nm::DENSE_STORE:
    cap = UINT2NUM(nm_storage_count_max_elements( NM_STORAGE_DENSE(self) ));
    break;

  case nm::LIST_STORE:
    cap = UINT2NUM(nm_list_storage_count_elements( NM_STORAGE_LIST(self) ));
    break;

  default:
    // Must unregister before raising: rb_raise does not return.
    NM_CONSERVATIVE(nm_unregister_value(&self));
    rb_raise(nm_eStorageTypeError, "unrecognized stype in nm_capacity()");
  }

  NM_CONSERVATIVE(nm_unregister_value(&self));
  return cap;
}
451
+
452
+
453
/*
 * Mark function. Dispatches to the storage-type-specific mark routine so
 * that Ruby objects held inside the storage survive GC.
 */
void nm_mark(NMATRIX* mat) {
  STYPE_MARK_TABLE(mark)          // declares `mark`, a per-stype function table
  mark[mat->stype](mat->storage); // dispatch on the matrix's storage type
}
460
+
461
+
462
/*
 * Destructor. Frees the storage (via the stype-specific deleter) and then
 * the NMATRIX struct itself.
 */
void nm_delete(NMATRIX* mat) {
  // Indexed by mat->stype, so entry order must match the nm::stype_t enum.
  static void (*ttable[nm::NUM_STYPES])(STORAGE*) = {
    nm_dense_storage_delete,
    nm_list_storage_delete,
    nm_yale_storage_delete
  };
  ttable[mat->stype](mat->storage);

  NM_FREE(mat);
}
475
+
476
/*
 * Slicing destructor. Like nm_delete, but uses the *_delete_ref variants,
 * which free a slice/reference without destroying the shared source storage.
 */
void nm_delete_ref(NMATRIX* mat) {
  // Indexed by mat->stype, so entry order must match the nm::stype_t enum.
  static void (*ttable[nm::NUM_STYPES])(STORAGE*) = {
    nm_dense_storage_delete_ref,
    nm_list_storage_delete_ref,
    nm_yale_storage_delete_ref
  };
  ttable[mat->stype](mat->storage);

  NM_FREE(mat);
}
489
+
490
+
491
/**
 * These variables hold a linked list of VALUEs that are registered to be in
 * use by nmatrix so that they can be marked when GC runs.
 */
static VALUE* gc_value_holder = NULL;                // heap-allocated VALUE wrapping gc_value_holder_struct; pinned via rb_global_variable
static NM_GC_HOLDER* gc_value_holder_struct = NULL;  // head of the list of live registrations
static NM_GC_HOLDER* allocated_pool = NULL; // an object pool for linked list nodes; using pooling is in some cases a substantial performance improvement
498
+
499
/**
 * GC Marking function for the values that have been registered.
 *
 * Note: the parameter deliberately shadows the file-level static of the same
 * name; Ruby passes the wrapped struct back to this callback.
 */
static void __nm_mark_value_container(NM_GC_HOLDER* gc_value_holder_struct) {
  if (gc_value_holder_struct && gc_value_holder_struct->start) {
    NM_GC_LL_NODE* curr = gc_value_holder_struct->start;
    // Mark every registered array [val, val + n).
    while (curr) {
      rb_gc_mark_locations(curr->val, curr->val + curr->n);
      curr = curr->next;
    }
  }
}
511
+
512
/**
 * Initializes the linked list of in-use VALUEs if it hasn't been done
 * already.
 */
static void __nm_initialize_value_container() {
  if (gc_value_holder == NULL) {
    // NONRUBY allocations: these structures must not themselves be managed
    // by Ruby's GC.
    gc_value_holder_struct = NM_ALLOC_NONRUBY(NM_GC_HOLDER);
    allocated_pool = NM_ALLOC_NONRUBY(NM_GC_HOLDER);
    gc_value_holder = NM_ALLOC_NONRUBY(VALUE);
    gc_value_holder_struct->start = NULL;
    allocated_pool->start = NULL;
    // Wrap the list in a Ruby object whose mark function walks it...
    *gc_value_holder = Data_Wrap_Struct(cNMatrix_GC_holder, __nm_mark_value_container, NULL, gc_value_holder_struct);
    // ...and pin that object so it is never collected.
    rb_global_variable(gc_value_holder);
  }
}
527
+
528
/*
 * Register an array of VALUEs to avoid their collection
 * while using them internally.
 */
void nm_register_values(VALUE* values, size_t n) {
  // Lazily create the GC holder on first use.
  if (!gc_value_holder_struct)
    __nm_initialize_value_container();
  if (values) {
    NM_GC_LL_NODE* to_insert = NULL;
    // Reuse a pooled node when available to avoid an allocation.
    if (allocated_pool->start) {
      to_insert = allocated_pool->start;
      allocated_pool->start = to_insert->next;
    } else {
      to_insert = NM_ALLOC_NONRUBY(NM_GC_LL_NODE);
    }
    to_insert->val = values;
    to_insert->n = n;
    // Push onto the front of the live list (LIFO).
    to_insert->next = gc_value_holder_struct->start;
    gc_value_holder_struct->start = to_insert;
  }
}
549
+
550
/*
 * Unregister an array of VALUEs with the gc to allow normal
 * garbage collection to occur again.
 *
 * Matches on the `values` pointer only (`n` is not compared), and removes
 * just the most recently registered node for that pointer.
 */
void nm_unregister_values(VALUE* values, size_t n) {
  if (values) {
    if (gc_value_holder_struct) {
      NM_GC_LL_NODE* curr = gc_value_holder_struct->start;
      NM_GC_LL_NODE* last = NULL;
      while (curr) {
        if (curr->val == values) {
          // Splice the node out of the live list...
          if (last) {
            last->next = curr->next;
          } else {
            gc_value_holder_struct->start = curr->next;
          }
          // ...and return it, cleared, to the allocation pool for reuse.
          curr->next = allocated_pool->start;
          curr->val = NULL;
          curr->n = 0;
          allocated_pool->start = curr;
          break;
        }
        last = curr;
        curr = curr->next;
      }
    }
  }
}
578
+
579
+
580
/**
 * Register a single VALUE as in use to avoid garbage collection.
 * Thin wrapper around nm_register_values with n == 1.
 */
void nm_register_value(VALUE* val) {
  nm_register_values(val, 1);
}
586
+
587
/**
 * Unregister a single VALUE to allow normal garbage collection.
 * Thin wrapper around nm_unregister_values with n == 1.
 */
void nm_unregister_value(VALUE* val) {
  nm_unregister_values(val, 1);
}
593
+
594
/**
 * Removes all instances of a single VALUE in the gc list. This can be
 * dangerous. Primarily used when something is about to be
 * freed and replaced so that any residual registrations won't access after
 * free.
 **/
void nm_completely_unregister_value(VALUE* val) {
  if (gc_value_holder_struct) {
    NM_GC_LL_NODE* curr = gc_value_holder_struct->start;
    NM_GC_LL_NODE* last = NULL;
    while (curr) {
      if (curr->val == val) {
        // Splice this node out of the live list; unlike
        // nm_unregister_values, keep scanning for further matches.
        if (last) {
          last->next = curr->next;
        } else {
          gc_value_holder_struct->start = curr->next;
        }
        NM_GC_LL_NODE* temp_next = curr->next;
        // Return the cleared node to the pool and continue from its successor.
        curr->next = allocated_pool->start;
        curr->val = NULL;
        curr->n = 0;
        allocated_pool->start = curr;
        curr = temp_next;
      } else {
        last = curr;
        curr = curr->next;
      }
    }
  }
}
624
+
625
+
626
+
627
/**
 * Register a STORAGE struct of the supplied stype to avoid garbage collection
 * of its internals.
 *
 * Delegates to the storage-specific methods. They will check dtype and ignore
 * non-rubyobject dtypes, so it's safe to pass any storage in.
 */
void nm_register_storage(nm::stype_t stype, const STORAGE* storage) {
  STYPE_REGISTER_TABLE(ttable);  // declares `ttable`, a per-stype function table
  ttable[stype](storage);
}
638
+
639
/**
 * Unregister a STORAGE struct of the supplied stype to allow normal garbage collection
 * of its internals.
 *
 * Delegates to the storage-specific methods. They will check dtype and ignore
 * non-rubyobject dtypes, so it's safe to pass any storage in.
 *
 */
void nm_unregister_storage(nm::stype_t stype, const STORAGE* storage) {
  STYPE_UNREGISTER_TABLE(ttable);  // declares `ttable`, a per-stype function table
  ttable[stype](storage);
}
651
+
652
+ /**
653
+ * Registers an NMATRIX struct to avoid garbage collection of its internals.
654
+ */
655
+ void nm_register_nmatrix(NMATRIX* nmatrix) {
656
+ if (nmatrix)
657
+ nm_register_storage(nmatrix->stype, nmatrix->storage);
658
+ }
659
+
660
+ /**
661
+ * Unregisters an NMATRIX struct to avoid garbage collection of its internals.
662
+ */
663
+ void nm_unregister_nmatrix(NMATRIX* nmatrix) {
664
+ if (nmatrix)
665
+ nm_unregister_storage(nmatrix->stype, nmatrix->storage);
666
+ }
667
+
668
+ /*
669
+ * call-seq:
670
+ * dtype -> Symbol
671
+ *
672
+ * Get the data type (dtype) of a matrix, e.g., :byte, :int8, :int16, :int32,
673
+ * :int64, :float32, :float64, :complex64, :complex128,
674
+ * or :object (the last is a Ruby object).
675
+ */
676
+ static VALUE nm_dtype(VALUE self) {
677
+ ID dtype = rb_intern(DTYPE_NAMES[NM_DTYPE(self)]);
678
+ return ID2SYM(dtype);
679
+ }
680
+
681
+
682
+ /*
683
+ * call-seq:
684
+ * upcast(first_dtype, second_dtype) -> Symbol
685
+ *
686
+ * Given a binary operation between types t1 and t2, what type will be returned?
687
+ *
688
+ * This is a singleton method on NMatrix, e.g., NMatrix.upcast(:int32, :int64)
689
+ */
690
+ static VALUE nm_upcast(VALUE self, VALUE t1, VALUE t2) {
691
+ nm::dtype_t d1 = nm_dtype_from_rbsymbol(t1),
692
+ d2 = nm_dtype_from_rbsymbol(t2);
693
+
694
+ return ID2SYM(rb_intern( DTYPE_NAMES[ Upcast[d1][d2] ] ));
695
+ }
696
+
697
+
698
+ /*
699
+ * call-seq:
700
+ default_value -> ...
701
+ *
702
+ * Get the default value for the matrix. For dense, this is undefined and will return Qnil. For list, it is user-defined.
703
+ * For yale, it's going to be some variation on zero, but may be Qfalse or Qnil.
704
+ */
705
+ static VALUE nm_default_value(VALUE self) {
706
+ switch(NM_STYPE(self)) {
707
+ case nm::YALE_STORE:
708
+ return nm_yale_default_value(self);
709
+ case nm::LIST_STORE:
710
+ return nm_list_default_value(self);
711
+ case nm::DENSE_STORE:
712
+ default:
713
+ return Qnil;
714
+ }
715
+ }
716
+
717
+
718
+ /*
719
+ * call-seq:
720
+ * each_with_indices -> Enumerator
721
+ *
722
+ * Iterate over all entries of any matrix in standard storage order (as with #each), and include the indices.
723
+ */
724
+ static VALUE nm_each_with_indices(VALUE nmatrix) {
725
+ NM_CONSERVATIVE(nm_register_value(&nmatrix));
726
+ VALUE to_return = Qnil;
727
+
728
+ switch(NM_STYPE(nmatrix)) {
729
+ case nm::YALE_STORE:
730
+ to_return = nm_yale_each_with_indices(nmatrix);
731
+ break;
732
+ case nm::DENSE_STORE:
733
+ to_return = nm_dense_each_with_indices(nmatrix);
734
+ break;
735
+ case nm::LIST_STORE:
736
+ to_return = nm_list_each_with_indices(nmatrix, false);
737
+ break;
738
+ default:
739
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
740
+ rb_raise(nm_eDataTypeError, "Not a proper storage type");
741
+ }
742
+
743
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
744
+ return to_return;
745
+ }
746
+
747
+ /*
748
+ * call-seq:
749
+ * each_stored_with_indices -> Enumerator
750
+ *
751
+ * Iterate over the stored entries of any matrix. For dense and yale, this iterates over non-zero
752
+ * entries; for list, this iterates over non-default entries. Yields dim+1 values for each entry:
753
+ * i, j, ..., and the entry itself.
754
+ */
755
+ static VALUE nm_each_stored_with_indices(VALUE nmatrix) {
756
+ NM_CONSERVATIVE(nm_register_value(&nmatrix));
757
+ VALUE to_return = Qnil;
758
+
759
+ switch(NM_STYPE(nmatrix)) {
760
+ case nm::YALE_STORE:
761
+ to_return = nm_yale_each_stored_with_indices(nmatrix);
762
+ break;
763
+ case nm::DENSE_STORE:
764
+ to_return = nm_dense_each_with_indices(nmatrix);
765
+ break;
766
+ case nm::LIST_STORE:
767
+ to_return = nm_list_each_with_indices(nmatrix, true);
768
+ break;
769
+ default:
770
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
771
+ rb_raise(nm_eDataTypeError, "Not a proper storage type");
772
+ }
773
+
774
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
775
+ return to_return;
776
+ }
777
+
778
+
779
+ /*
780
+ * call-seq:
781
+ * map_stored -> Enumerator
782
+ *
783
+ * Iterate over the stored entries of any matrix. For dense and yale, this iterates over non-zero
784
+ * entries; for list, this iterates over non-default entries. Yields dim+1 values for each entry:
785
+ * i, j, ..., and the entry itself.
786
+ */
787
+ static VALUE nm_map_stored(VALUE nmatrix) {
788
+ NM_CONSERVATIVE(nm_register_value(&nmatrix));
789
+ VALUE to_return = Qnil;
790
+
791
+ switch(NM_STYPE(nmatrix)) {
792
+ case nm::YALE_STORE:
793
+ to_return = nm_yale_map_stored(nmatrix);
794
+ break;
795
+ case nm::DENSE_STORE:
796
+ to_return = nm_dense_map(nmatrix);
797
+ break;
798
+ case nm::LIST_STORE:
799
+ to_return = nm_list_map_stored(nmatrix, Qnil);
800
+ break;
801
+ default:
802
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
803
+ rb_raise(nm_eDataTypeError, "Not a proper storage type");
804
+ }
805
+
806
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
807
+ return to_return;
808
+ }
809
+
810
+ /*
811
+ * call-seq:
812
+ * each_ordered_stored_with_indices -> Enumerator
813
+ *
814
+ * Very similar to #each_stored_with_indices. The key difference is that it enforces matrix ordering rather
815
+ * than storage ordering, which only matters if your matrix is Yale.
816
+ */
817
+ static VALUE nm_each_ordered_stored_with_indices(VALUE nmatrix) {
818
+ NM_CONSERVATIVE(nm_register_value(&nmatrix));
819
+ VALUE to_return = Qnil;
820
+
821
+ switch(NM_STYPE(nmatrix)) {
822
+ case nm::YALE_STORE:
823
+ to_return = nm_yale_each_ordered_stored_with_indices(nmatrix);
824
+ break;
825
+ case nm::DENSE_STORE:
826
+ to_return = nm_dense_each_with_indices(nmatrix);
827
+ break;
828
+ case nm::LIST_STORE:
829
+ to_return = nm_list_each_with_indices(nmatrix, true);
830
+ break;
831
+ default:
832
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
833
+ rb_raise(nm_eDataTypeError, "Not a proper storage type");
834
+ }
835
+
836
+ NM_CONSERVATIVE(nm_unregister_value(&nmatrix));
837
+ return to_return;
838
+ }
839
+
840
+
841
/*
 * Equality operator. Returns a single true or false value indicating whether
 * the matrices are equivalent.
 *
 * For elementwise, use =~ instead.
 *
 * This method will raise an exception if dimensions do not match.
 *
 * When stypes differ, this function calls a protected Ruby method.
 */
static VALUE nm_eqeq(VALUE left, VALUE right) {
  // Pin both operands against GC; the mixed-stype path calls back into Ruby.
  NM_CONSERVATIVE(nm_register_value(&left));
  NM_CONSERVATIVE(nm_register_value(&right));

  NMATRIX *l, *r;

  CheckNMatrixType(left);
  CheckNMatrixType(right);

  UnwrapNMatrix(left, l);
  UnwrapNMatrix(right, r);

  bool result = false;

  // Check that the shapes match before going any further.
  // Note: every rb_raise path unregisters first, since rb_raise longjmps.
  if (l->storage->dim != r->storage->dim) {
    NM_CONSERVATIVE(nm_unregister_value(&left));
    NM_CONSERVATIVE(nm_unregister_value(&right));
    rb_raise(nm_eShapeError, "cannot compare matrices with different dimension");
  }

  size_t dim = l->storage->dim;
  for (size_t i=0; i<dim; i++) {
    if (l->storage->shape[i] != r->storage->shape[i]) {
      NM_CONSERVATIVE(nm_unregister_value(&left));
      NM_CONSERVATIVE(nm_unregister_value(&right));
      rb_raise(nm_eShapeError, "cannot compare matrices with different shapes");
    }
  }

  if (l->stype != r->stype) { // DIFFERENT STYPES

    // NOTE(review): these helpers return a Ruby VALUE that is converted to
    // bool. This relies on Qfalse being 0; a Qnil return would read as true.
    // Confirm the Ruby-side helpers only return true/false.
    if (l->stype == nm::DENSE_STORE)
      result = rb_funcall(left, rb_intern("dense_eql_sparse?"), 1, right);
    else if (r->stype == nm::DENSE_STORE)
      result = rb_funcall(right, rb_intern("dense_eql_sparse?"), 1, left);
    else
      result = rb_funcall(left, rb_intern("sparse_eql_sparse?"), 1, right);

  } else {

    switch(l->stype) { // SAME STYPES
    case nm::DENSE_STORE:
      result = nm_dense_storage_eqeq(l->storage, r->storage);
      break;
    case nm::LIST_STORE:
      result = nm_list_storage_eqeq(l->storage, r->storage);
      break;
    case nm::YALE_STORE:
      result = nm_yale_storage_eqeq(l->storage, r->storage);
      break;
    }
  }

  NM_CONSERVATIVE(nm_unregister_value(&left));
  NM_CONSERVATIVE(nm_unregister_value(&right));

  return result ? Qtrue : Qfalse;
}
910
+
911
// Elementwise binary operations exposed to Ruby. Each invocation expands to a
// wrapper function (e.g. ADD -> the method backing NMatrix#+) that dispatches
// on the receiver's stype.
DEF_ELEMENTWISE_RUBY_ACCESSOR(ADD, add)
DEF_ELEMENTWISE_RUBY_ACCESSOR(SUB, subtract)
DEF_ELEMENTWISE_RUBY_ACCESSOR(MUL, multiply)
DEF_ELEMENTWISE_RUBY_ACCESSOR(DIV, divide)
DEF_ELEMENTWISE_RUBY_ACCESSOR(POW, power)
DEF_ELEMENTWISE_RUBY_ACCESSOR(MOD, mod)
DEF_ELEMENTWISE_RUBY_ACCESSOR(EQEQ, eqeq)
DEF_ELEMENTWISE_RUBY_ACCESSOR(NEQ, neq)
DEF_ELEMENTWISE_RUBY_ACCESSOR(LEQ, leq)
DEF_ELEMENTWISE_RUBY_ACCESSOR(GEQ, geq)
DEF_ELEMENTWISE_RUBY_ACCESSOR(LT, lt)
DEF_ELEMENTWISE_RUBY_ACCESSOR(GT, gt)

// Elementwise unary math operations, applied entry-by-entry.
DEF_UNARY_RUBY_ACCESSOR(SIN, sin)
DEF_UNARY_RUBY_ACCESSOR(COS, cos)
DEF_UNARY_RUBY_ACCESSOR(TAN, tan)
DEF_UNARY_RUBY_ACCESSOR(ASIN, asin)
DEF_UNARY_RUBY_ACCESSOR(ACOS, acos)
DEF_UNARY_RUBY_ACCESSOR(ATAN, atan)
DEF_UNARY_RUBY_ACCESSOR(SINH, sinh)
DEF_UNARY_RUBY_ACCESSOR(COSH, cosh)
DEF_UNARY_RUBY_ACCESSOR(TANH, tanh)
DEF_UNARY_RUBY_ACCESSOR(ASINH, asinh)
DEF_UNARY_RUBY_ACCESSOR(ACOSH, acosh)
DEF_UNARY_RUBY_ACCESSOR(ATANH, atanh)
DEF_UNARY_RUBY_ACCESSOR(EXP, exp)
DEF_UNARY_RUBY_ACCESSOR(LOG2, log2)
DEF_UNARY_RUBY_ACCESSOR(LOG10, log10)
DEF_UNARY_RUBY_ACCESSOR(SQRT, sqrt)
DEF_UNARY_RUBY_ACCESSOR(ERF, erf)
DEF_UNARY_RUBY_ACCESSOR(ERFC, erfc)
DEF_UNARY_RUBY_ACCESSOR(CBRT, cbrt)
DEF_UNARY_RUBY_ACCESSOR(GAMMA, gamma)
DEF_UNARY_RUBY_ACCESSOR(NEGATE, negate)
DEF_UNARY_RUBY_ACCESSOR(FLOOR, floor)
DEF_UNARY_RUBY_ACCESSOR(CEIL, ceil)

// Two-argument math operations where argument order matters.
DEF_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(ATAN2, atan2)
DEF_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(LDEXP, ldexp)
DEF_NONCOM_ELEMENTWISE_RUBY_ACCESSOR(HYPOT, hypot)
951
+
952
/*
 * Ruby accessor for elementwise log. Takes an optional base argument;
 * without one, the natural log (base e) is used.
 */
static VALUE nm_unary_log(int argc, VALUE* argv, VALUE self) {
  NM_CONSERVATIVE(nm_register_values(argv, argc));
  const double default_log_base = exp(1.0);  // base e
  NMATRIX* left;
  UnwrapNMatrix(self, left);
  std::string sym;

  // Pick the Ruby-side implementation matching this storage type.
  switch(left->stype) {
  case nm::DENSE_STORE:
    sym = "__dense_unary_log__";
    break;
  case nm::YALE_STORE:
    sym = "__yale_unary_log__";
    break;
  case nm::LIST_STORE:
    sym = "__list_unary_log__";
    break;
  }
  // NOTE(review): argv is unregistered before argv[0] is passed to rb_funcall
  // below; this appears to assume argv remains reachable on the caller's
  // stack — confirm.
  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  if (argc > 0) { //supplied a base
    return rb_funcall(self, rb_intern(sym.c_str()), 1, argv[0]);
  }
  return rb_funcall(self, rb_intern(sym.c_str()), 1, nm::RubyObject(default_log_base).rval);
}
976
+
977
/*
 * Ruby accessor for elementwise round. Takes an optional precision argument;
 * without one, entries are rounded to 0 decimal places.
 */
static VALUE nm_unary_round(int argc, VALUE* argv, VALUE self) {
  NM_CONSERVATIVE(nm_register_values(argv, argc));
  const int default_precision = 0;  // round to integer by default
  NMATRIX* left;
  UnwrapNMatrix(self, left);
  std::string sym;

  // Pick the Ruby-side implementation matching this storage type.
  switch(left->stype) {
  case nm::DENSE_STORE:
    sym = "__dense_unary_round__";
    break;
  case nm::YALE_STORE:
    sym = "__yale_unary_round__";
    break;
  case nm::LIST_STORE:
    sym = "__list_unary_round__";
    break;
  }
  // NOTE(review): argv is unregistered before argv[0] is passed to rb_funcall
  // below; this appears to assume argv remains reachable on the caller's
  // stack — confirm.
  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  if (argc > 0) { //supplied precision
    return rb_funcall(self, rb_intern(sym.c_str()), 1, argv[0]);
  }
  return rb_funcall(self, rb_intern(sym.c_str()), 1, nm::RubyObject(default_precision).rval);
}
1001
+
1002
+ //DEF_ELEMENTWISE_RUBY_ACCESSOR(ATAN2, atan2)
1003
+ //DEF_ELEMENTWISE_RUBY_ACCESSOR(LDEXP, ldexp)
1004
+ //DEF_ELEMENTWISE_RUBY_ACCESSOR(HYPOT, hypot)
1005
+
1006
/*
 * call-seq:
 *     hermitian? -> Boolean
 *
 * Is this matrix hermitian?
 *
 * Definition: http://en.wikipedia.org/wiki/Hermitian_matrix
 *
 * For non-complex matrices, this function should return the same result as symmetric?.
 */
static VALUE nm_hermitian(VALUE self) {
  // Shares its implementation with symmetric?; the second argument requests
  // conjugation of the compared entries.
  return is_symmetric(self, true);
}
1019
+
1020
+
1021
/*
 * call-seq:
 *     complex_conjugate_bang -> NMatrix
 *
 * Transform the matrix (in-place) to its complex conjugate. Only works on complex matrices.
 *
 * Bang should imply that no copy is being made, even temporarily.
 */
static VALUE nm_complex_conjugate_bang(VALUE self) {

  NMATRIX* m;
  void* elem;
  size_t size, p;

  UnwrapNMatrix(self, m);

  // Locate the raw element buffer and its length for the supported stypes.
  // The else-branch raises (rb_raise does not return), so size/elem are set
  // on every path that reaches the loops below.
  if (m->stype == nm::DENSE_STORE) {

    size = nm_storage_count_max_elements(NM_STORAGE(self));
    elem = NM_STORAGE_DENSE(self)->elements;

  } else if (m->stype == nm::YALE_STORE) {

    size = nm_yale_storage_get_size(NM_STORAGE_YALE(self));
    elem = NM_STORAGE_YALE(self)->a;

  } else {
    rb_raise(rb_eNotImpError, "please cast to yale or dense (complex) first");
  }

  // Walk through and negate the imaginary component
  // NOTE(review): for non-complex dtypes both branches are skipped and the
  // matrix is returned unchanged — confirm this silent no-op is intended.
  if (NM_DTYPE(self) == nm::COMPLEX64) {

    for (p = 0; p < size; ++p) {
      reinterpret_cast<nm::Complex64*>(elem)[p].i = -reinterpret_cast<nm::Complex64*>(elem)[p].i;
    }

  } else if (NM_DTYPE(self) == nm::COMPLEX128) {

    for (p = 0; p < size; ++p) {
      reinterpret_cast<nm::Complex128*>(elem)[p].i = -reinterpret_cast<nm::Complex128*>(elem)[p].i;
    }

  }
  return self;
}
1067
+
1068
+ /*
1069
+ * call-seq:
1070
+ * __reshape!__ -> NMatrix
1071
+ *
1072
+ * Reshapes the matrix (in-place) to the desired shape. Note that this function does not do a resize; the product of
1073
+ * the new and old shapes' components must be equal.
1074
+ *
1075
+ */
1076
+ static VALUE nm_reshape_bang(VALUE self, VALUE arg){
1077
+ NMATRIX* m;
1078
+ UnwrapNMatrix(self, m);
1079
+ if(m->stype == nm::DENSE_STORE){
1080
+ DENSE_STORAGE* s = NM_STORAGE_DENSE(self);
1081
+ VALUE shape_ary = arg;
1082
+ size_t dim;
1083
+ size_t size = nm_storage_count_max_elements(s);
1084
+ size_t new_size = 1;
1085
+ size_t* shape = interpret_shape(shape_ary, &dim);
1086
+ for (size_t index = 0; index < dim; ++index){
1087
+ new_size *= shape[index];}
1088
+
1089
+ if (size == new_size){
1090
+ s->shape = shape;
1091
+ s->dim = dim;
1092
+ NM_FREE(s->offset);
1093
+ s->offset = NM_ALLOC_N(size_t, dim);
1094
+ memset(s->offset, 0, sizeof(size_t)*dim);
1095
+ size_t i, j;
1096
+ size_t* stride = NM_ALLOC_N(size_t, dim);
1097
+ for (i = 0; i < dim; ++i) {
1098
+ stride[i] = 1;
1099
+ for (j = i+1; j < dim; ++j) {
1100
+ stride[i] *= shape[j];
1101
+ }
1102
+ }
1103
+ NM_FREE(s->stride);
1104
+ s->stride = stride;
1105
+ return self;
1106
+ }
1107
+ else
1108
+ rb_raise(rb_eArgError, "reshape cannot resize; size of new and old matrices must match");
1109
+ }
1110
+ else {
1111
+ rb_raise(rb_eNotImpError, "reshape in place only for dense stype");
1112
+ }
1113
+ }
1114
+
1115
/*
 * Helper function for creating a matrix. You have to create the storage and pass it in, but you don't
 * need to worry about deleting it.
 */
NMATRIX* nm_create(nm::stype_t stype, STORAGE* storage) {
  // Protect the storage's internals while NM_ALLOC may trigger GC.
  nm_register_storage(stype, storage);
  NMATRIX* mat = NM_ALLOC(NMATRIX);

  mat->stype   = stype;
  mat->storage = storage;

  nm_unregister_storage(stype, storage);
  return mat;
}
1129
+
1130
/*
 * @see nm_init
 *
 * Keyword-style constructor backend: NMatrix.new(shape, initial, dtype:, stype:,
 * capacity:, default:). Parses the arguments, creates the storage, and (for
 * sparse stypes given an initial array) fills the matrix via a temporary dense
 * matrix and a full-range slice assignment.
 *
 * GC note: every nm_register_* call below is paired with a matching
 * nm_unregister_* before return; the ordering is significant and should not
 * be rearranged.
 */
static VALUE nm_init_new_version(int argc, VALUE* argv, VALUE self) {
  NM_CONSERVATIVE(nm_register_values(argv, argc));
  NM_CONSERVATIVE(nm_register_value(&self));
  VALUE shape_ary, initial_ary, hash;
  //VALUE shape_ary, default_val, capacity, initial_ary, dtype_sym, stype_sym;
  // Mandatory args: shape, dtype, stype
  // "11:" = one required arg, one optional, then a trailing options hash.
  rb_scan_args(argc, argv, "11:", &shape_ary, &initial_ary, &hash); // &stype_sym, &dtype_sym, &default_val, &capacity);

  NM_CONSERVATIVE(nm_register_value(&shape_ary));
  NM_CONSERVATIVE(nm_register_value(&initial_ary));
  NM_CONSERVATIVE(nm_register_value(&hash));
  // Get the shape.
  size_t dim;
  size_t* shape = interpret_shape(shape_ary, &dim);
  void* init;              // default value for sparse stypes (C representation)
  void* v = NULL;          // initial element buffer (C representation)
  size_t v_size = 0;       // number of elements in v

  nm::stype_t stype = nm::DENSE_STORE;
  nm::dtype_t dtype = nm::RUBYOBJ;
  VALUE dtype_sym = Qnil, stype_sym = Qnil, default_val_num = Qnil, capacity_num = Qnil;
  size_t capacity = 0;
  // Pull the recognized options out of the keyword hash, if one was given.
  if (!NIL_P(hash)) {
    dtype_sym    = rb_hash_aref(hash, ID2SYM(nm_rb_dtype));
    stype_sym    = rb_hash_aref(hash, ID2SYM(nm_rb_stype));
    capacity_num = rb_hash_aref(hash, ID2SYM(nm_rb_capacity));
    NM_CONSERVATIVE(nm_register_value(&capacity_num));
    default_val_num = rb_hash_aref(hash, ID2SYM(nm_rb_default));
    NM_CONSERVATIVE(nm_register_value(&default_val_num));
  }

  // stype ||= :dense
  stype = !NIL_P(stype_sym) ? nm_stype_from_rbsymbol(stype_sym) : nm::DENSE_STORE;

  // dtype ||= h[:dtype] || guess_dtype(initial_ary) || :object
  if (NIL_P(initial_ary) && NIL_P(dtype_sym))
    dtype = nm::RUBYOBJ;
  else if (NIL_P(dtype_sym))
    dtype = nm_dtype_guess(initial_ary);
  else
    dtype = nm_dtype_from_rbsymbol(dtype_sym);

  // if stype != :dense
  //   if initial_ary.nil?
  //     init = h[:default] || 0
  //   elsif initial_ary.is_a?(Array)
  //     init = initial_ary.size > 1 ? (h[:default] || 0) : initial_ary[0]
  //   else
  //     init = initial_ary # not an array, just a value
  //   end
  // end
  if (stype != nm::DENSE_STORE) {
    if (!NIL_P(default_val_num))
      init = rubyobj_to_cval(default_val_num, dtype);
    else if (NIL_P(initial_ary))
      init = NULL;
    else if (RB_TYPE_P(initial_ary, T_ARRAY))
      // A single-element array doubles as the default value.
      init = RARRAY_LEN(initial_ary) == 1 ? rubyobj_to_cval(rb_ary_entry(initial_ary, 0), dtype) : NULL;
    else
      init = rubyobj_to_cval(initial_ary, dtype);

    if (dtype == nm::RUBYOBJ) {
      // init holds a VALUE; keep it visible to the GC.
      nm_register_values(reinterpret_cast<VALUE*>(init), 1);
    }
  }

  // capacity = h[:capacity] || 0
  if (stype == nm::YALE_STORE) {
    if (!NIL_P(capacity_num)) capacity = FIX2INT(capacity_num);
  }

  if (!NIL_P(initial_ary)) {

    // Scalar initial values are treated as a one-element buffer.
    if (RB_TYPE_P(initial_ary, T_ARRAY)) v_size = RARRAY_LEN(initial_ary);
    else v_size = 1;

    v = interpret_initial_value(initial_ary, dtype);

    if (dtype == nm::RUBYOBJ) {
      nm_register_values(reinterpret_cast<VALUE*>(v), v_size);
    }
  }

  // :object matrices MUST be initialized.
  else if (stype == nm::DENSE_STORE && dtype == nm::RUBYOBJ) {
    // Pretend [nil] was passed for RUBYOBJ.
    v = NM_ALLOC(VALUE);
    *(VALUE*)v = Qnil;

    v_size = 1;

  }

  NMATRIX* nmatrix;
  UnwrapNMatrix(self, nmatrix);

  nmatrix->stype = stype;

  // Create the backing storage for the chosen stype.
  switch (stype) {
  case nm::DENSE_STORE:
    nmatrix->storage = (STORAGE*)nm_dense_storage_create(dtype, shape, dim, v, v_size);
    break;

  case nm::LIST_STORE:
    nmatrix->storage = (STORAGE*)nm_list_storage_create(dtype, shape, dim, init);
    break;

  case nm::YALE_STORE:
    nmatrix->storage = (STORAGE*)nm_yale_storage_create(dtype, shape, dim, capacity);
    nm_yale_storage_init((YALE_STORAGE*)(nmatrix->storage), init);
    break;
  }

  nm_register_storage(stype, nmatrix->storage);

  // If we're not creating a dense, and an initial array was provided, use that and multi-slice-set
  // to set the contents of the matrix right now.
  if (stype != nm::DENSE_STORE && v_size > 1) {
    // Build a full-range slice (:* in every dimension).
    VALUE* slice_argv = NM_ALLOCA_N(VALUE, dim);
    nm_register_values(slice_argv, dim);
    size_t* tmp_shape = NM_ALLOC_N(size_t, dim);
    for (size_t m = 0; m < dim; ++m) {
      slice_argv[m] = ID2SYM(nm_rb_mul); // :* -- full range
      tmp_shape[m] = shape[m];
    }

    SLICE slice_s;
    SLICE* slice = &slice_s;
    slice->coords  = NM_ALLOCA_N(size_t, dim);
    slice->lengths = NM_ALLOCA_N(size_t, dim);
    init_slice_no_alloc(slice, dim, dim, slice_argv, shape);

    // Create a temporary dense matrix and use it to do a slice assignment on self.
    NMATRIX* tmp = nm_create(nm::DENSE_STORE, (STORAGE*)nm_dense_storage_create(dtype, tmp_shape, dim, v, v_size));
    nm_register_nmatrix(tmp);
    VALUE rb_tmp = Data_Wrap_Struct(CLASS_OF(self), nm_mark, nm_delete, tmp);
    nm_unregister_nmatrix(tmp);
    nm_register_value(&rb_tmp);
    if (stype == nm::YALE_STORE) nm_yale_storage_set(self, slice, rb_tmp);
    else                         nm_list_storage_set(self, slice, rb_tmp);

    // We need to free v if it's not the same size as tmp -- because tmp will have made a copy instead.
    //if (nm_storage_count_max_elements(tmp->storage) != v_size)
    //  NM_FREE(v);

    // nm_delete(tmp); // This seems to enrage the garbage collector (because rb_tmp is still available). It'd be better if we could force it to free immediately, but no sweat.

    nm_unregister_value(&rb_tmp);
    nm_unregister_values(slice_argv, dim);
  }

  // Unwind the registrations made above, in the matching cases.
  if (!NIL_P(initial_ary) && dtype == nm::RUBYOBJ) {
    nm_unregister_values(reinterpret_cast<VALUE*>(v), v_size);
  }

  if (stype != nm::DENSE_STORE && dtype == nm::RUBYOBJ) {
    nm_unregister_values(reinterpret_cast<VALUE*>(init), 1);
  }

  if (!NIL_P(hash)) {
    NM_CONSERVATIVE(nm_unregister_value(&capacity_num));
    NM_CONSERVATIVE(nm_unregister_value(&default_val_num));
  }

  NM_CONSERVATIVE(nm_unregister_value(&shape_ary));
  NM_CONSERVATIVE(nm_unregister_value(&initial_ary));
  NM_CONSERVATIVE(nm_unregister_value(&hash));

  NM_CONSERVATIVE(nm_unregister_value(&self));
  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  nm_unregister_storage(stype, nmatrix->storage);

  return self;
}
1307
+
1308
/*
 * call-seq:
 *     new(shape) -> NMatrix
 *     new(shape, initial_value) -> NMatrix
 *     new(shape, initial_array) -> NMatrix
 *     new(shape, initial_value, options) -> NMatrix
 *     new(shape, initial_array, options) -> NMatrix
 *
 * Create a new NMatrix.
 *
 * The only mandatory argument is shape, which may be a positive integer or an array of positive integers.
 *
 * It is recommended that you supply an initialization value or array of values. Without one, Yale and List matrices will
 * be initialized to 0; and dense matrices will be undefined.
 *
 * Additional options may be provided using keyword arguments. The keywords are +:dtype+, +:stype+, +:capacity+, and
 * +:default+. Only Yale uses a capacity argument, which is used to reserve the initial size of its storage vectors.
 * List and Yale both accept a default value (which itself defaults to 0). This default is taken from the initial value
 * if such a value is given; it is more likely to be required when an initial array is provided.
 *
 * The storage type, or stype, is used to specify whether we want a +:dense+, +:list+, or +:yale+ matrix; dense is the
 * default.
 *
 * The data type, or dtype, can be one of: :byte, :int8, :int16, :int32, :int64, :float32, :float64, :complex64,
 * :complex128, or :object. The constructor will attempt to guess it from the initial value/array/default
 * provided, if any. Otherwise, the default is :object, which stores any type of Ruby object.
 *
 * In addition to the above, there is a legacy constructor from the alpha version. To use that version, you must be
 * providing exactly four arguments. It is now deprecated.
 *
 * There is one additional constructor for advanced users, which takes seven arguments and is only for creating Yale
 * matrices with known IA, JA, and A arrays. This is used primarily internally for IO, e.g., reading Matlab matrices,
 * which are stored in old Yale (not our Yale) format. But be careful; there are no overflow warnings. All of these
 * constructors are defined for power-users. Everyone else should probably resort to the shortcut functions defined in
 * shortcuts.rb.
 */
static VALUE nm_init(int argc, VALUE* argv, VALUE nm) {
  NM_CONSERVATIVE(nm_register_value(&nm));
  NM_CONSERVATIVE(nm_register_values(argv, argc));

  if (argc <= 3) { // Call the new constructor unless all four arguments are given (or the 7-arg version is given)
    NM_CONSERVATIVE(nm_unregister_values(argv, argc));
    NM_CONSERVATIVE(nm_unregister_value(&nm));
    return nm_init_new_version(argc, argv, nm);
  }

  /* First, determine stype (dense by default) */
  nm::stype_t stype;
  size_t offset = 0;  // index into argv where the shape argument lives

  if (!SYMBOL_P(argv[0]) && !RB_TYPE_P(argv[0], T_STRING)) {
    stype = nm::DENSE_STORE;

  } else {
    // 0: String or Symbol
    stype  = interpret_stype(argv[0]);
    offset = 1;
  }

  // If there are 7 arguments and Yale, refer to a different init function with fewer sanity checks.
  if (argc == 7) {
    if (stype == nm::YALE_STORE) {
      NM_CONSERVATIVE(nm_unregister_values(argv, argc));
      NM_CONSERVATIVE(nm_unregister_value(&nm));
      return nm_init_yale_from_old_yale(argv[1], argv[2], argv[3], argv[4], argv[5], argv[6], nm);

    } else {
      NM_CONSERVATIVE(nm_unregister_values(argv, argc));
      NM_CONSERVATIVE(nm_unregister_value(&nm));
      rb_raise(rb_eArgError, "Expected 2-4 arguments (or 7 for internal Yale creation)");
    }
  }

  // 1: Array or Fixnum
  size_t dim;
  size_t* shape = interpret_shape(argv[offset], &dim);

  // 2-3: dtype
  nm::dtype_t dtype = interpret_dtype(argc-1-offset, argv+offset+1, stype);

  size_t init_cap = 0, init_val_len = 0;
  void* init_val = NULL;
  if (!SYMBOL_P(argv[1+offset]) || RB_TYPE_P(argv[1+offset], T_ARRAY)) {
    // Initial value provided (could also be initial capacity, if yale).

    if (stype == nm::YALE_STORE && NM_RUBYVAL_IS_NUMERIC(argv[1+offset])) {
      init_cap = FIX2UINT(argv[1+offset]);

    } else {
      // 4: initial value / dtype
      init_val = interpret_initial_value(argv[1+offset], dtype);

      if (RB_TYPE_P(argv[1+offset], T_ARRAY)) init_val_len = RARRAY_LEN(argv[1+offset]);
      else                                    init_val_len = 1;
    }

  } else {
    // DType is RUBYOBJ.

    if (stype == nm::DENSE_STORE) {
      /*
       * No need to initialize dense with any kind of default value unless it's
       * an RUBYOBJ matrix.
       */
      if (dtype == nm::RUBYOBJ) {
        // Pretend [nil] was passed for RUBYOBJ.
        init_val = NM_ALLOC(VALUE);
        *(VALUE*)init_val = Qnil;

        init_val_len = 1;

      } else {
        init_val = NULL;
      }
    } else if (stype == nm::LIST_STORE) {
      // List storage defaults to an all-zero-bytes element.
      init_val = NM_ALLOC_N(char, DTYPE_SIZES[dtype]);
      std::memset(init_val, 0, DTYPE_SIZES[dtype]);
    }
  }

  // Keep ruby-object initial values visible to the GC during storage creation.
  if (dtype == nm::RUBYOBJ) {
    nm_register_values(reinterpret_cast<VALUE*>(init_val), init_val_len);
  }

  // TODO: Update to allow an array as the initial value.
  NMATRIX* nmatrix;
  UnwrapNMatrix(nm, nmatrix);

  nmatrix->stype = stype;

  switch (stype) {
  case nm::DENSE_STORE:
    nmatrix->storage = (STORAGE*)nm_dense_storage_create(dtype, shape, dim, init_val, init_val_len);
    break;

  case nm::LIST_STORE:
    nmatrix->storage = (STORAGE*)nm_list_storage_create(dtype, shape, dim, init_val);
    break;

  case nm::YALE_STORE:
    nmatrix->storage = (STORAGE*)nm_yale_storage_create(dtype, shape, dim, init_cap);
    nm_yale_storage_init((YALE_STORAGE*)(nmatrix->storage), NULL);
    break;
  }

  if (dtype == nm::RUBYOBJ) {
    nm_unregister_values(reinterpret_cast<VALUE*>(init_val), init_val_len);
  }

  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  NM_CONSERVATIVE(nm_unregister_value(&nm));

  return nm;
}
1462
+
1463
+
1464
/*
 * Helper for nm_cast_with_types which uses the C types instead of the Ruby objects.
 * Called by nm_cast_with_types.
 *
 * Allocates a new NMATRIX whose storage is a copy of self's, converted to the
 * requested stype/dtype. init_ptr supplies the default value for sparse
 * targets. The caller owns the returned matrix.
 */
NMATRIX* nm_cast_with_ctype_args(NMATRIX* self, nm::stype_t new_stype, nm::dtype_t new_dtype, void* init_ptr) {

  // Protect self's internals while NM_ALLOC and the copy may trigger GC.
  nm_register_nmatrix(self);

  NMATRIX* lhs = NM_ALLOC(NMATRIX);
  lhs->stype   = new_stype;

  // Copy the storage
  // CAST_TABLE is a 2-D dispatch table indexed [target stype][source stype].
  CAST_TABLE(cast_copy);
  lhs->storage = cast_copy[lhs->stype][self->stype](self->storage, new_dtype, init_ptr);

  nm_unregister_nmatrix(self);

  return lhs;
}
1483
+
1484
/*
 * Cast NMatrix with given new_stype and new_dtype. Called by nm_cast.
 *
 * Wraps the copied matrix in a Ruby object of the same class as self.
 */
VALUE nm_cast_with_types(VALUE self, nm::stype_t new_stype, nm::dtype_t new_dtype,
                         void* init_ptr) {
  NMATRIX *rhs;

  UnwrapNMatrix( self, rhs );

  NMATRIX* m = nm_cast_with_ctype_args(rhs, new_stype, new_dtype, init_ptr);
  // Protect the new matrix while Data_Wrap_Struct may trigger GC.
  nm_register_nmatrix(m);

  VALUE to_return = Data_Wrap_Struct(CLASS_OF(self), nm_mark, nm_delete, m);

  nm_unregister_nmatrix(m);
  return to_return;
}
1501
+
1502
/*
 * call-seq:
 *     cast_full(stype) -> NMatrix
 *     cast_full(stype, dtype, sparse_basis) -> NMatrix
 *
 * Copy constructor for changing dtypes and stypes.
 */
VALUE nm_cast(VALUE self, VALUE new_stype_symbol, VALUE new_dtype_symbol, VALUE init) {
  NM_CONSERVATIVE(nm_register_value(&self));
  NM_CONSERVATIVE(nm_register_value(&init));

  nm::dtype_t new_dtype = nm_dtype_from_rbsymbol(new_dtype_symbol);
  nm::stype_t new_stype = nm_stype_from_rbsymbol(new_stype_symbol);

  CheckNMatrixType(self);
  // Convert the Ruby default value into the target dtype's C representation
  // on the stack (alloca), so no cleanup is needed.
  void* init_ptr = NM_ALLOCA_N(char, DTYPE_SIZES[new_dtype]);
  rubyval_to_cval(init, new_dtype, init_ptr);

  VALUE to_return = nm_cast_with_types(self, new_stype, new_dtype, init_ptr);

  NM_CONSERVATIVE(nm_unregister_value(&self));
  NM_CONSERVATIVE(nm_unregister_value(&init));
  return to_return;

}
1527
+
1528
/*
 * Copy constructor for transposing.
 *
 * Returns a new Ruby-wrapped NMatrix whose storage is the transposed copy of
 * self's, preserving the stype.
 */
static VALUE nm_init_transposed(VALUE self) {
  NM_CONSERVATIVE(nm_register_value(&self));

  // Per-stype transpose-copy dispatch table, indexed by stype.
  static STORAGE* (*storage_copy_transposed[nm::NUM_STYPES])(const STORAGE* rhs_base) = {
    nm_dense_storage_copy_transposed,
    nm_list_storage_copy_transposed,
    nm_yale_storage_copy_transposed
  };

  NMATRIX* lhs = nm_create( NM_STYPE(self),
                            storage_copy_transposed[NM_STYPE(self)]( NM_STORAGE(self) )
                          );
  // Protect the new matrix while Data_Wrap_Struct may trigger GC.
  nm_register_nmatrix(lhs);
  VALUE to_return = Data_Wrap_Struct(CLASS_OF(self), nm_mark, nm_delete, lhs);

  nm_unregister_nmatrix(lhs);
  NM_CONSERVATIVE(nm_unregister_value(&self));
  return to_return;
}
1550
+
1551
/*
 * Copy constructor for no change of dtype or stype (used for #initialize_copy hook).
 *
 * Copies original's storage into copy (same stype and dtype) and returns copy.
 */
static VALUE nm_init_copy(VALUE copy, VALUE original) {
  NM_CONSERVATIVE(nm_register_value(&copy));
  NM_CONSERVATIVE(nm_register_value(&original));

  NMATRIX *lhs, *rhs;

  CheckNMatrixType(original);

  // Copying onto itself is a no-op.
  if (copy == original) {
    NM_CONSERVATIVE(nm_unregister_value(&copy));
    NM_CONSERVATIVE(nm_unregister_value(&original));
    return copy;
  }

  UnwrapNMatrix( original, rhs );
  UnwrapNMatrix( copy,     lhs );

  lhs->stype = rhs->stype;

  // Copy the storage
  // Same-stype/same-dtype entry of the cast table performs a plain deep copy.
  CAST_TABLE(ttable);
  lhs->storage = ttable[lhs->stype][rhs->stype](rhs->storage, rhs->storage->dtype, NULL);

  NM_CONSERVATIVE(nm_unregister_value(&copy));
  NM_CONSERVATIVE(nm_unregister_value(&original));

  return copy;
}
1582
+
1583
+ /*
1584
+ * Get major, minor, and release components of NMatrix::VERSION. Store in function parameters. Doesn't get
1585
+ * the "pre" field currently (beta1/rc1/etc).
1586
+ */
1587
+ static void get_version_info(uint16_t& major, uint16_t& minor, uint16_t& release) {
1588
+ // Get VERSION and split it on periods. Result is an Array.
1589
+ VALUE cVersion = rb_const_get(cNMatrix, rb_intern("VERSION"));
1590
+
1591
+ // Convert each to an integer
1592
+ major = FIX2INT(rb_const_get(cVersion, rb_intern("MAJOR")));
1593
+ minor = FIX2INT(rb_const_get(cVersion, rb_intern("MINOR")));
1594
+ release = FIX2INT(rb_const_get(cVersion, rb_intern("TINY")));
1595
+ }
1596
+
1597
+
1598
+ /*
1599
+ * Interpret the NMatrix::write symmetry argument (which should be nil or a symbol). Return a symm_t (enum).
1600
+ */
1601
+ static nm::symm_t interpret_symm(VALUE symm) {
1602
+ if (symm == Qnil) return nm::NONSYMM;
1603
+
1604
+ ID rb_symm = rb_intern("symmetric"),
1605
+ rb_skew = rb_intern("skew"),
1606
+ rb_herm = rb_intern("hermitian");
1607
+ // nm_rb_upper, nm_rb_lower already set
1608
+
1609
+ ID symm_id = rb_to_id(symm);
1610
+
1611
+ if (symm_id == rb_symm) return nm::SYMM;
1612
+ else if (symm_id == rb_skew) return nm::SKEW;
1613
+ else if (symm_id == rb_herm) return nm::HERM;
1614
+ else if (symm_id == nm_rb_upper) return nm::UPPER;
1615
+ else if (symm_id == nm_rb_lower) return nm::LOWER;
1616
+ else rb_raise(rb_eArgError, "unrecognized symmetry argument");
1617
+
1618
+ return nm::NONSYMM;
1619
+ }
1620
+
1621
+
1622
+
1623
/*
 * Read a dim-length shape array from f, then skip the zero padding that
 * write_padded_shape appended to round the block out to a 64-bit boundary.
 */
void read_padded_shape(std::ifstream& f, size_t dim, size_t* shape) {
  size_t consumed = 0;

  // Read each extent as a raw size_t.
  for (size_t i = 0; i < dim; ++i) {
    size_t extent;
    f.read(reinterpret_cast<char*>(&extent), sizeof(size_t));
    shape[i] = extent;

    consumed += sizeof(size_t);
  }

  // Skip padding (mirrors the pad bytes emitted by write_padded_shape).
  f.ignore(consumed % 8);
}
1638
+
1639
+
1640
/*
 * Write a dim-length shape array to f, padding with zeros so that the total
 * number of bytes written is a multiple of 8 (one 64-bit block).
 */
void write_padded_shape(std::ofstream& f, size_t dim, size_t* shape) {
  size_t bytes_written = 0;

  // Write shape
  for (size_t i = 0; i < dim; ++i) {
    size_t s = shape[i];
    f.write(reinterpret_cast<const char*>(&s), sizeof(size_t));

    bytes_written += sizeof(size_t);
  }

  // Pad with zeros up to the next 64-bit boundary. Each write below emits
  // sizeof(size_t) bytes, so the counter must also advance by sizeof(size_t).
  // (The original advanced by sizeof(IType), which desynchronizes the loop —
  // and the padding actually emitted — whenever IType and size_t differ in width.)
  size_t zero = 0;
  while (bytes_written % 8) {
    f.write(reinterpret_cast<const char*>(&zero), sizeof(size_t));

    bytes_written += sizeof(size_t);
  }
}
1659
+
1660
+
1661
/*
 * Read `length` padded Yale elements of the given dtype from stream f into
 * storage. Dispatches to the dtype-specialized nm::read_padded_yale_elements
 * template through a macro-generated table; RUBYOBJ is excluded (NO_ROBJ).
 */
void read_padded_yale_elements(std::ifstream& f, YALE_STORAGE* storage, size_t length, nm::symm_t symm, nm::dtype_t dtype) {
  NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ(ttable, nm::read_padded_yale_elements, void, std::ifstream&, YALE_STORAGE*, size_t, nm::symm_t)

  // Invoke the specialization for this dtype.
  ttable[dtype](f, storage, length, symm);
}
1666
+
1667
+
1668
/*
 * Write `length` padded Yale elements of the given dtype from storage to
 * stream f, honoring the requested symmetry. Dispatches through a
 * macro-generated dtype table; RUBYOBJ is excluded (NO_ROBJ).
 */
void write_padded_yale_elements(std::ofstream& f, YALE_STORAGE* storage, size_t length, nm::symm_t symm, nm::dtype_t dtype) {
  // NOTE(review): the stray parameter name `f` inside the macro's type list
  // below appears harmless (macro argument, not a declaration) — confirm
  // against the NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ definition.
  NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ(ttable, nm::write_padded_yale_elements, void, std::ofstream& f, YALE_STORAGE*, size_t, nm::symm_t)

  ttable[dtype](f, storage, length, symm);
}
1673
+
1674
+
1675
/*
 * Read padded dense elements of the given dtype from stream f into storage,
 * expanding symmetric/triangular storage as dictated by symm. Dispatches
 * through a macro-generated dtype table; RUBYOBJ is excluded (NO_ROBJ).
 */
void read_padded_dense_elements(std::ifstream& f, DENSE_STORAGE* storage, nm::symm_t symm, nm::dtype_t dtype) {
  NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ(ttable, nm::read_padded_dense_elements, void, std::ifstream&, DENSE_STORAGE*, nm::symm_t)

  // Invoke the specialization for this dtype.
  ttable[dtype](f, storage, symm);
}
1680
+
1681
+
1682
/*
 * Write padded dense elements of the given dtype from storage to stream f,
 * storing only the triangle implied by symm when applicable. Dispatches
 * through a macro-generated dtype table; RUBYOBJ is excluded (NO_ROBJ).
 */
void write_padded_dense_elements(std::ofstream& f, DENSE_STORAGE* storage, nm::symm_t symm, nm::dtype_t dtype) {
  // NOTE(review): the stray parameter name `f` inside the macro's type list
  // below appears harmless (macro argument, not a declaration) — confirm
  // against the NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ definition.
  NAMED_DTYPE_TEMPLATE_TABLE_NO_ROBJ(ttable, nm::write_padded_dense_elements, void, std::ofstream& f, DENSE_STORAGE*, nm::symm_t)

  ttable[dtype](f, storage, symm);
}
1687
+
1688
+
1689
+ /*
1690
+ * Helper function to get exceptions in the module Errno (e.g., ENOENT). Example:
1691
+ *
1692
+ * rb_raise(rb_get_errno_exc("ENOENT"), RSTRING_PTR(filename));
1693
+ */
1694
+ static VALUE rb_get_errno_exc(const char* which) {
1695
+ return rb_const_get(rb_const_get(rb_cObject, rb_intern("Errno")), rb_intern(which));
1696
+ }
1697
+
1698
+
1699
+
1700
/*
 * Binary file writer for NMatrix standard format. file should be a path, which we aren't going to
 * check very carefully (in other words, this function should generally be called from a Ruby
 * helper method). Function also takes a symmetry argument, which allows us to specify that we only want to
 * save the upper triangular portion of the matrix (or if the matrix is a lower triangular matrix, only
 * the lower triangular portion). nil means regular storage.
 *
 * Output layout: a 64-bit version block, a 64-bit dtype/stype/symm/dim block,
 * the padded shape, then the elements (dense) or counts + elements (yale).
 * Returns Qtrue. Raises NotImplementedError for RUBYOBJ dtype, StorageTypeError
 * for list matrices, and ArgumentError for invalid symmetry requests.
 */
static VALUE nm_write(int argc, VALUE* argv, VALUE self) {
  using std::ofstream;

  if (argc < 1 || argc > 2) {
    rb_raise(rb_eArgError, "Expected one or two arguments");
  }

  // Guard Ruby arguments against GC for the duration of the call.
  NM_CONSERVATIVE(nm_register_values(argv, argc));
  NM_CONSERVATIVE(nm_register_value(&self));

  VALUE file = argv[0],
        symm = argc == 1 ? Qnil : argv[1];

  NMATRIX* nmatrix;
  UnwrapNMatrix( self, nmatrix );

  nm::symm_t symm_ = interpret_symm(symm);

  if (nmatrix->storage->dtype == nm::RUBYOBJ) {
    NM_CONSERVATIVE(nm_unregister_values(argv, argc));
    NM_CONSERVATIVE(nm_unregister_value(&self));
    rb_raise(rb_eNotImpError, "Ruby Object writing is not implemented yet");
  }

  // Get the dtype, stype, itype, and symm and ensure they're the correct number of bytes.
  uint8_t st = static_cast<uint8_t>(nmatrix->stype),
          dt = static_cast<uint8_t>(nmatrix->storage->dtype),
          sm = static_cast<uint8_t>(symm_);
  uint16_t dim = nmatrix->storage->dim;

  //FIXME: Cast the matrix to the smallest possible index type. Write that in the place of IType.

  // Check arguments before starting to write.
  if (nmatrix->stype == nm::LIST_STORE) {
    NM_CONSERVATIVE(nm_unregister_values(argv, argc));
    NM_CONSERVATIVE(nm_unregister_value(&self));
    rb_raise(nm_eStorageTypeError, "cannot save list matrix; cast to yale or dense first");
  }
  if (symm_ != nm::NONSYMM) {
    // NOTE(review): these unregisters run even when none of the checks below
    // raise, yet the success path unregisters again at the end of the
    // function — looks like a potential double-unregister; confirm against
    // the nm_register_* implementation before relying on symm writes.
    NM_CONSERVATIVE(nm_unregister_values(argv, argc));
    NM_CONSERVATIVE(nm_unregister_value(&self));

    if (dim != 2) rb_raise(rb_eArgError, "symmetry/triangularity not defined for a non-2D matrix");
    if (nmatrix->storage->shape[0] != nmatrix->storage->shape[1])
      rb_raise(rb_eArgError, "symmetry/triangularity not defined for a non-square matrix");
    if (symm_ == nm::HERM &&
          dt != static_cast<uint8_t>(nm::COMPLEX64) && dt != static_cast<uint8_t>(nm::COMPLEX128) && dt != static_cast<uint8_t>(nm::RUBYOBJ))
      rb_raise(rb_eArgError, "cannot save a non-complex matrix as hermitian");
  }

  ofstream f(RSTRING_PTR(file), std::ios::out | std::ios::binary);

  // Get the NMatrix version information.
  uint16_t major, minor, release, null16 = 0;
  get_version_info(major, minor, release);

  // WRITE FIRST 64-BIT BLOCK: writer version + 16 bits of zero padding.
  f.write(reinterpret_cast<const char*>(&major), sizeof(uint16_t));
  f.write(reinterpret_cast<const char*>(&minor), sizeof(uint16_t));
  f.write(reinterpret_cast<const char*>(&release), sizeof(uint16_t));
  f.write(reinterpret_cast<const char*>(&null16), sizeof(uint16_t));

  uint8_t ZERO = 0;
  // WRITE SECOND 64-BIT BLOCK: dtype, stype, a zero byte (reserved for the
  // index type, per the FIXME above), symmetry, padding, and dimension count.
  f.write(reinterpret_cast<const char*>(&dt), sizeof(uint8_t));
  f.write(reinterpret_cast<const char*>(&st), sizeof(uint8_t));
  f.write(reinterpret_cast<const char*>(&ZERO),sizeof(uint8_t));
  f.write(reinterpret_cast<const char*>(&sm), sizeof(uint8_t));
  f.write(reinterpret_cast<const char*>(&null16), sizeof(uint16_t));
  f.write(reinterpret_cast<const char*>(&dim), sizeof(uint16_t));

  // Write shape (in 64-bit blocks)
  write_padded_shape(f, nmatrix->storage->dim, nmatrix->storage->shape);

  if (nmatrix->stype == nm::DENSE_STORE) {
    write_padded_dense_elements(f, reinterpret_cast<DENSE_STORAGE*>(nmatrix->storage), symm_, nmatrix->storage->dtype);
  } else if (nmatrix->stype == nm::YALE_STORE) {
    // Yale matrices additionally record ndnz and the total stored length
    // before the element payload.
    YALE_STORAGE* s = reinterpret_cast<YALE_STORAGE*>(nmatrix->storage);
    uint32_t ndnz   = s->ndnz,
             length = nm_yale_storage_get_size(s);
    f.write(reinterpret_cast<const char*>(&ndnz),   sizeof(uint32_t));
    f.write(reinterpret_cast<const char*>(&length), sizeof(uint32_t));

    write_padded_yale_elements(f, s, length, symm_, s->dtype);
  }

  f.close();

  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  NM_CONSERVATIVE(nm_unregister_value(&self));

  return Qtrue;
}
1800
+
1801
+
1802
+ /*
1803
+ * Binary file reader for NMatrix standard format. file should be a path, which we aren't going to
1804
+ * check very carefully (in other words, this function should generally be called from a Ruby
1805
+ * helper method).
1806
+ *
1807
+ * Note that currently, this function will by default refuse to read files that are newer than
1808
+ * your version of NMatrix. To force an override, set the second argument to anything other than nil.
1809
+ *
1810
+ * Returns an NMatrix Ruby object.
1811
+ */
1812
+ static VALUE nm_read(int argc, VALUE* argv, VALUE self) {
1813
+ using std::ifstream;
1814
+
1815
+ NM_CONSERVATIVE(nm_register_values(argv, argc));
1816
+ NM_CONSERVATIVE(nm_register_value(&self));
1817
+
1818
+ VALUE file, force_;
1819
+
1820
+ // Read the arguments
1821
+ rb_scan_args(argc, argv, "11", &file, &force_);
1822
+ bool force = (force_ != Qnil && force_ != Qfalse);
1823
+
1824
+
1825
+ if (!RB_FILE_EXISTS(file)) { // FIXME: Errno::ENOENT
1826
+ NM_CONSERVATIVE(nm_unregister_values(argv, argc));
1827
+ NM_CONSERVATIVE(nm_unregister_value(&self));
1828
+ rb_raise(rb_get_errno_exc("ENOENT"), "%s", RSTRING_PTR(file));
1829
+ }
1830
+
1831
+ // Open a file stream
1832
+ ifstream f(RSTRING_PTR(file), std::ios::in | std::ios::binary);
1833
+
1834
+ uint16_t major, minor, release;
1835
+ get_version_info(major, minor, release); // compare to NMatrix version
1836
+
1837
+ uint16_t fmajor, fminor, frelease, null16;
1838
+
1839
+ // READ FIRST 64-BIT BLOCK
1840
+ f.read(reinterpret_cast<char*>(&fmajor), sizeof(uint16_t));
1841
+ f.read(reinterpret_cast<char*>(&fminor), sizeof(uint16_t));
1842
+ f.read(reinterpret_cast<char*>(&frelease), sizeof(uint16_t));
1843
+ f.read(reinterpret_cast<char*>(&null16), sizeof(uint16_t));
1844
+
1845
+ int ver = major * 10000 + minor * 100 + release,
1846
+ fver = fmajor * 10000 + fminor * 100 + release;
1847
+ if (fver > ver && force == false) {
1848
+ NM_CONSERVATIVE(nm_unregister_values(argv, argc));
1849
+ NM_CONSERVATIVE(nm_unregister_value(&self));
1850
+ rb_raise(rb_eIOError, "File was created in newer version of NMatrix than current (%u.%u.%u)", fmajor, fminor, frelease);
1851
+ }
1852
+ if (null16 != 0) rb_warn("nm_read: Expected zero padding was not zero (0)\n");
1853
+
1854
+ uint8_t dt, st, it, sm;
1855
+ uint16_t dim;
1856
+
1857
+ // READ SECOND 64-BIT BLOCK
1858
+ f.read(reinterpret_cast<char*>(&dt), sizeof(uint8_t));
1859
+ f.read(reinterpret_cast<char*>(&st), sizeof(uint8_t));
1860
+ f.read(reinterpret_cast<char*>(&it), sizeof(uint8_t)); // FIXME: should tell how few bytes indices are stored as
1861
+ f.read(reinterpret_cast<char*>(&sm), sizeof(uint8_t));
1862
+ f.read(reinterpret_cast<char*>(&null16), sizeof(uint16_t));
1863
+ f.read(reinterpret_cast<char*>(&dim), sizeof(uint16_t));
1864
+
1865
+ if (null16 != 0) rb_warn("nm_read: Expected zero padding was not zero (1)");
1866
+ nm::stype_t stype = static_cast<nm::stype_t>(st);
1867
+ nm::dtype_t dtype = static_cast<nm::dtype_t>(dt);
1868
+ nm::symm_t symm = static_cast<nm::symm_t>(sm);
1869
+ //nm::itype_t itype = static_cast<nm::itype_t>(it);
1870
+
1871
+ // READ NEXT FEW 64-BIT BLOCKS
1872
+ size_t* shape = NM_ALLOC_N(size_t, dim);
1873
+ read_padded_shape(f, dim, shape);
1874
+
1875
+ STORAGE* s;
1876
+ if (stype == nm::DENSE_STORE) {
1877
+ s = nm_dense_storage_create(dtype, shape, dim, NULL, 0);
1878
+ nm_register_storage(stype, s);
1879
+
1880
+ read_padded_dense_elements(f, reinterpret_cast<DENSE_STORAGE*>(s), symm, dtype);
1881
+
1882
+ } else if (stype == nm::YALE_STORE) {
1883
+ uint32_t ndnz, length;
1884
+
1885
+ // READ YALE-SPECIFIC 64-BIT BLOCK
1886
+ f.read(reinterpret_cast<char*>(&ndnz), sizeof(uint32_t));
1887
+ f.read(reinterpret_cast<char*>(&length), sizeof(uint32_t));
1888
+
1889
+ s = nm_yale_storage_create(dtype, shape, dim, length); // set length as init capacity
1890
+
1891
+ nm_register_storage(stype, s);
1892
+
1893
+ read_padded_yale_elements(f, reinterpret_cast<YALE_STORAGE*>(s), length, symm, dtype);
1894
+ } else {
1895
+ NM_CONSERVATIVE(nm_unregister_values(argv, argc));
1896
+ NM_CONSERVATIVE(nm_unregister_value(&self));
1897
+ rb_raise(nm_eStorageTypeError, "please convert to yale or dense before saving");
1898
+ }
1899
+
1900
+ NMATRIX* nm = nm_create(stype, s);
1901
+
1902
+ // Return the appropriate matrix object (Ruby VALUE)
1903
+ // FIXME: This should probably return CLASS_OF(self) instead of cNMatrix, but I don't know how that works for
1904
+ // FIXME: class methods.
1905
+ nm_register_nmatrix(nm);
1906
+ VALUE to_return = Data_Wrap_Struct(cNMatrix, nm_mark, nm_delete, nm);
1907
+
1908
+ nm_unregister_nmatrix(nm);
1909
+ NM_CONSERVATIVE(nm_unregister_values(argv, argc));
1910
+ NM_CONSERVATIVE(nm_unregister_value(&self));
1911
+ nm_unregister_storage(stype, s);
1912
+
1913
+ switch(stype) {
1914
+ case nm::DENSE_STORE:
1915
+ case nm::YALE_STORE:
1916
+ return to_return;
1917
+ default: // this case never occurs (due to earlier rb_raise)
1918
+ return Qnil;
1919
+ }
1920
+
1921
+ }
1922
+
1923
+
1924
+
1925
+ /*
1926
+ * Create a new NMatrix helper for handling internal ia, ja, and a arguments.
1927
+ *
1928
+ * This constructor is only called by Ruby code, so we can skip most of the
1929
+ * checks.
1930
+ */
1931
+ static VALUE nm_init_yale_from_old_yale(VALUE shape, VALUE dtype, VALUE ia, VALUE ja, VALUE a, VALUE from_dtype, VALUE nm) {
1932
+ size_t dim = 2;
1933
+ size_t* shape_ = interpret_shape(shape, &dim);
1934
+ nm::dtype_t dtype_ = nm_dtype_from_rbsymbol(dtype);
1935
+ char *ia_ = RSTRING_PTR(ia),
1936
+ *ja_ = RSTRING_PTR(ja),
1937
+ *a_ = RSTRING_PTR(a);
1938
+ nm::dtype_t from_dtype_ = nm_dtype_from_rbsymbol(from_dtype);
1939
+ NMATRIX* nmatrix;
1940
+
1941
+ UnwrapNMatrix( nm, nmatrix );
1942
+
1943
+ nmatrix->stype = nm::YALE_STORE;
1944
+ nmatrix->storage = (STORAGE*)nm_yale_storage_create_from_old_yale(dtype_, shape_, ia_, ja_, a_, from_dtype_);
1945
+
1946
+ return nm;
1947
+ }
1948
+
1949
+ /*
1950
+ * Check to determine whether matrix is a reference to another matrix.
1951
+ */
1952
+ static VALUE nm_is_ref(VALUE self) {
1953
+ if (NM_SRC(self) == NM_STORAGE(self)) return Qfalse;
1954
+ return Qtrue;
1955
+ }
1956
+
1957
+ /*
1958
+ * call-seq:
1959
+ * slice -> ...
1960
+ *
1961
+ * Access the contents of an NMatrix at given coordinates, using copying.
1962
+ *
1963
+ * n.slice(3,3) # => 5.0
1964
+ * n.slice(0..1,0..1) #=> matrix [2,2]
1965
+ *
1966
+ */
1967
+ static VALUE nm_mget(int argc, VALUE* argv, VALUE self) {
1968
+ static void* (*ttable[nm::NUM_STYPES])(const STORAGE*, SLICE*) = {
1969
+ nm_dense_storage_get,
1970
+ nm_list_storage_get,
1971
+ nm_yale_storage_get
1972
+ };
1973
+ nm::stype_t stype = NM_STYPE(self);
1974
+ return nm_xslice(argc, argv, ttable[stype], nm_delete, self);
1975
+ }
1976
+
1977
+ /*
1978
+ * call-seq:
1979
+ * matrix[indices] -> ...
1980
+ *
1981
+ * Access the contents of an NMatrix at given coordinates by reference.
1982
+ *
1983
+ * n[3,3] # => 5.0
1984
+ * n[0..1,0..1] #=> matrix [2,2]
1985
+ *
1986
+ */
1987
+ static VALUE nm_mref(int argc, VALUE* argv, VALUE self) {
1988
+ static void* (*ttable[nm::NUM_STYPES])(const STORAGE*, SLICE*) = {
1989
+ nm_dense_storage_ref,
1990
+ nm_list_storage_ref,
1991
+ nm_yale_storage_ref
1992
+ };
1993
+ nm::stype_t stype = NM_STYPE(self);
1994
+ return nm_xslice(argc, argv, ttable[stype], nm_delete_ref, self);
1995
+ }
1996
+
1997
/*
 * Modify the contents of an NMatrix in the given cell
 *
 *     n[3,3] = 5.0
 *
 * Also returns the new contents, so you can chain:
 *
 *     n[3,3] = n[2,3] = 5.0
 *
 * The last element of argv is the value to store; the preceding elements are
 * the coordinates/slice specification. Raises ArgumentError when more than
 * dim+1 arguments are supplied.
 */
static VALUE nm_mset(int argc, VALUE* argv, VALUE self) {

  size_t dim = NM_DIM(self); // last arg is the value

  VALUE to_return = Qnil;

  if ((size_t)(argc) > NM_DIM(self)+1) {
    rb_raise(rb_eArgError, "wrong number of arguments (%d for %lu)", argc, effective_dim(NM_STORAGE(self))+1);
  } else {
    // Guard arguments against GC while we build the slice and write the value.
    NM_CONSERVATIVE(nm_register_value(&self));
    NM_CONSERVATIVE(nm_register_values(argv, argc));

    // Stack-allocated slice: coordinates/lengths live on the C stack.
    SLICE slice_s;
    SLICE* slice = &slice_s;
    slice->coords = NM_ALLOCA_N(size_t, dim);
    slice->lengths = NM_ALLOCA_N(size_t, dim);
    // Interpret argv[0..argc-2] as the slice specification.
    init_slice_no_alloc(slice, dim, argc-1, argv, NM_STORAGE(self)->shape);

    // Stype-indexed table of storage setters.
    static void (*ttable[nm::NUM_STYPES])(VALUE, SLICE*, VALUE) = {
      nm_dense_storage_set,
      nm_list_storage_set,
      nm_yale_storage_set
    };

    ttable[NM_STYPE(self)](self, slice, argv[argc-1]);

    // Return the assigned value so assignments can be chained.
    to_return = argv[argc-1];

    NM_CONSERVATIVE(nm_unregister_value(&self));
    NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  }

  return to_return;
}
2040
+
2041
/*
 * Matrix multiply (dot product): against another matrix or a vector.
 *
 * For elementwise, use * instead.
 *
 * The two matrices must be of the same stype (for now). If dtype differs, an upcast will occur.
 *
 * Dispatches on the right operand: numeric scalar -> scalar multiply; Ruby
 * Array -> NotImplementedError (convert first); NMatrix -> dot product (or,
 * for two 1-D operands of equal length, an elementwise multiply + sum).
 */
static VALUE nm_multiply(VALUE left_v, VALUE right_v) {
  NM_CONSERVATIVE(nm_register_value(&left_v));
  NM_CONSERVATIVE(nm_register_value(&right_v));

  NMATRIX *left, *right;

  UnwrapNMatrix( left_v, left );

  if (NM_RUBYVAL_IS_NUMERIC(right_v)) {
    // Scalar case: delegate to the scalar-multiply helper.
    NM_CONSERVATIVE(nm_unregister_value(&left_v));
    NM_CONSERVATIVE(nm_unregister_value(&right_v));
    return matrix_multiply_scalar(left, right_v);
  }

  else if (RB_TYPE_P(right_v, T_ARRAY)) {
    NM_CONSERVATIVE(nm_unregister_value(&left_v));
    NM_CONSERVATIVE(nm_unregister_value(&right_v));
    rb_raise(rb_eNotImpError, "please convert array to nx1 or 1xn NMatrix first");
  }

  else { // both are matrices (probably)
    CheckNMatrixType(right_v);
    UnwrapNMatrix( right_v, right );

    // work like vector dot product for 1dim
    if (left->storage->dim == 1 && right->storage->dim == 1) {
      if (left->storage->shape[0] != right->storage->shape[0]) {
        NM_CONSERVATIVE(nm_unregister_value(&left_v));
        NM_CONSERVATIVE(nm_unregister_value(&right_v));
        rb_raise(rb_eArgError, "The left- and right-hand sides of the operation must have the same dimensionality.");
      } else {
        // Dot product = elementwise multiply followed by Ruby-side #sum.
        VALUE result = elementwise_op(nm::EW_MUL, left_v, right_v);
        VALUE to_return = rb_funcall(result, rb_intern("sum"),0);
        NM_CONSERVATIVE(nm_unregister_value(&left_v));
        NM_CONSERVATIVE(nm_unregister_value(&right_v));
        return to_return;
      }
    }

    // NOTE(review): this reads left->storage->shape[1] even when only one
    // operand is 1-D (the combined-1-D case returned above) — for a 1-D left
    // operand that index looks out of bounds; confirm callers never hit it.
    if (left->storage->shape[1] != right->storage->shape[0]) {
      NM_CONSERVATIVE(nm_unregister_value(&left_v));
      NM_CONSERVATIVE(nm_unregister_value(&right_v));
      rb_raise(rb_eArgError, "incompatible dimensions");
    }

    if (left->stype != right->stype) {
      NM_CONSERVATIVE(nm_unregister_value(&left_v));
      NM_CONSERVATIVE(nm_unregister_value(&right_v));
      rb_raise(rb_eNotImpError, "matrices must have same stype");
    }

    NM_CONSERVATIVE(nm_unregister_value(&left_v));
    NM_CONSERVATIVE(nm_unregister_value(&right_v));
    return matrix_multiply(left, right);

  }

  // Unreachable: every branch above returns or raises.
  NM_CONSERVATIVE(nm_unregister_value(&left_v));
  NM_CONSERVATIVE(nm_unregister_value(&right_v));

  return Qnil;
}
2110
+
2111
+
2112
+ /*
2113
+ * call-seq:
2114
+ * dim -> Integer
2115
+ *
2116
+ * Get the number of dimensions of a matrix.
2117
+ *
2118
+ * In other words, if you set your matrix to be 3x4, the dim is 2. If the
2119
+ * matrix was initialized as 3x4x3, the dim is 3.
2120
+ *
2121
+ * Use #effective_dim to get the dimension of an NMatrix which acts as a vector (e.g., a column or row).
2122
+ */
2123
+ static VALUE nm_dim(VALUE self) {
2124
+ return INT2FIX(NM_STORAGE(self)->dim);
2125
+ }
2126
+
2127
+ /*
2128
+ * call-seq:
2129
+ * shape -> Array
2130
+ *
2131
+ * Get the shape (dimensions) of a matrix.
2132
+ */
2133
+ static VALUE nm_shape(VALUE self) {
2134
+ NM_CONSERVATIVE(nm_register_value(&self));
2135
+ STORAGE* s = NM_STORAGE(self);
2136
+
2137
+ // Copy elements into a VALUE array and then use those to create a Ruby array with rb_ary_new4.
2138
+ VALUE* shape = NM_ALLOCA_N(VALUE, s->dim);
2139
+ nm_register_values(shape, s->dim);
2140
+ for (size_t index = 0; index < s->dim; ++index)
2141
+ shape[index] = INT2FIX(s->shape[index]);
2142
+
2143
+ nm_unregister_values(shape, s->dim);
2144
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2145
+ return rb_ary_new4(s->dim, shape);
2146
+ }
2147
+
2148
+
2149
+ /*
2150
+ * call-seq:
2151
+ * offset -> Array
2152
+ *
2153
+ * Get the offset (slice position) of a matrix. Typically all zeros, unless you have a reference slice.
2154
+ */
2155
+ static VALUE nm_offset(VALUE self) {
2156
+ NM_CONSERVATIVE(nm_register_value(&self));
2157
+ STORAGE* s = NM_STORAGE(self);
2158
+
2159
+ // Copy elements into a VALUE array and then use those to create a Ruby array with rb_ary_new4.
2160
+ VALUE* offset = NM_ALLOCA_N(VALUE, s->dim);
2161
+ nm_register_values(offset, s->dim);
2162
+ for (size_t index = 0; index < s->dim; ++index)
2163
+ offset[index] = INT2FIX(s->offset[index]);
2164
+
2165
+ nm_unregister_values(offset, s->dim);
2166
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2167
+ return rb_ary_new4(s->dim, offset);
2168
+ }
2169
+
2170
+
2171
+ /*
2172
+ * call-seq:
2173
+ * supershape -> Array
2174
+ *
2175
+ * Get the shape of a slice's parent.
2176
+ */
2177
+ static VALUE nm_supershape(VALUE self) {
2178
+
2179
+ STORAGE* s = NM_STORAGE(self);
2180
+ if (s->src == s) {
2181
+ return nm_shape(self); // easy case (not a slice)
2182
+ }
2183
+ else s = s->src;
2184
+
2185
+ NM_CONSERVATIVE(nm_register_value(&self));
2186
+
2187
+ VALUE* shape = NM_ALLOCA_N(VALUE, s->dim);
2188
+ nm_register_values(shape, s->dim);
2189
+ for (size_t index = 0; index < s->dim; ++index)
2190
+ shape[index] = INT2FIX(s->shape[index]);
2191
+
2192
+ nm_unregister_values(shape, s->dim);
2193
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2194
+ return rb_ary_new4(s->dim, shape);
2195
+ }
2196
+
2197
+ /*
2198
+ * call-seq:
2199
+ * stype -> Symbol
2200
+ *
2201
+ * Get the storage type (stype) of a matrix, e.g., :yale, :dense, or :list.
2202
+ */
2203
+ static VALUE nm_stype(VALUE self) {
2204
+ NM_CONSERVATIVE(nm_register_value(&self));
2205
+ VALUE stype = ID2SYM(rb_intern(STYPE_NAMES[NM_STYPE(self)]));
2206
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2207
+ return stype;
2208
+ }
2209
+
2210
+ /*
2211
+ * call-seq:
2212
+ * symmetric? -> Boolean
2213
+ *
2214
+ * Is this matrix symmetric?
2215
+ */
2216
+ static VALUE nm_symmetric(VALUE self) {
2217
+ return is_symmetric(self, false);
2218
+ }
2219
+
2220
+
2221
+ /*
2222
+ * Gets the dimension of a matrix which might be a vector (have one or more shape components of size 1).
2223
+ */
2224
+ static size_t effective_dim(STORAGE* s) {
2225
+ size_t d = 0;
2226
+ for (size_t i = 0; i < s->dim; ++i) {
2227
+ if (s->shape[i] != 1) d++;
2228
+ }
2229
+ return d;
2230
+ }
2231
+
2232
+
2233
+ /*
2234
+ * call-seq:
2235
+ * effective_dim -> Fixnum
2236
+ *
2237
+ * Returns the number of dimensions that don't have length 1. Guaranteed to be less than or equal to #dim.
2238
+ */
2239
+ static VALUE nm_effective_dim(VALUE self) {
2240
+ return INT2FIX(effective_dim(NM_STORAGE(self)));
2241
+ }
2242
+
2243
+
2244
/*
 * Get a slice of an NMatrix.
 *
 * slice_func is the stype-appropriate accessor (copying or referencing);
 * delete_func is the matching destructor used when wrapping a non-single
 * slice result. A slice resolving to a single element returns that element
 * as a Ruby object; otherwise a new NMatrix wrapping the sliced storage is
 * returned. Raises ArgumentError when more coordinates than dimensions are
 * given.
 */
static VALUE nm_xslice(int argc, VALUE* argv, void* (*slice_func)(const STORAGE*, SLICE*), void (*delete_func)(NMATRIX*), VALUE self) {
  VALUE result = Qnil;

  STORAGE* s = NM_STORAGE(self);

  if (NM_DIM(self) < (size_t)(argc)) {
    rb_raise(rb_eArgError, "wrong number of arguments (%d for %lu)", argc, effective_dim(s));
  } else {

    // Guard arguments (and the pending result) against GC.
    NM_CONSERVATIVE(nm_register_values(argv, argc));
    NM_CONSERVATIVE(nm_register_value(&self));

    nm_register_value(&result);

    // Stack-allocated slice descriptor.
    SLICE slice_s;
    SLICE* slice = &slice_s;
    size_t dim = NM_DIM(self);
    slice->coords = NM_ALLOCA_N(size_t, dim);
    slice->lengths = NM_ALLOCA_N(size_t, dim);
    init_slice_no_alloc(slice, dim, argc, argv, s->shape);

    if (slice->single) {
      // Single-element slice: always use the referencing accessor so nothing
      // needs to be freed, and convert the element to a Ruby object.
      static void* (*ttable[nm::NUM_STYPES])(const STORAGE*, SLICE*) = {
        nm_dense_storage_ref,
        nm_list_storage_ref,
        nm_yale_storage_ref
      };

      if (NM_DTYPE(self) == nm::RUBYOBJ)  result = *reinterpret_cast<VALUE*>( ttable[NM_STYPE(self)](s, slice) );
      else                                result = nm::rubyobj_from_cval( ttable[NM_STYPE(self)](s, slice), NM_DTYPE(self) ).rval;

    } else {
      // Multi-element slice: wrap the sliced storage in a fresh NMatrix of
      // the caller's class, owned by delete_func.
      NMATRIX* mat  = NM_ALLOC(NMATRIX);
      mat->stype    = NM_STYPE(self);
      mat->storage  = (STORAGE*)((*slice_func)( s, slice ));
      nm_register_nmatrix(mat);
      result        = Data_Wrap_Struct(CLASS_OF(self), nm_mark, delete_func, mat);
      nm_unregister_nmatrix(mat);
    }
  }

  // NOTE(review): these unregisters sit outside the else-branch that
  // registered, but the if-branch always raises, so in practice they only run
  // after a successful registration.
  nm_unregister_value(&result);
  NM_CONSERVATIVE(nm_unregister_values(argv, argc));
  NM_CONSERVATIVE(nm_unregister_value(&self));

  return result;
}
2295
+
2296
+ //////////////////////
2297
+ // Helper Functions //
2298
+ //////////////////////
2299
+
2300
+ static VALUE unary_op(nm::unaryop_t op, VALUE self) {
2301
+ NM_CONSERVATIVE(nm_register_value(&self));
2302
+ NMATRIX* left;
2303
+ UnwrapNMatrix(self, left);
2304
+ std::string sym;
2305
+
2306
+ switch(left->stype) {
2307
+ case nm::DENSE_STORE:
2308
+ sym = "__dense_unary_" + nm::UNARYOPS[op] + "__";
2309
+ break;
2310
+ case nm::YALE_STORE:
2311
+ sym = "__yale_unary_" + nm::UNARYOPS[op] + "__";
2312
+ break;
2313
+ case nm::LIST_STORE:
2314
+ sym = "__list_unary_" + nm::UNARYOPS[op] + "__";
2315
+ break;
2316
+ }
2317
+
2318
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2319
+ return rb_funcall(self, rb_intern(sym.c_str()), 0);
2320
+ }
2321
+
2322
+ static void check_dims_and_shape(VALUE left_val, VALUE right_val) {
2323
+ // Check that the left- and right-hand sides have the same dimensionality.
2324
+ if (NM_DIM(left_val) != NM_DIM(right_val)) {
2325
+ rb_raise(rb_eArgError, "The left- and right-hand sides of the operation must have the same dimensionality.");
2326
+ }
2327
+ // Check that the left- and right-hand sides have the same shape.
2328
+ if (memcmp(&NM_SHAPE(left_val, 0), &NM_SHAPE(right_val, 0), sizeof(size_t) * NM_DIM(left_val)) != 0) {
2329
+ rb_raise(rb_eArgError, "The left- and right-hand sides of the operation must have the same shape.");
2330
+ }
2331
+ }
2332
+
2333
+ static VALUE elementwise_op(nm::ewop_t op, VALUE left_val, VALUE right_val) {
2334
+
2335
+ NM_CONSERVATIVE(nm_register_value(&left_val));
2336
+ NM_CONSERVATIVE(nm_register_value(&right_val));
2337
+
2338
+ NMATRIX* left;
2339
+ NMATRIX* result;
2340
+
2341
+ CheckNMatrixType(left_val);
2342
+ UnwrapNMatrix(left_val, left);
2343
+
2344
+ if (!IsNMatrixType(right_val)) {
2345
+ // This is a matrix-scalar element-wise operation.
2346
+ std::string sym;
2347
+ switch(left->stype) {
2348
+ case nm::DENSE_STORE:
2349
+ sym = "__dense_scalar_" + nm::EWOP_NAMES[op] + "__";
2350
+ break;
2351
+ case nm::YALE_STORE:
2352
+ sym = "__yale_scalar_" + nm::EWOP_NAMES[op] + "__";
2353
+ break;
2354
+ case nm::LIST_STORE:
2355
+ sym = "__list_scalar_" + nm::EWOP_NAMES[op] + "__";
2356
+ break;
2357
+ default:
2358
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2359
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2360
+ rb_raise(rb_eNotImpError, "unknown storage type requested scalar element-wise operation");
2361
+ }
2362
+ VALUE symv = rb_intern(sym.c_str());
2363
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2364
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2365
+ return rb_funcall(left_val, symv, 1, right_val);
2366
+
2367
+ } else {
2368
+
2369
+ check_dims_and_shape(left_val, right_val);
2370
+
2371
+ NMATRIX* right;
2372
+ UnwrapNMatrix(right_val, right);
2373
+
2374
+ if (left->stype == right->stype) {
2375
+ std::string sym;
2376
+
2377
+ switch(left->stype) {
2378
+ case nm::DENSE_STORE:
2379
+ sym = "__dense_elementwise_" + nm::EWOP_NAMES[op] + "__";
2380
+ break;
2381
+ case nm::YALE_STORE:
2382
+ sym = "__yale_elementwise_" + nm::EWOP_NAMES[op] + "__";
2383
+ break;
2384
+ case nm::LIST_STORE:
2385
+ sym = "__list_elementwise_" + nm::EWOP_NAMES[op] + "__";
2386
+ break;
2387
+ default:
2388
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2389
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2390
+ rb_raise(rb_eNotImpError, "unknown storage type requested element-wise operation");
2391
+ }
2392
+
2393
+ VALUE symv = rb_intern(sym.c_str());
2394
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2395
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2396
+ return rb_funcall(left_val, symv, 1, right_val);
2397
+
2398
+ } else {
2399
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2400
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2401
+ rb_raise(rb_eArgError, "Element-wise operations are not currently supported between matrices with differing stypes.");
2402
+ }
2403
+ }
2404
+
2405
+ NM_CONSERVATIVE(nm_unregister_value(&left_val));
2406
+ NM_CONSERVATIVE(nm_unregister_value(&right_val));
2407
+ return Data_Wrap_Struct(CLASS_OF(left_val), nm_mark, nm_delete, result);
2408
+ }
2409
+
2410
+ static VALUE noncom_elementwise_op(nm::noncom_ewop_t op, VALUE self, VALUE other, VALUE flip) {
2411
+
2412
+ NM_CONSERVATIVE(nm_register_value(&self));
2413
+ NM_CONSERVATIVE(nm_register_value(&other));
2414
+
2415
+ NMATRIX* self_nm;
2416
+ NMATRIX* result;
2417
+
2418
+ CheckNMatrixType(self);
2419
+ UnwrapNMatrix(self, self_nm);
2420
+
2421
+ if (!IsNMatrixType(other)) {
2422
+ // This is a matrix-scalar element-wise operation.
2423
+ std::string sym;
2424
+ switch(self_nm->stype) {
2425
+ case nm::DENSE_STORE:
2426
+ sym = "__dense_scalar_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2427
+ break;
2428
+ case nm::YALE_STORE:
2429
+ sym = "__yale_scalar_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2430
+ break;
2431
+ case nm::LIST_STORE:
2432
+ sym = "__list_scalar_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2433
+ break;
2434
+ default:
2435
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2436
+ NM_CONSERVATIVE(nm_unregister_value(&other));
2437
+ rb_raise(rb_eNotImpError, "unknown storage type requested scalar element-wise operation");
2438
+ }
2439
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2440
+ NM_CONSERVATIVE(nm_unregister_value(&other));
2441
+ return rb_funcall(self, rb_intern(sym.c_str()), 2, other, flip);
2442
+
2443
+ } else {
2444
+
2445
+ check_dims_and_shape(self, other);
2446
+
2447
+ NMATRIX* other_nm;
2448
+ UnwrapNMatrix(other, other_nm);
2449
+
2450
+ if (self_nm->stype == other_nm->stype) {
2451
+ std::string sym;
2452
+
2453
+ switch(self_nm->stype) {
2454
+ case nm::DENSE_STORE:
2455
+ sym = "__dense_elementwise_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2456
+ break;
2457
+ case nm::YALE_STORE:
2458
+ sym = "__yale_elementwise_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2459
+ break;
2460
+ case nm::LIST_STORE:
2461
+ sym = "__list_elementwise_" + nm::NONCOM_EWOP_NAMES[op] + "__";
2462
+ break;
2463
+ default:
2464
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2465
+ NM_CONSERVATIVE(nm_unregister_value(&other));
2466
+ rb_raise(rb_eNotImpError, "unknown storage type requested element-wise operation");
2467
+ }
2468
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2469
+ NM_CONSERVATIVE(nm_unregister_value(&other));
2470
+ return rb_funcall(self, rb_intern(sym.c_str()), 2, other, flip);
2471
+
2472
+ } else {
2473
+ nm_unregister_value(&self);
2474
+ nm_unregister_value(&other);
2475
+ rb_raise(rb_eArgError, "Element-wise operations are not currently supported between matrices with differing stypes.");
2476
+ }
2477
+ }
2478
+ NM_CONSERVATIVE(nm_unregister_value(&self));
2479
+ NM_CONSERVATIVE(nm_unregister_value(&other));
2480
+ return Data_Wrap_Struct(CLASS_OF(self), nm_mark, nm_delete, result);
2481
+ }
2482
+
2483
+ /*
2484
+ * Check to determine whether matrix is a reference to another matrix.
2485
+ */
2486
+ bool is_ref(const NMATRIX* matrix) {
2487
+ return matrix->storage->src != matrix->storage;
2488
+ }
2489
+
2490
+ /*
2491
+ * Helper function for nm_symmetric and nm_hermitian.
2492
+ */
2493
/*
 * Helper function for nm_symmetric and nm_hermitian.
 *
 * Returns Qtrue iff the matrix is 2-D, square, and (conjugate-)symmetric.
 * Non-square or non-2-D matrices fall through and return Qfalse.
 * Only dense storage is supported; other stypes raise NotImplementedError.
 */
static VALUE is_symmetric(VALUE self, bool hermitian) {
  // Keep `self` visible to the conservative GC for the duration of the check.
  NM_CONSERVATIVE(nm_register_value(&self));

  NMATRIX* m;
  UnwrapNMatrix(self, m);
  // Note: local deliberately shadows the function name; it is the result flag.
  bool is_symmetric = false;

  if (m->storage->shape[0] == m->storage->shape[1] and m->storage->dim == 2) {
    if (NM_STYPE(self) == nm::DENSE_STORE) {
      // hermitian == true checks A == conj(A^T); otherwise A == A^T.
      if (hermitian) {
        is_symmetric = nm_dense_storage_is_hermitian((DENSE_STORAGE*)(m->storage), m->storage->shape[0]);

      } else {
        is_symmetric = nm_dense_storage_is_symmetric((DENSE_STORAGE*)(m->storage), m->storage->shape[0]);
      }

    } else {
      // TODO: Implement, at the very least, yale_is_symmetric. Model it after yale/transp.template.c.
      // Unregister before raising: rb_raise does not return.
      NM_CONSERVATIVE(nm_unregister_value(&self));
      rb_raise(rb_eNotImpError, "symmetric? and hermitian? only implemented for dense currently");
    }

  }
  NM_CONSERVATIVE(nm_unregister_value(&self));
  return is_symmetric ? Qtrue : Qfalse;
}
2519
+
2520
+ ///////////////////////
2521
+ // Utility Functions //
2522
+ ///////////////////////
2523
+
2524
+ /*
2525
+ * Guess the dtype given a Ruby VALUE and return it as a symbol.
2526
+ *
2527
+ * Not to be confused with nm_dtype_guess, which returns an nm::dtype_t. (This calls that.)
2528
+ */
2529
static VALUE nm_guess_dtype(VALUE self, VALUE v) {
  // Map the guessed dtype enum to its name string, interned as a Ruby symbol.
  return ID2SYM(rb_intern(DTYPE_NAMES[nm_dtype_guess(v)]));
}
2532
+
2533
+ /*
2534
+ * Get the minimum allowable dtype for a Ruby VALUE and return it as a symbol.
2535
+ */
2536
static VALUE nm_min_dtype(VALUE self, VALUE v) {
  // Map the minimum-sufficient dtype enum to its name, interned as a Ruby symbol.
  return ID2SYM(rb_intern(DTYPE_NAMES[nm_dtype_min(v)]));
}
2539
+
2540
+ /*
2541
+ * Helper for nm_dtype_min(), handling integers.
2542
+ */
2543
+ nm::dtype_t nm_dtype_min_fixnum(int64_t v) {
2544
+ if (v >= 0 && v <= UCHAR_MAX) return nm::BYTE;
2545
+ else {
2546
+ v = std::abs(v);
2547
+ if (v <= CHAR_MAX) return nm::INT8;
2548
+ else if (v <= SHRT_MAX) return nm::INT16;
2549
+ else if (v <= INT_MAX) return nm::INT32;
2550
+ else return nm::INT64;
2551
+ }
2552
+ }
2553
+
2554
+ /*
2555
+ * Return the minimum dtype required to store a given value.
2556
+ *
2557
+ * This is kind of arbitrary. For Float, it always returns :float32 for example, since in some cases neither :float64
2558
+ * not :float32 are sufficient.
2559
+ *
2560
+ * This function is used in upcasting for scalar math. We want to ensure that :int8 + 1 does not return an :int64, basically.
2561
+ *
2562
+ * FIXME: Eventually, this function should actually look at the value stored in Fixnums (for example), so that it knows
2563
+ * whether to return :int64 or :int32.
2564
+ */
2565
+ nm::dtype_t nm_dtype_min(VALUE v) {
2566
+
2567
+ if (RB_TYPE_P(v, T_FIXNUM))
2568
+ return nm_dtype_min_fixnum(FIX2LONG(v));
2569
+ else if (RB_TYPE_P(v, T_BIGNUM))
2570
+ return nm::INT64;
2571
+ else if (RB_TYPE_P(v, T_FLOAT))
2572
+ return nm::FLOAT32;
2573
+ else if (RB_TYPE_P(v, T_COMPLEX))
2574
+ return nm::COMPLEX64;
2575
+ else if (RB_TYPE_P(v, T_STRING))
2576
+ return RSTRING_LEN(v) == 1 ? nm::BYTE : nm::RUBYOBJ;
2577
+ else if (RB_TYPE_P(v, T_TRUE) || RB_TYPE_P(v, T_FALSE) || RB_TYPE_P(v, T_NIL))
2578
+ return nm::RUBYOBJ;
2579
+ else
2580
+ return nm::RUBYOBJ;
2581
+ }
2582
+
2583
+
2584
+ /*
2585
+ * Guess the data type given a value.
2586
+ *
2587
+ * TODO: Probably needs some work for Bignum.
2588
+ */
2589
nm::dtype_t nm_dtype_guess(VALUE v) {
  if (RB_TYPE_P(v, T_TRUE) || RB_TYPE_P(v, T_FALSE) || RB_TYPE_P(v, T_NIL))
    return nm::RUBYOBJ;
  else if (RB_TYPE_P(v, T_STRING))
    // Single characters are treated as bytes; longer strings stay Ruby objects.
    return RSTRING_LEN(v) == 1 ? nm::BYTE : nm::RUBYOBJ;
  else if (RB_TYPE_P(v, T_FIXNUM))
  // Fixnum maps to the platform's native int width.
  #if SIZEOF_INT == 8
    return nm::INT64;
  #elif SIZEOF_INT == 4
    return nm::INT32;
  #else
    return nm::INT16;
  #endif
  else if (RB_TYPE_P(v, T_BIGNUM))
    return nm::INT64;
  // NOTE(review): these branches key off SIZEOF_FLOAT (the C float size,
  // normally 4). The ==2 case looks unreachable on common platforms, and no
  // Float/Complex branch exists at all for any other size (falling through to
  // the error below) -- confirm this is intended.
  #if SIZEOF_FLOAT == 4
  else if (RB_TYPE_P(v, T_COMPLEX))
    return nm::COMPLEX128;
  else if (RB_TYPE_P(v, T_FLOAT))
    return nm::FLOAT64;
  #elif SIZEOF_FLOAT == 2
  else if (RB_TYPE_P(v, T_COMPLEX))
    return nm::COMPLEX64;
  else if (RB_TYPE_P(v, T_FLOAT))
    return nm::FLOAT32;
  #endif
  else if (RB_TYPE_P(v, T_ARRAY))
    /*
     * May be passed for dense -- for now, just look at the first element.
     *
     * TODO: Look at entire array for most specific type.
     */
    return nm_dtype_guess(RARRAY_AREF(v, 0));
  else {
    // Print the offending object for diagnosis, then raise.
    RB_P(v);
    rb_raise(rb_eArgError, "Unable to guess a data type from provided parameters; data type must be specified manually.");
  }
}
2627
+
2628
+ /*
2629
+ * Modify an existing SLICE object (with properly allocated memory),
2630
+ * so that it will contain the appropriate coordinate and length information
2631
+ * for accessing some part of a matrix.
2632
+ */
2633
static void init_slice_no_alloc(SLICE* slice, size_t dim, int argc, VALUE* arg, size_t* shape) {
  // Keep all slice-argument VALUEs visible to the conservative GC.
  NM_CONSERVATIVE(nm_register_values(arg, argc));

  VALUE beg, end;
  int excl;

  // Assume a single-element access until a Range or :* proves otherwise.
  slice->single = true;

  // r is the shape position; t is the slice position. They may differ when we're dealing with a
  // matrix where the effective dimension is less than the dimension (e.g., a vector).
  for (size_t r = 0, t = 0; r < dim; ++r) {
    // Qnil when the caller supplied fewer slice components than dimensions.
    VALUE v = t == (unsigned int)argc ? Qnil : arg[t];

    // if the current shape indicates a vector and fewer args were supplied than necessary, just use 0
    if (argc - t + r < dim && shape[r] == 1) {
      slice->coords[r] = 0;
      slice->lengths[r] = 1;

    } else if (FIXNUM_P(v)) { // this used CLASS_OF before, which is inefficient for fixnum
      int v_ = FIX2INT(v);
      if (v_ < 0) // checking for negative indexes
        slice->coords[r] = shape[r]+v_;
      else
        slice->coords[r] = v_;
      slice->lengths[r] = 1;
      t++;

    } else if (SYMBOL_P(v) && rb_to_id(v) == nm_rb_mul) { // :* means the whole possible range

      slice->coords[r] = 0;
      slice->lengths[r] = shape[r];
      slice->single = false;
      t++;

    } else if (CLASS_OF(v) == rb_cRange) {
      rb_range_values(arg[t], &beg, &end, &excl);

      int begin_ = FIX2INT(beg);
      int end_ = FIX2INT(end);

      // Negative begin counts back from the end of this dimension.
      slice->coords[r] = (begin_ < 0) ? shape[r] + begin_ : begin_;

      // Exclude last element for a...b range
      if (end_ < 0)
        slice->lengths[r] = shape[r] + end_ - slice->coords[r] + (excl ? 0 : 1);
      else
        slice->lengths[r] = end_ - slice->coords[r] + (excl ? 0 : 1);

      slice->single = false;
      t++;

    } else {
      // Unregister before raising: rb_raise does not return.
      NM_CONSERVATIVE(nm_unregister_values(arg, argc));
      rb_raise(rb_eArgError, "expected Fixnum or Range for slice component instead of %s", rb_obj_classname(v));
    }

    // Reject slices that run off the end of this dimension.
    if (slice->coords[r] > shape[r] || slice->coords[r] + slice->lengths[r] > shape[r]) {
      NM_CONSERVATIVE(nm_unregister_values(arg, argc));
      rb_raise(rb_eRangeError, "slice is larger than matrix in dimension %lu (slice component %lu)", r, t);
    }
  }

  NM_CONSERVATIVE(nm_unregister_values(arg, argc));
}
2697
+
2698
#ifdef BENCHMARK
/*
 * A simple function used when benchmarking NMatrix.
 *
 * Returns wall-clock time in seconds with microsecond resolution.
 */
static double get_time(void) {
  struct timeval t;
  struct timezone tzp;

  gettimeofday(&t, &tzp);

  return t.tv_sec + t.tv_usec*1e-6;
}
#endif
2711
+
2712
+ /*
2713
+ * The argv parameter will be either 1 or 2 elements. If 1, could be either
2714
+ * initial or dtype. If 2, is initial and dtype. This function returns the
2715
+ * dtype.
2716
+ */
2717
static nm::dtype_t interpret_dtype(int argc, VALUE* argv, nm::stype_t stype) {
  int offset;

  // With two args the layout is [initial, dtype]; with one, the single arg
  // may be either, so the dtype candidate is at index 0.
  switch (argc) {
  case 1:
    offset = 0;
    break;

  case 2:
    offset = 1;
    break;

  default:
    rb_raise(rb_eArgError, "Need an initial value or a dtype.");
    break; // unreachable: rb_raise does not return
  }

  if (SYMBOL_P(argv[offset])) {
    return nm_dtype_from_rbsymbol(argv[offset]);

  } else if (RB_TYPE_P(argv[offset], T_STRING)) {
    return nm_dtype_from_rbstring(StringValue(argv[offset]));

  } else if (stype == nm::YALE_STORE) {
    // Yale storage cannot infer a dtype from an initial value.
    rb_raise(rb_eArgError, "Yale storage class requires a dtype.");

  } else {
    // No explicit dtype: infer one from the initial value (always argv[0]).
    return nm_dtype_guess(argv[0]);
  }
}
2747
+
2748
+ /*
2749
+ * Convert an Ruby value or an array of Ruby values into initial C values.
2750
+ */
2751
static void* interpret_initial_value(VALUE arg, nm::dtype_t dtype) {
  NM_CONSERVATIVE(nm_register_value(&arg));

  unsigned int index;
  void* init_val;

  if (RB_TYPE_P(arg, T_ARRAY)) {
    // Array: convert each element into one cell of a contiguous C buffer.
    init_val = NM_ALLOC_N(char, DTYPE_SIZES[dtype] * RARRAY_LEN(arg));
    NM_CHECK_ALLOC(init_val);
    for (index = 0; index < RARRAY_LEN(arg); ++index) {
      rubyval_to_cval(RARRAY_AREF(arg, index), dtype, (char*)init_val + (index * DTYPE_SIZES[dtype]));
    }

  } else {
    // Single value: rubyobj_to_cval allocates and fills one cell.
    init_val = rubyobj_to_cval(arg, dtype);
  }

  NM_CONSERVATIVE(nm_unregister_value(&arg));
  return init_val;
}
2773
+
2774
+ /*
2775
+ * Convert the shape argument, which may be either a Ruby value or an array of
2776
+ * Ruby values, into C values. The second argument is where the dimensionality
2777
+ * of the matrix will be stored. The function itself returns a pointer to the
2778
+ * array describing the shape, which must be freed manually.
2779
+ */
2780
+ static size_t* interpret_shape(VALUE arg, size_t* dim) {
2781
+ NM_CONSERVATIVE(nm_register_value(&arg));
2782
+ size_t* shape;
2783
+
2784
+ if (RB_TYPE_P(arg, T_ARRAY)) {
2785
+ *dim = RARRAY_LEN(arg);
2786
+ shape = NM_ALLOC_N(size_t, *dim);
2787
+
2788
+ for (size_t index = 0; index < *dim; ++index) {
2789
+ shape[index] = FIX2UINT( RARRAY_AREF(arg, index) );
2790
+ }
2791
+
2792
+ } else if (FIXNUM_P(arg)) {
2793
+ *dim = 2;
2794
+ shape = NM_ALLOC_N(size_t, *dim);
2795
+
2796
+ shape[0] = FIX2UINT(arg);
2797
+ shape[1] = FIX2UINT(arg);
2798
+
2799
+ } else {
2800
+ nm_unregister_value(&arg);
2801
+ rb_raise(rb_eArgError, "Expected an array of numbers or a single Fixnum for matrix shape");
2802
+ }
2803
+
2804
+ NM_CONSERVATIVE(nm_unregister_value(&arg));
2805
+ return shape;
2806
+ }
2807
+
2808
+ /*
2809
+ * Convert a Ruby symbol or string into an storage type.
2810
+ */
2811
static nm::stype_t interpret_stype(VALUE arg) {
  if (SYMBOL_P(arg)) {
    return nm_stype_from_rbsymbol(arg);

  } else if (RB_TYPE_P(arg, T_STRING)) {
    return nm_stype_from_rbstring(StringValue(arg));

  } else {
    // rb_raise does not return, so no value is needed on this path.
    rb_raise(rb_eArgError, "Expected storage type");
  }
}
2822
+
2823
+ //////////////////
2824
+ // Math Helpers //
2825
+ //////////////////
2826
+
2827
/*
 * Return storage for `matrix` in dtype `new_dtype`. If the matrix already has
 * that dtype and owns its storage, the existing storage is returned directly;
 * otherwise a same-stype copy is allocated (callers must free it — compare the
 * returned pointer against matrix->storage to tell).
 */
STORAGE* matrix_storage_cast_alloc(NMATRIX* matrix, nm::dtype_t new_dtype) {
  if (matrix->storage->dtype == new_dtype && !is_ref(matrix))
    return matrix->storage;

  // Same-stype copy in the requested dtype (also materializes views).
  CAST_TABLE(cast_copy_storage);
  return cast_copy_storage[matrix->stype][matrix->stype](matrix->storage, new_dtype, NULL);
}
2834
+
2835
/*
 * Cast both operands' storage to their common (upcast) dtype, allocating
 * copies where needed. Each returned pointer equals the matrix's own storage
 * when no copy was required.
 */
STORAGE_PAIR binary_storage_cast_alloc(NMATRIX* left_matrix, NMATRIX* right_matrix) {
  // Protect both operands from GC while allocating.
  nm_register_nmatrix(left_matrix);
  nm_register_nmatrix(right_matrix);

  STORAGE_PAIR casted;
  // The dtype both operands can be represented in without loss.
  nm::dtype_t new_dtype = Upcast[left_matrix->storage->dtype][right_matrix->storage->dtype];

  casted.left = matrix_storage_cast_alloc(left_matrix, new_dtype);
  // casted.left may be freshly allocated; keep it registered while the right
  // side is cast (which may itself allocate and trigger GC).
  nm_register_storage(left_matrix->stype, casted.left);
  casted.right = matrix_storage_cast_alloc(right_matrix, new_dtype);

  nm_unregister_nmatrix(left_matrix);
  nm_unregister_nmatrix(right_matrix);
  nm_unregister_storage(left_matrix->stype, casted.left);

  return casted;
}
2852
+
2853
/*
 * Stub: matrix-scalar multiplication is not implemented at this level.
 */
static VALUE matrix_multiply_scalar(NMATRIX* left, VALUE scalar) {
  rb_raise(rb_eNotImpError, "matrix-scalar multiplication not implemented yet");
  return Qnil; // unreachable: rb_raise does not return
}
2857
+
2858
static VALUE matrix_multiply(NMATRIX* left, NMATRIX* right) {
  nm_register_nmatrix(left);
  nm_register_nmatrix(right);
  ///TODO: multiplication for non-dense and/or non-decimal matrices

  // Make sure both of our matrices are of the correct type.
  STORAGE_PAIR casted = binary_storage_cast_alloc(left, right);
  nm_register_storage(left->stype, casted.left);
  nm_register_storage(right->stype, casted.right);

  // Result shape is rows(left) x cols(right).
  size_t* resulting_shape = NM_ALLOC_N(size_t, 2);
  resulting_shape[0] = left->storage->shape[0];
  resulting_shape[1] = right->storage->shape[1];

  // Sometimes we only need to use matrix-vector multiplication (e.g., GEMM versus GEMV). Find out.
  bool vector = false;
  if (resulting_shape[1] == 1) vector = true;

  // Dispatch table indexed by stype: dense, list, yale.
  static STORAGE* (*storage_matrix_multiply[nm::NUM_STYPES])(const STORAGE_PAIR&, size_t*, bool) = {
    nm_dense_storage_matrix_multiply,
    nm_list_storage_matrix_multiply,
    nm_yale_storage_matrix_multiply
  };

  STORAGE* resulting_storage = storage_matrix_multiply[left->stype](casted, resulting_shape, vector);
  NMATRIX* result = nm_create(left->stype, resulting_storage);
  nm_register_nmatrix(result);

  // Free any casted-storage we created for the multiplication.
  // TODO: Can we make the Ruby GC take care of this stuff now that we're using it?
  // If we did that, we might not have to re-create these every time, right? Or wrong? Need to do
  // more research.
  static void (*free_storage[nm::NUM_STYPES])(STORAGE*) = {
    nm_dense_storage_delete,
    nm_list_storage_delete,
    nm_yale_storage_delete
  };

  // The cast pointers equal the originals only when no copy was needed.
  // NOTE(review): both frees index free_storage by result->stype (== left's
  // stype); if right->stype differs, casted.right would be freed with the
  // wrong deleter — confirm callers guarantee matching stypes here.
  nm_unregister_storage(left->stype, casted.left);
  if (left->storage != casted.left) free_storage[result->stype](casted.left);

  nm_unregister_storage(right->stype, casted.right);
  if (right->storage != casted.right) free_storage[result->stype](casted.right);

  VALUE to_return = result ? Data_Wrap_Struct(cNMatrix, nm_mark, nm_delete, result) : Qnil; // Only if we try to multiply list matrices should we return Qnil.

  nm_unregister_nmatrix(left);
  nm_unregister_nmatrix(right);
  nm_unregister_nmatrix(result);

  return to_return;
}
2910
+
2911
+ /*
2912
+ * Reduce a matrix to hessenberg form.
2913
+ *
2914
+ * == Arguments
2915
+ *
2916
+ * a - The NMatrix to be reduced. This matrix is replaced with the hessenberg form.
2917
+ *
2918
+ * == Notes
2919
+ *
2920
+ * LAPACK free.
2921
+ */
2922
static VALUE nm_hessenberg(VALUE self, VALUE a) {
  // In-place reduction: `a` is both input and output.
  nm_math_hessenberg(a);

  return a;
}
2927
+
2928
+ /*
2929
+ * Calculate the inverse of a matrix with in-place Gauss-Jordan elimination.
2930
+ * Inverse will fail if the largest element in any column in zero.
2931
+ *
2932
+ * LAPACK free.
2933
+ */
2934
static VALUE nm_inverse(VALUE self, VALUE inverse, VALUE bang) {

  if (NM_STYPE(self) != nm::DENSE_STORE) {
    rb_raise(rb_eNotImpError, "needs exact determinant implementation for this matrix stype");
    return Qnil; // unreachable: rb_raise does not return
  }

  if (NM_DIM(self) != 2 || NM_SHAPE0(self) != NM_SHAPE1(self)) {
    rb_raise(nm_eShapeError, "matrices must be square to have an inverse defined");
    return Qnil; // unreachable
  }

  // bang == true: invert self's elements in place and return self;
  // the `inverse` argument is ignored on this path.
  if (bang == Qtrue) {
    nm_math_inverse(NM_SHAPE0(self), NM_STORAGE_DENSE(self)->elements,
      NM_DTYPE(self));

    return self;
  }

  // Non-bang path operates only on `inverse`'s elements.
  // NOTE(review): presumably the caller copies self into `inverse` first —
  // confirm against the Ruby-level caller.
  nm_math_inverse(NM_SHAPE0(inverse), NM_STORAGE_DENSE(inverse)->elements,
    NM_DTYPE(inverse));

  return inverse;
}
2958
+
2959
+ /*
2960
+ * Calculate the exact inverse of a 2x2 or 3x3 matrix.
2961
+ *
2962
+ * Does not test for invertibility!
2963
+ */
2964
static VALUE nm_inverse_exact(VALUE self, VALUE inverse, VALUE lda, VALUE ldb) {
  if (NM_DIM(self) != 2 || NM_SHAPE0(self) != NM_SHAPE1(self)) {
    rb_raise(nm_eShapeError, "matrices must be square to have an inverse defined");
    return Qnil; // unreachable: rb_raise does not return
  }

  // One scratch cell of `dtype`, passed to the cast helpers below.
  nm::dtype_t dtype = NM_DTYPE(self);
  void* result = NM_ALLOCA_N(char, DTYPE_SIZES[dtype]);
  if (dtype == nm::RUBYOBJ) {
    // The stack cell may hold a Ruby VALUE; keep it visible to the GC.
    nm_register_values(reinterpret_cast<VALUE*>(result), 1);
  }
  // List storage has no exact-inverse kernel: go through yale, cast back below.
  nm::stype_t old_stype = NM_STYPE(self);
  if (old_stype == nm::LIST_STORE) {
    self = nm_cast_with_types(self, nm::YALE_STORE, dtype, result);
    inverse = nm_cast_with_types(inverse, nm::YALE_STORE, dtype, result);
  }

  if (NM_STYPE(self) == nm::DENSE_STORE) {
    nm_math_inverse_exact_from_dense(NM_SHAPE0(self),
        NM_STORAGE_DENSE(self)->elements, FIX2INT(lda),
        NM_STORAGE_DENSE(inverse)->elements, FIX2INT(ldb), dtype);
  } else {
    nm_math_inverse_exact_from_yale(NM_SHAPE0(self),
        NM_STORAGE_YALE(self), FIX2INT(lda),
        NM_STORAGE_YALE(inverse), FIX2INT(ldb), dtype);
  }

  // Restore the caller-visible stype.
  if (old_stype == nm::LIST_STORE) {
    inverse = nm_cast_with_types(inverse, nm::LIST_STORE, dtype, result);
  }
  if (dtype == nm::RUBYOBJ) {
    nm_unregister_values(reinterpret_cast<VALUE*>(result), 1);
  }
  return inverse;
}
2999
+
3000
+ /*
3001
+ * Calculate the exact determinant of a dense matrix.
3002
+ *
3003
+ * Returns nil for dense matrices which are not square or number of dimensions other than 2.
3004
+ *
3005
+ * Note: Currently only implemented for 2x2 and 3x3 matrices.
3006
+ */
3007
static VALUE nm_det_exact(VALUE self) {

  if (NM_DIM(self) != 2 || NM_SHAPE0(self) != NM_SHAPE1(self)) {
    rb_raise(nm_eShapeError, "matrices must be square to have a determinant defined");
    return Qnil; // unreachable: rb_raise does not return
  }

  // One cell of `dtype` receives the computed determinant.
  nm::dtype_t dtype = NM_DTYPE(self);
  void* result = NM_ALLOCA_N(char, DTYPE_SIZES[dtype]);
  // No list-storage kernel: compute via a yale-cast copy instead.
  if (NM_STYPE(self) == nm::LIST_STORE) {
    self = nm_cast_with_types(self, nm::YALE_STORE, dtype, result);
  }

  NM_CONSERVATIVE(nm_register_value(&self));

  // Calculate the determinant and then assign it to the return value
  if (NM_STYPE(self) == nm::DENSE_STORE) {
    nm_math_det_exact_from_dense(NM_SHAPE0(self), NM_STORAGE_DENSE(self)->elements,
      NM_SHAPE0(self), NM_DTYPE(self), result);
  } else {
    nm_math_det_exact_from_yale(NM_SHAPE0(self), NM_STORAGE_YALE(self),
      NM_SHAPE0(self), NM_DTYPE(self), result);
  }

  VALUE to_return;
  if (dtype == nm::RUBYOBJ) {
    // The result cell already holds a Ruby VALUE.
    to_return = *reinterpret_cast<VALUE*>(result);

  } else {
    // Convert the raw C value into an equivalent Ruby object.
    to_return = nm::rubyobj_from_cval(result, NM_DTYPE(self)).rval;
  }
  NM_CONSERVATIVE(nm_unregister_value(&self));

  return to_return;
}
3042
+
3043
+
3044
+
3045
+ /*
3046
+ * Returns the pointer to the matrix storage's data. This is useful primarily when you are using FFI with NMatrix --
3047
+ * say, for example, you want to pass a float* to some function, and your NMatrix is a :float32 :dense matrix. Then you
3048
+ * can call this function and get that pointer directly instead of copying the data.
3049
+ */
3050
static VALUE nm_data_pointer(VALUE self) {
  //if (NM_DTYPE(self) == nm::LIST_STORE)
  //  rb_warn("pointer requested for list storage, which may be meaningless");

  // This is actually pretty easy, since all of the storage types have their elements positioned in the same place
  // relative to one another. So yes, believe it or not, this should work just as well for Yale or list storage as for
  // dense.
  // NOTE(review): INT2FIX tags the value by shifting; a pointer with its high
  // bit(s) set may not round-trip through a Fixnum — confirm this is
  // acceptable for the FFI use case this serves.
  return INT2FIX(NM_STORAGE_DENSE(self)->elements);
}
3059
+
3060
+
3061
+ /////////////////
3062
+ // Exposed API //
3063
+ /////////////////
3064
+
3065
+ /*
3066
+ * Create a dense matrix. Used by the NMatrix GSL fork. Unlike nm_create, this one copies all of the
3067
+ * arrays and such passed in -- so you don't have to allocate and pass a new shape object for every
3068
+ * matrix you want to create, for example. Same goes for elements.
3069
+ *
3070
+ * Returns a properly-wrapped Ruby object as a VALUE.
3071
+ *
3072
+ * *** Note that this function is for API only. Please do not use it internally.
3073
+ *
3074
+ * TODO: Add a column-major option for libraries that use column-major matrices.
3075
+ */
3076
+ VALUE rb_nmatrix_dense_create(nm::dtype_t dtype, size_t* shape, size_t dim, void* elements, size_t length) {
3077
+
3078
+ if (dtype == nm::RUBYOBJ) {
3079
+ nm_register_values(reinterpret_cast<VALUE*>(elements), length);
3080
+ }
3081
+
3082
+ NMATRIX* nm;
3083
+ size_t nm_dim;
3084
+ size_t* shape_copy;
3085
+
3086
+ // Do not allow a dim of 1. Treat it as a column or row matrix.
3087
+ if (dim == 1) {
3088
+ nm_dim = 2;
3089
+ shape_copy = NM_ALLOC_N(size_t, nm_dim);
3090
+ shape_copy[0] = shape[0];
3091
+ shape_copy[1] = 1;
3092
+
3093
+ } else {
3094
+ nm_dim = dim;
3095
+ shape_copy = NM_ALLOC_N(size_t, nm_dim);
3096
+ memcpy(shape_copy, shape, sizeof(size_t)*nm_dim);
3097
+ }
3098
+
3099
+ // Copy elements
3100
+ void* elements_copy = NM_ALLOC_N(char, DTYPE_SIZES[dtype]*length);
3101
+ memcpy(elements_copy, elements, DTYPE_SIZES[dtype]*length);
3102
+
3103
+ // allocate and create the matrix and its storage
3104
+ nm = nm_create(nm::DENSE_STORE, nm_dense_storage_create(dtype, shape_copy, dim, elements_copy, length));
3105
+
3106
+ nm_register_nmatrix(nm);
3107
+
3108
+ VALUE to_return = Data_Wrap_Struct(cNMatrix, nm_mark, nm_delete, nm);
3109
+
3110
+ nm_unregister_nmatrix(nm);
3111
+ if (dtype == nm::RUBYOBJ) {
3112
+ nm_unregister_values(reinterpret_cast<VALUE*>(elements), length);
3113
+ }
3114
+
3115
+ // tell Ruby about the matrix and its storage, particularly how to garbage collect it.
3116
+ return to_return;
3117
+ }
3118
+
3119
+ /*
3120
+ * Create a dense vector. Used by the NMatrix GSL fork.
3121
+ *
3122
+ * Basically just a convenience wrapper for rb_nmatrix_dense_create().
3123
+ *
3124
+ * Returns a properly-wrapped Ruby NMatrix object as a VALUE. Included for backwards compatibility
3125
+ * for when NMatrix had an NVector class.
3126
+ */
3127
+ VALUE rb_nvector_dense_create(nm::dtype_t dtype, void* elements, size_t length) {
3128
+ size_t dim = 1, shape = length;
3129
+ return rb_nmatrix_dense_create(dtype, &shape, dim, elements, length);
3130
+ }