RubyGems - numo-linalg-alt - Versions diffs - 0.3.0 → 0.4.1 - Mend

numo-linalg-alt 0.3.0 → 0.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

checksums.yaml +4 -4
data/CHANGELOG.md +9 -0
data/ext/numo/linalg/blas/dot.c +61 -61
data/ext/numo/linalg/blas/dot_sub.c +60 -60
data/ext/numo/linalg/blas/gemm.c +161 -152
data/ext/numo/linalg/blas/gemv.c +135 -131
data/ext/numo/linalg/blas/nrm2.c +54 -54
data/ext/numo/linalg/lapack/gebal.c +87 -0
data/ext/numo/linalg/lapack/gebal.h +15 -0
data/ext/numo/linalg/lapack/gees.c +243 -224
data/ext/numo/linalg/lapack/geev.c +131 -114
data/ext/numo/linalg/lapack/gelsd.c +85 -74
data/ext/numo/linalg/lapack/geqrf.c +56 -55
data/ext/numo/linalg/lapack/gerqf.c +70 -0
data/ext/numo/linalg/lapack/gerqf.h +15 -0
data/ext/numo/linalg/lapack/gesdd.c +100 -90
data/ext/numo/linalg/lapack/gesv.c +84 -82
data/ext/numo/linalg/lapack/gesvd.c +144 -133
data/ext/numo/linalg/lapack/getrf.c +55 -54
data/ext/numo/linalg/lapack/getri.c +68 -67
data/ext/numo/linalg/lapack/getrs.c +96 -92
data/ext/numo/linalg/lapack/gges.c +214 -0
data/ext/numo/linalg/lapack/gges.h +15 -0
data/ext/numo/linalg/lapack/heev.c +56 -54
data/ext/numo/linalg/lapack/heevd.c +56 -54
data/ext/numo/linalg/lapack/heevr.c +111 -100
data/ext/numo/linalg/lapack/hegv.c +79 -76
data/ext/numo/linalg/lapack/hegvd.c +79 -76
data/ext/numo/linalg/lapack/hegvx.c +134 -122
data/ext/numo/linalg/lapack/hetrf.c +56 -52
data/ext/numo/linalg/lapack/lange.c +49 -48
data/ext/numo/linalg/lapack/orgqr.c +65 -64
data/ext/numo/linalg/lapack/orgrq.c +78 -0
data/ext/numo/linalg/lapack/orgrq.h +15 -0
data/ext/numo/linalg/lapack/potrf.c +53 -52
data/ext/numo/linalg/lapack/potri.c +53 -52
data/ext/numo/linalg/lapack/potrs.c +78 -76
data/ext/numo/linalg/lapack/syev.c +56 -54
data/ext/numo/linalg/lapack/syevd.c +56 -54
data/ext/numo/linalg/lapack/syevr.c +109 -100
data/ext/numo/linalg/lapack/sygv.c +79 -75
data/ext/numo/linalg/lapack/sygvd.c +79 -75
data/ext/numo/linalg/lapack/sygvx.c +134 -122
data/ext/numo/linalg/lapack/sytrf.c +58 -54
data/ext/numo/linalg/lapack/trtrs.c +83 -79
data/ext/numo/linalg/lapack/ungqr.c +65 -64
data/ext/numo/linalg/lapack/ungrq.c +78 -0
data/ext/numo/linalg/lapack/ungrq.h +15 -0
data/ext/numo/linalg/linalg.c +24 -13
data/ext/numo/linalg/linalg.h +5 -0
data/ext/numo/linalg/util.c +8 -0
data/ext/numo/linalg/util.h +1 -0
data/lib/numo/linalg/version.rb +1 -1
data/lib/numo/linalg.rb +235 -3
metadata +12 -2

data/ext/numo/linalg/blas/gemv.c CHANGED

@@ -1,138 +1,142 @@
 #include "gemv.h"
-#define DEF_LINALG_OPTIONS(tDType) \
-  struct _gemv_options_##tDType {  \
-    tDType alpha;                  \
-    tDType beta;                   \
-    enum CBLAS_ORDER order;        \
-    enum CBLAS_TRANSPOSE trans;    \
-    blasint m;                     \
-    blasint n;                     \
+#define DEF_LINALG_OPTIONS(tDType)                                                             \
+  struct _gemv_options_##tDType {                                                              \
+    tDType alpha;                                                                              \
+    tDType beta;                                                                               \
+    enum CBLAS_ORDER order;                                                                    \
+    enum CBLAS_TRANSPOSE trans;                                                                \
+    blasint m;                                                                                 \
+    blasint n;                                                                                 \
   };
-#define DEF_LINALG_ITER_FUNC(tDType, fBlasFunc)                                               \
-  static void _iter_##fBlasFunc(na_loop_t* const lp) {                                        \
-    const tDType* a = (tDType*)NDL_PTR(lp, 0);                                                \
-    const tDType* x = (tDType*)NDL_PTR(lp, 1);                                                \
-    tDType* y = (tDType*)NDL_PTR(lp, 2);                                                      \
-    const struct _gemv_options_##tDType* opt = (struct _gemv_options_##tDType*)(lp->opt_ptr); \
-    const blasint lda = opt->n;                                                               \
-    cblas_##fBlasFunc(opt->order, opt->trans, opt->m, opt->n,                                 \
-                      opt->alpha, a, lda, x, 1, opt->beta, y, 1);                             \
+#define DEF_LINALG_ITER_FUNC(tDType, fBlasFunc)                                                \
+  static void _iter_##fBlasFunc(na_loop_t* const lp) {                                         \
+    const tDType* a = (tDType*)NDL_PTR(lp, 0);                                                 \
+    const tDType* x = (tDType*)NDL_PTR(lp, 1);                                                 \
+    tDType* y = (tDType*)NDL_PTR(lp, 2);                                                       \
+    const struct _gemv_options_##tDType* opt = (struct _gemv_options_##tDType*)(lp->opt_ptr);  \
+    const blasint lda = opt->n;                                                                \
+    cblas_##fBlasFunc(                                                                         \
+      opt->order, opt->trans, opt->m, opt->n, opt->alpha, a, lda, x, 1, opt->beta, y, 1        \
+    );                                                                                         \
   }
-#define DEF_LINALG_ITER_FUNC_COMPLEX(tDType, fBlasFunc)                                       \
-  static void _iter_##fBlasFunc(na_loop_t* const lp) {                                        \
-    const tDType* a = (tDType*)NDL_PTR(lp, 0);                                                \
-    const tDType* x = (tDType*)NDL_PTR(lp, 1);                                                \
-    tDType* y = (tDType*)NDL_PTR(lp, 2);                                                      \
-    const struct _gemv_options_##tDType* opt = (struct _gemv_options_##tDType*)(lp->opt_ptr); \
-    const blasint lda = opt->n;                                                               \
-    cblas_##fBlasFunc(opt->order, opt->trans, opt->m, opt->n,                                 \
-                      &opt->alpha, a, lda, x, 1, &opt->beta, y, 1);                           \
+#define DEF_LINALG_ITER_FUNC_COMPLEX(tDType, fBlasFunc)                                        \
+  static void _iter_##fBlasFunc(na_loop_t* const lp) {                                         \
+    const tDType* a = (tDType*)NDL_PTR(lp, 0);                                                 \
+    const tDType* x = (tDType*)NDL_PTR(lp, 1);                                                 \
+    tDType* y = (tDType*)NDL_PTR(lp, 2);                                                       \
+    const struct _gemv_options_##tDType* opt = (struct _gemv_options_##tDType*)(lp->opt_ptr);  \
+    const blasint lda = opt->n;                                                                \
+    cblas_##fBlasFunc(                                                                         \
+      opt->order, opt->trans, opt->m, opt->n, &opt->alpha, a, lda, x, 1, &opt->beta, y, 1      \
+    );                                                                                         \
   }
-#define DEF_LINALG_FUNC(tDType, tNAryClass, fBlasFunc)                                                  \
-  static VALUE _linalg_blas_##fBlasFunc(int argc, VALUE* argv, VALUE self) {                            \
-    VALUE a = Qnil;                                                                                     \
-    VALUE x = Qnil;                                                                                     \
-    VALUE y = Qnil;                                                                                     \
-    VALUE kw_args = Qnil;                                                                               \
-    rb_scan_args(argc, argv, "21:", &a, &x, &y, &kw_args);                                              \
-                                                                                                        \
-    ID kw_table[4] = { rb_intern("alpha"), rb_intern("beta"),                                           \
-                       rb_intern("order"), rb_intern("trans") };                                        \
-    VALUE kw_values[4] = { Qundef, Qundef, Qundef, Qundef };                                            \
-    rb_get_kwargs(kw_args, kw_table, 0, 4, kw_values);                                                  \
-                                                                                                        \
-    if (CLASS_OF(a) != tNAryClass) {                                                                    \
-      a = rb_funcall(tNAryClass, rb_intern("cast"), 1, a);                                              \
-    }                                                                                                   \
-    if (!RTEST(nary_check_contiguous(a))) {                                                             \
-      a = nary_dup(a);                                                                                  \
-    }                                                                                                   \
-    if (CLASS_OF(x) != tNAryClass) {                                                                    \
-      x = rb_funcall(tNAryClass, rb_intern("cast"), 1, x);                                              \
-    }                                                                                                   \
-    if (!RTEST(nary_check_contiguous(x))) {                                                             \
-      x = nary_dup(x);                                                                                  \
-    }                                                                                                   \
-    if (!NIL_P(y)) {                                                                                    \
-      if (CLASS_OF(y) != tNAryClass) {                                                                  \
-        y = rb_funcall(tNAryClass, rb_intern("cast"), 1, y);                                            \
-      }                                                                                                 \
-      if (!RTEST(nary_check_contiguous(y))) {                                                           \
-        y = nary_dup(y);                                                                                \
-      }                                                                                                 \
-    }                                                                                                   \
-                                                                                                        \
-    tDType alpha = kw_values[0] != Qundef ? conv_##tDType(kw_values[0]) : one_##tDType();               \
-    tDType beta = kw_values[1] != Qundef ? conv_##tDType(kw_values[1]) : zero_##tDType();               \
-    enum CBLAS_ORDER order = kw_values[2] != Qundef ? get_cblas_order(kw_values[2]) : CblasRowMajor;    \
-    enum CBLAS_TRANSPOSE trans = kw_values[3] != Qundef ? get_cblas_trans(kw_values[3]) : CblasNoTrans; \
-                                                                                                        \
-    narray_t* a_nary = NULL;                                                                            \
-    GetNArray(a, a_nary);                                                                               \
-    narray_t* x_nary = NULL;                                                                            \
-    GetNArray(x, x_nary);                                                                               \
-                                                                                                        \
-    if (NA_NDIM(a_nary) != 2) {                                                                         \
-      rb_raise(rb_eArgError, "a must be 2-dimensional");                                                \
-      return Qnil;                                                                                      \
-    }                                                                                                   \
-    if (NA_NDIM(x_nary) != 1) {                                                                         \
-      rb_raise(rb_eArgError, "x must be 1-dimensional");                                                \
-      return Qnil;                                                                                      \
-    }                                                                                                   \
-    if (NA_SIZE(a_nary) == 0) {                                                                         \
-      rb_raise(rb_eArgError, "a must not be empty");                                                    \
-      return Qnil;                                                                                      \
-    }                                                                                                   \
-    if (NA_SIZE(x_nary) == 0) {                                                                         \
-      rb_raise(rb_eArgError, "x must not be empty");                                                    \
-      return Qnil;                                                                                      \
-    }                                                                                                   \
-                                                                                                        \
-    const blasint ma = (blasint)NA_SHAPE(a_nary)[0];                                                    \
-    const blasint na = (blasint)NA_SHAPE(a_nary)[1];                                                    \
-    const blasint mx = (blasint)NA_SHAPE(x_nary)[0];                                                    \
-    const blasint m = trans == CblasNoTrans ? ma : na;                                                  \
-    const blasint n = trans == CblasNoTrans ? na : ma;                                                  \
-                                                                                                        \
-    if (n != mx) {                                                                                      \
-      rb_raise(nary_eShapeError, "shape1[1](=%d) != shape2[0](=%d)", n, mx);                            \
-      return Qnil;                                                                                      \
-    }                                                                                                   \
-                                                                                                        \
-    struct _gemv_options_##tDType opt = { alpha, beta, order, trans, ma, na };                          \
-    size_t shape_out[1] = { (size_t)(m) };                                                              \
-    ndfunc_arg_out_t aout[1] = { { tNAryClass, 1, shape_out } };                                        \
-    VALUE ret = Qnil;                                                                                   \
-                                                                                                        \
-    if (!NIL_P(y)) {                                                                                    \
-      narray_t* y_nary = NULL;                                                                          \
-      GetNArray(y, y_nary);                                                                             \
-      blasint my = (blasint)NA_SHAPE(y_nary)[0];                                                        \
-      if (m > my) {                                                                                     \
-        rb_raise(nary_eShapeError, "shape3[0](=%d) >= shape1[0]=%d", my, m);                            \
-        return Qnil;                                                                                    \
-      }                                                                                                 \
-      ndfunc_arg_in_t ain[3] = { { tNAryClass, 2 }, { tNAryClass, 1 }, { OVERWRITE, 1 } };              \
-      ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP, 3, 0, ain, aout };                                   \
-      na_ndloop3(&ndf, &opt, 3, a, x, y);                                                               \
-      ret = y;                                                                                          \
-    } else {                                                                                            \
-      y = INT2NUM(0);                                                                                   \
-      ndfunc_arg_in_t ain[3] = { { tNAryClass, 2 }, { tNAryClass, 1 }, { sym_init, 0 } };               \
-      ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP, 3, 1, ain, aout };                                   \
-      ret = na_ndloop3(&ndf, &opt, 3, a, x, y);                                                         \
-    }                                                                                                   \
-                                                                                                        \
-    RB_GC_GUARD(a);                                                                                     \
-    RB_GC_GUARD(x);                                                                                     \
-    RB_GC_GUARD(y);                                                                                     \
-                                                                                                        \
-    return ret;                                                                                         \
+#define DEF_LINALG_FUNC(tDType, tNAryClass, fBlasFunc)                                         \
+  static VALUE _linalg_blas_##fBlasFunc(int argc, VALUE* argv, VALUE self) {                   \
+    VALUE a = Qnil;                                                                            \
+    VALUE x = Qnil;                                                                            \
+    VALUE y = Qnil;                                                                            \
+    VALUE kw_args = Qnil;                                                                      \
+    rb_scan_args(argc, argv, "21:", &a, &x, &y, &kw_args);                                     \
+                                                                                               \
+    ID kw_table[4] = { rb_intern("alpha"), rb_intern("beta"), rb_intern("order"),              \
+                       rb_intern("trans") };                                                   \
+    VALUE kw_values[4] = { Qundef, Qundef, Qundef, Qundef };                                   \
+    rb_get_kwargs(kw_args, kw_table, 0, 4, kw_values);                                         \
+                                                                                               \
+    if (CLASS_OF(a) != tNAryClass) {                                                           \
+      a = rb_funcall(tNAryClass, rb_intern("cast"), 1, a);                                     \
+    }                                                                                          \
+    if (!RTEST(nary_check_contiguous(a))) {                                                    \
+      a = nary_dup(a);                                                                         \
+    }                                                                                          \
+    if (CLASS_OF(x) != tNAryClass) {                                                           \
+      x = rb_funcall(tNAryClass, rb_intern("cast"), 1, x);                                     \
+    }                                                                                          \
+    if (!RTEST(nary_check_contiguous(x))) {                                                    \
+      x = nary_dup(x);                                                                         \
+    }                                                                                          \
+    if (!NIL_P(y)) {                                                                           \
+      if (CLASS_OF(y) != tNAryClass) {                                                         \
+        y = rb_funcall(tNAryClass, rb_intern("cast"), 1, y);                                   \
+      }                                                                                        \
+      if (!RTEST(nary_check_contiguous(y))) {                                                  \
+        y = nary_dup(y);                                                                       \
+      }                                                                                        \
+    }                                                                                          \
+                                                                                               \
+    tDType alpha = kw_values[0] != Qundef ? conv_##tDType(kw_values[0]) : one_##tDType();      \
+    tDType beta = kw_values[1] != Qundef ? conv_##tDType(kw_values[1]) : zero_##tDType();      \
+    enum CBLAS_ORDER order =                                                                   \
+      kw_values[2] != Qundef ? get_cblas_order(kw_values[2]) : CblasRowMajor;                  \
+    enum CBLAS_TRANSPOSE trans =                                                               \
+      kw_values[3] != Qundef ? get_cblas_trans(kw_values[3]) : CblasNoTrans;                   \
+                                                                                               \
+    narray_t* a_nary = NULL;                                                                   \
+    GetNArray(a, a_nary);                                                                      \
+    narray_t* x_nary = NULL;                                                                   \
+    GetNArray(x, x_nary);                                                                      \
+                                                                                               \
+    if (NA_NDIM(a_nary) != 2) {                                                                \
+      rb_raise(rb_eArgError, "a must be 2-dimensional");                                       \
+      return Qnil;                                                                             \
+    }                                                                                          \
+    if (NA_NDIM(x_nary) != 1) {                                                                \
+      rb_raise(rb_eArgError, "x must be 1-dimensional");                                       \
+      return Qnil;                                                                             \
+    }                                                                                          \
+    if (NA_SIZE(a_nary) == 0) {                                                                \
+      rb_raise(rb_eArgError, "a must not be empty");                                           \
+      return Qnil;                                                                             \
+    }                                                                                          \
+    if (NA_SIZE(x_nary) == 0) {                                                                \
+      rb_raise(rb_eArgError, "x must not be empty");                                           \
+      return Qnil;                                                                             \
+    }                                                                                          \
+                                                                                               \
+    const blasint ma = (blasint)NA_SHAPE(a_nary)[0];                                           \
+    const blasint na = (blasint)NA_SHAPE(a_nary)[1];                                           \
+    const blasint mx = (blasint)NA_SHAPE(x_nary)[0];                                           \
+    const blasint m = trans == CblasNoTrans ? ma : na;                                         \
+    const blasint n = trans == CblasNoTrans ? na : ma;                                         \
+                                                                                               \
+    if (n != mx) {                                                                             \
+      rb_raise(nary_eShapeError, "shape1[1](=%d) != shape2[0](=%d)", n, mx);                   \
+      return Qnil;                                                                             \
+    }                                                                                          \
+                                                                                               \
+    struct _gemv_options_##tDType opt = { alpha, beta, order, trans, ma, na };                 \
+    size_t shape_out[1] = { (size_t)(m) };                                                     \
+    ndfunc_arg_out_t aout[1] = { { tNAryClass, 1, shape_out } };                               \
+    VALUE ret = Qnil;                                                                          \
+                                                                                               \
+    if (!NIL_P(y)) {                                                                           \
+      narray_t* y_nary = NULL;                                                                 \
+      GetNArray(y, y_nary);                                                                    \
+      blasint my = (blasint)NA_SHAPE(y_nary)[0];                                               \
+      if (m > my) {                                                                            \
+        rb_raise(nary_eShapeError, "shape3[0](=%d) >= shape1[0]=%d", my, m);                   \
+        return Qnil;                                                                           \
+      }                                                                                        \
+      ndfunc_arg_in_t ain[3] = { { tNAryClass, 2 }, { tNAryClass, 1 }, { OVERWRITE, 1 } };     \
+      ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP, 3, 0, ain, aout };                          \
+      na_ndloop3(&ndf, &opt, 3, a, x, y);                                                      \
+      ret = y;                                                                                 \
+    } else {                                                                                   \
+      y = INT2NUM(0);                                                                          \
+      ndfunc_arg_in_t ain[3] = { { tNAryClass, 2 }, { tNAryClass, 1 }, { sym_init, 0 } };      \
+      ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP, 3, 1, ain, aout };                          \
+      ret = na_ndloop3(&ndf, &opt, 3, a, x, y);                                                \
+    }                                                                                          \
+                                                                                               \
+    RB_GC_GUARD(a);                                                                            \
+    RB_GC_GUARD(x);                                                                            \
+    RB_GC_GUARD(y);                                                                            \
+                                                                                               \
+    return ret;                                                                                \
   }
 DEF_LINALG_OPTIONS(double)
@@ -154,8 +158,8 @@ DEF_LINALG_FUNC(scomplex, numo_cSComplex, cgemv)
 #undef DEF_LINALG_FUNC
 void define_linalg_blas_gemv(VALUE mBlas) {
-  rb_define_module_function(mBlas, "dgemv", RUBY_METHOD_FUNC(_linalg_blas_dgemv), -1);
-  rb_define_module_function(mBlas, "sgemv", RUBY_METHOD_FUNC(_linalg_blas_sgemv), -1);
-  rb_define_module_function(mBlas, "zgemv", RUBY_METHOD_FUNC(_linalg_blas_zgemv), -1);
-  rb_define_module_function(mBlas, "cgemv", RUBY_METHOD_FUNC(_linalg_blas_cgemv), -1);
+  rb_define_module_function(mBlas, "dgemv", _linalg_blas_dgemv, -1);
+  rb_define_module_function(mBlas, "sgemv", _linalg_blas_sgemv, -1);
+  rb_define_module_function(mBlas, "zgemv", _linalg_blas_zgemv, -1);
+  rb_define_module_function(mBlas, "cgemv", _linalg_blas_cgemv, -1);
 }

data/ext/numo/linalg/blas/nrm2.c CHANGED

@@ -1,55 +1,55 @@
 #include "nrm2.h"
-#define DEF_LINALG_FUNC(tDType, tRtDType, tNAryClass, tRtNAryClass, fBlasFunc)    \
-  static void _iter_##fBlasFunc(na_loop_t* const lp) {                            \
-    tDType* x = (tDType*)NDL_PTR(lp, 0);                                          \
-    tRtDType* d = (tRtDType*)NDL_PTR(lp, 1);                                      \
-    const blasint n = (blasint)NDL_SHAPE(lp, 0)[0];                               \
-    tRtDType ret = cblas_##fBlasFunc(n, x, 1);                                    \
-    *d = ret;                                                                     \
-  }                                                                               \
-                                                                                  \
-  static VALUE _linalg_blas_##fBlasFunc(int argc, VALUE* argv, VALUE self) {      \
-    VALUE x = Qnil;                                                               \
-    VALUE kw_args = Qnil;                                                         \
-    rb_scan_args(argc, argv, "1:", &x, &kw_args);                                 \
-                                                                                  \
-    ID kw_table[1] = { rb_intern("keepdims") };                                   \
-    VALUE kw_values[1] = { Qundef };                                              \
-    rb_get_kwargs(kw_args, kw_table, 0, 1, kw_values);                            \
-    const bool keepdims = kw_values[0] != Qundef ? RTEST(kw_values[0]) : false;   \
-                                                                                  \
-    if (CLASS_OF(x) != tNAryClass) {                                              \
-      x = rb_funcall(tNAryClass, rb_intern("cast"), 1, x);                        \
-    }                                                                             \
-    if (!RTEST(nary_check_contiguous(x))) {                                       \
-      x = nary_dup(x);                                                            \
-    }                                                                             \
-                                                                                  \
-    narray_t* x_nary = NULL;                                                      \
-    GetNArray(x, x_nary);                                                         \
-                                                                                  \
-    if (NA_NDIM(x_nary) != 1) {                                                   \
-      rb_raise(rb_eArgError, "x must be 1-dimensional");                          \
-      return Qnil;                                                                \
-    }                                                                             \
-    if (NA_SIZE(x_nary) == 0) {                                                   \
-      rb_raise(rb_eArgError, "x must not be empty");                              \
-      return Qnil;                                                                \
-    }                                                                             \
-                                                                                  \
-    ndfunc_arg_in_t ain[1] = { { tNAryClass, 1 } };                               \
-    size_t shape_out[1] = { 1 };                                                  \
-    ndfunc_arg_out_t aout[1] = { { tRtNAryClass, 0, shape_out } };                \
-    ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP | NDF_EXTRACT, 1, 1, ain, aout }; \
-    if (keepdims) {                                                               \
-      ndf.flag |= NDF_KEEP_DIM;                                                   \
-    }                                                                             \
-                                                                                  \
-    VALUE ret = na_ndloop(&ndf, 1, x);                                            \
-                                                                                  \
-    RB_GC_GUARD(x);                                                               \
-    return ret;                                                                   \
+/*
+ * DEF_LINALG_FUNC expands to the iterator and the Ruby wrapper for one cblas
+ * nrm2 routine.
+ *   tDType / tNAryClass     - element type and Numo class of the input vector
+ *   tRtDType / tRtNAryClass - element type and Numo class of the result
+ *   fBlasFunc               - routine name appended to cblas_ (dnrm2, scnrm2, ...)
+ * The wrapper casts x to tNAryClass, copies it when it is not contiguous, and
+ * raises ArgumentError unless x is 1-dimensional and non-empty. With
+ * keepdims: true the NDF_KEEP_DIM flag is added to the loop definition.
+ */
+#define DEF_LINALG_FUNC(tDType, tRtDType, tNAryClass, tRtNAryClass, fBlasFunc)                 \
+  /* Iterator: stores cblas_<func>(len, vec, 1) for the input vector into the output. */       \
+  static void _iter_##fBlasFunc(na_loop_t* const lp) {                                         \
+    const blasint len = (blasint)NDL_SHAPE(lp, 0)[0];                                          \
+    tDType* vec = (tDType*)NDL_PTR(lp, 0);                                                     \
+    tRtDType* out = (tRtDType*)NDL_PTR(lp, 1);                                                 \
+    *out = cblas_##fBlasFunc(len, vec, 1);                                                     \
+  }                                                                                            \
+                                                                                               \
+  /* Wrapper: fBlasFunc(x, keepdims: false); x must be a non-empty 1-D array. */               \
+  static VALUE _linalg_blas_##fBlasFunc(int argc, VALUE* argv, VALUE self) {                   \
+    VALUE x = Qnil;                                                                            \
+    VALUE opts = Qnil;                                                                         \
+    rb_scan_args(argc, argv, "1:", &x, &opts);                                                 \
+                                                                                               \
+    ID keys[1] = { rb_intern("keepdims") };                                                    \
+    VALUE vals[1] = { Qundef };                                                                \
+    rb_get_kwargs(opts, keys, 0, 1, vals);                                                     \
+    bool keepdims = false;                                                                     \
+    if (vals[0] != Qundef) {                                                                   \
+      keepdims = RTEST(vals[0]);                                                               \
+    }                                                                                          \
+                                                                                               \
+    if (CLASS_OF(x) != tNAryClass) {                                                           \
+      x = rb_funcall(tNAryClass, rb_intern("cast"), 1, x);                                     \
+    }                                                                                          \
+    if (!RTEST(nary_check_contiguous(x))) {                                                    \
+      x = nary_dup(x);                                                                         \
+    }                                                                                          \
+                                                                                               \
+    narray_t* x_na = NULL;                                                                     \
+    GetNArray(x, x_na);                                                                        \
+                                                                                               \
+    if (NA_NDIM(x_na) != 1) {                                                                  \
+      rb_raise(rb_eArgError, "x must be 1-dimensional");                                       \
+      return Qnil;                                                                             \
+    }                                                                                          \
+    if (NA_SIZE(x_na) == 0) {                                                                  \
+      rb_raise(rb_eArgError, "x must not be empty");                                           \
+      return Qnil;                                                                             \
+    }                                                                                          \
+                                                                                               \
+    size_t shape_out[1] = { 1 };                                                               \
+    ndfunc_arg_in_t ain[1] = { { tNAryClass, 1 } };                                            \
+    ndfunc_arg_out_t aout[1] = { { tRtNAryClass, 0, shape_out } };                             \
+    ndfunc_t ndf = { _iter_##fBlasFunc, NO_LOOP | NDF_EXTRACT, 1, 1, ain, aout };              \
+    if (keepdims) {                                                                            \
+      ndf.flag |= NDF_KEEP_DIM;                                                                \
+    }                                                                                          \
+                                                                                               \
+    VALUE norm = na_ndloop(&ndf, 1, x);                                                        \
+                                                                                               \
+    RB_GC_GUARD(x);                                                                            \
+    return norm;                                                                               \
   }
 DEF_LINALG_FUNC(double, double, numo_cDFloat, numo_cDFloat, dnrm2)
@@ -60,8 +60,8 @@ DEF_LINALG_FUNC(scomplex, float, numo_cSComplex, numo_cSFloat, scnrm2)
 #undef DEF_LINALG_FUNC
 void define_linalg_blas_nrm2(VALUE mBlas) {
-  rb_define_module_function(mBlas, "dnrm2", RUBY_METHOD_FUNC(_linalg_blas_dnrm2), -1);
-  rb_define_module_function(mBlas, "snrm2", RUBY_METHOD_FUNC(_linalg_blas_snrm2), -1);
-  rb_define_module_function(mBlas, "dznrm2", RUBY_METHOD_FUNC(_linalg_blas_dznrm2), -1);
-  rb_define_module_function(mBlas, "scnrm2", RUBY_METHOD_FUNC(_linalg_blas_scnrm2), -1);
+  rb_define_module_function(mBlas, "dnrm2", _linalg_blas_dnrm2, -1); /* Registers the nrm2 wrappers as module functions of mBlas; arity -1 matches their (argc, argv, self) signature. dnrm2: numo_cDFloat input, numo_cDFloat result. */
+  rb_define_module_function(mBlas, "snrm2", _linalg_blas_snrm2, -1);
+  rb_define_module_function(mBlas, "dznrm2", _linalg_blas_dznrm2, -1);
+  rb_define_module_function(mBlas, "scnrm2", _linalg_blas_scnrm2, -1); /* scnrm2: numo_cSComplex input, numo_cSFloat result */
 }

data/ext/numo/linalg/lapack/gebal.c ADDED Viewed

@@ -0,0 +1,87 @@
+#include "gebal.h"
+struct _gebal_option { /* Options handed to the gebal iterators through lp->opt_ptr. */
+  int matrix_layout;   /* LAPACK_ROW_MAJOR unless the `order` keyword is given */
+  char job;            /* 'N', 'P', 'S' or 'B'; 'B' when the `job` keyword is omitted */
+};
+/*
+ * Converts the Ruby `job` keyword value to the character handed to LAPACKE xGEBAL.
+ *
+ * val: Ruby object convertible by NUM2CHR.
+ * Returns 'N', 'P', 'S' or 'B' (upper-case only).
+ * Raises ArgumentError for any other character.
+ *
+ * Declared static: the helper is used only by the wrappers in this file and is
+ * not declared in gebal.h, so it should not be exported from the extension
+ * where it could collide with a same-named helper in another source file.
+ */
+static char _get_job(VALUE val) {
+  const char job = NUM2CHR(val);
+  if (job != 'N' && job != 'P' && job != 'S' && job != 'B') {
+    rb_raise(rb_eArgError, "job must be 'N', 'P', 'S', or 'B'");
+  }
+  return job;
+}
+/*
+ * DEF_LINALG_FUNC generates, for one LAPACK xGEBAL routine, the narray iterator
+ * (_iter_<func>) and the Ruby-visible wrapper (_linalg_lapack_<func>).
+ *
+ *   tDType / tNAryClass     - C element type and Numo class of the matrix a
+ *   tRtDType / tRtNAryClass - C element type and Numo class of the scale vector
+ *   fLapackFunc             - LAPACKE routine suffix (dgebal, sgebal, zgebal, cgebal)
+ *
+ * Wrapper contract: takes one array plus optional `order:` and `job:` keywords
+ * (defaults: LAPACK_ROW_MAJOR and 'B'). The argument is cast to tNAryClass and
+ * copied if it is not contiguous; the resulting array is passed as OVERWRITE
+ * and returned first in the result, followed by ilo, ihi, scale and info.
+ * Raises ArgumentError when a is not 2-dimensional or not square.
+ */
+#define DEF_LINALG_FUNC(tDType, tRtDType, tNAryClass, tRtNAryClass, fLapackFunc)               \
+  /* Iterator: balances the matrix in place, then stores ilo, ihi, scale and info. */          \
+  static void _iter_##fLapackFunc(na_loop_t* const lp) {                                       \
+    tDType* a = (tDType*)NDL_PTR(lp, 0);                                                       \
+    int* ilo = (int*)NDL_PTR(lp, 1);                                                           \
+    int* ihi = (int*)NDL_PTR(lp, 2);                                                           \
+    tRtDType* scale = (tRtDType*)NDL_PTR(lp, 3);                                               \
+    int* info = (int*)NDL_PTR(lp, 4);                                                          \
+    struct _gebal_option* opt = (struct _gebal_option*)(lp->opt_ptr);                          \
+    const lapack_int n =                                                                       \
+      (lapack_int)(opt->matrix_layout == LAPACK_ROW_MAJOR ? NDL_SHAPE(lp, 0)[0]                \
+                                                          : NDL_SHAPE(lp, 0)[1]);              \
+    const lapack_int lda = n;                                                                  \
+    /* LAPACKE writes lapack_int values; temporaries keep the int outputs correct */           \
+    /* even when lapack_int is wider than int (ILP64 builds). */                               \
+    lapack_int ilo_out = 0;                                                                    \
+    lapack_int ihi_out = 0;                                                                    \
+    const lapack_int i = LAPACKE_##fLapackFunc(opt->matrix_layout, opt->job, n, a, lda,        \
+                                               &ilo_out, &ihi_out, scale);                     \
+    *ilo = (int)ilo_out;                                                                       \
+    *ihi = (int)ihi_out;                                                                       \
+    *info = (int)i;                                                                            \
+  }                                                                                            \
+                                                                                               \
+  /* Ruby entry point: validates a, runs the iterator, returns [a, ilo, ihi, scale, info]. */  \
+  static VALUE _linalg_lapack_##fLapackFunc(int argc, VALUE* argv, VALUE self) {               \
+    VALUE a_vnary = Qnil;                                                                      \
+    VALUE kw_args = Qnil;                                                                      \
+    rb_scan_args(argc, argv, "1:", &a_vnary, &kw_args);                                        \
+    ID kw_table[2] = { rb_intern("order"), rb_intern("job") };                                 \
+    VALUE kw_values[2] = { Qundef, Qundef };                                                   \
+    rb_get_kwargs(kw_args, kw_table, 0, 2, kw_values);                                         \
+    const int matrix_layout =                                                                  \
+      kw_values[0] != Qundef ? get_matrix_layout(kw_values[0]) : LAPACK_ROW_MAJOR;             \
+    const char job = kw_values[1] != Qundef ? _get_job(kw_values[1]) : 'B';                    \
+                                                                                               \
+    if (CLASS_OF(a_vnary) != tNAryClass) {                                                     \
+      a_vnary = rb_funcall(tNAryClass, rb_intern("cast"), 1, a_vnary);                         \
+    }                                                                                          \
+    if (!RTEST(nary_check_contiguous(a_vnary))) {                                              \
+      a_vnary = nary_dup(a_vnary);                                                             \
+    }                                                                                          \
+                                                                                               \
+    narray_t* a_nary = NULL;                                                                   \
+    GetNArray(a_vnary, a_nary);                                                                \
+    const int n_dims = NA_NDIM(a_nary);                                                        \
+    if (n_dims != 2) {                                                                         \
+      rb_raise(rb_eArgError, "input array a must be 2-dimensional");                           \
+      return Qnil;                                                                             \
+    }                                                                                          \
+    /* xGEBAL balances n-by-n matrices only. With lda = n, a non-square input would */         \
+    /* be mis-strided or make LAPACKE access memory beyond the array buffer. */                \
+    if (NA_SHAPE(a_nary)[0] != NA_SHAPE(a_nary)[1]) {                                          \
+      rb_raise(rb_eArgError, "input array a must be square");                                  \
+      return Qnil;                                                                             \
+    }                                                                                          \
+                                                                                               \
+    const size_t n = NA_SHAPE(a_nary)[0];                                                      \
+    size_t shape_scale[1] = { n };                                                             \
+    ndfunc_arg_in_t ain[1] = { { OVERWRITE, 2 } };                                             \
+    ndfunc_arg_out_t aout[4] = { { numo_cInt32, 0 },                                           \
+                                 { numo_cInt32, 0 },                                           \
+                                 { tRtNAryClass, 1, shape_scale },                             \
+                                 { numo_cInt32, 0 } };                                         \
+    ndfunc_t ndf = { _iter_##fLapackFunc, NO_LOOP | NDF_EXTRACT, 1, 4, ain, aout };            \
+    struct _gebal_option opt = { matrix_layout, job };                                         \
+    VALUE res = na_ndloop3(&ndf, &opt, 1, a_vnary);                                            \
+    VALUE ret = rb_ary_concat(rb_ary_new3(1, a_vnary), res);                                   \
+                                                                                               \
+    RB_GC_GUARD(a_vnary);                                                                      \
+    return ret;                                                                                \
+  }
+DEF_LINALG_FUNC(double, double, numo_cDFloat, numo_cDFloat, dgebal)
+DEF_LINALG_FUNC(float, float, numo_cSFloat, numo_cSFloat, sgebal)
+DEF_LINALG_FUNC(lapack_complex_double, double, numo_cDComplex, numo_cDFloat, zgebal)
+DEF_LINALG_FUNC(lapack_complex_float, float, numo_cSComplex, numo_cSFloat, cgebal)
+#undef DEF_LINALG_FUNC
+void define_linalg_lapack_gebal(VALUE mLapack) {
+  rb_define_module_function(mLapack, "dgebal", _linalg_lapack_dgebal, -1);
+  rb_define_module_function(mLapack, "sgebal", _linalg_lapack_sgebal, -1);
+  rb_define_module_function(mLapack, "zgebal", _linalg_lapack_zgebal, -1);
+  rb_define_module_function(mLapack, "cgebal", _linalg_lapack_cgebal, -1);
+}

data/ext/numo/linalg/lapack/gebal.h ADDED Viewed

@@ -0,0 +1,15 @@
+#ifndef NUMO_LINALG_ALT_LAPACK_GEBAL_H
+#define NUMO_LINALG_ALT_LAPACK_GEBAL_H 1
+#include <lapacke.h>
+#include <ruby.h>
+#include <numo/narray.h>
+#include <numo/template.h>
+#include "../util.h"
+void define_linalg_lapack_gebal(VALUE mLapack); /* Registers dgebal, sgebal, zgebal and cgebal as module functions of mLapack. */
+#endif /* NUMO_LINALG_ALT_LAPACK_GEBAL_H */