RubyGems - tomoto - Versions diffs - 0.1.3 → 0.1.4 - Mend

tomoto 0.1.3 → 0.1.4

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (50)

checksums.yaml +4 -4
data/CHANGELOG.md +6 -0
data/LICENSE.txt +1 -1
data/README.md +7 -0
data/ext/tomoto/ct.cpp +54 -0
data/ext/tomoto/dmr.cpp +62 -0
data/ext/tomoto/dt.cpp +82 -0
data/ext/tomoto/ext.cpp +27 -773
data/ext/tomoto/gdmr.cpp +34 -0
data/ext/tomoto/hdp.cpp +42 -0
data/ext/tomoto/hlda.cpp +66 -0
data/ext/tomoto/hpa.cpp +27 -0
data/ext/tomoto/lda.cpp +250 -0
data/ext/tomoto/llda.cpp +29 -0
data/ext/tomoto/mglda.cpp +71 -0
data/ext/tomoto/pa.cpp +27 -0
data/ext/tomoto/plda.cpp +29 -0
data/ext/tomoto/slda.cpp +40 -0
data/ext/tomoto/utils.h +84 -0
data/lib/tomoto/tomoto.bundle +0 -0
data/lib/tomoto/tomoto.so +0 -0
data/lib/tomoto/version.rb +1 -1
data/vendor/tomotopy/README.kr.rst +12 -3
data/vendor/tomotopy/README.rst +12 -3
data/vendor/tomotopy/src/Labeling/FoRelevance.cpp +47 -2
data/vendor/tomotopy/src/Labeling/FoRelevance.h +21 -151
data/vendor/tomotopy/src/Labeling/Labeler.h +5 -3
data/vendor/tomotopy/src/Labeling/Phraser.hpp +518 -0
data/vendor/tomotopy/src/TopicModel/CTModel.hpp +6 -3
data/vendor/tomotopy/src/TopicModel/DT.h +1 -1
data/vendor/tomotopy/src/TopicModel/DTModel.hpp +8 -23
data/vendor/tomotopy/src/TopicModel/HDPModel.hpp +9 -18
data/vendor/tomotopy/src/TopicModel/HLDAModel.hpp +56 -58
data/vendor/tomotopy/src/TopicModel/HPAModel.hpp +4 -14
data/vendor/tomotopy/src/TopicModel/LDA.h +69 -17
data/vendor/tomotopy/src/TopicModel/LDACVB0Model.hpp +1 -1
data/vendor/tomotopy/src/TopicModel/LDAModel.hpp +108 -61
data/vendor/tomotopy/src/TopicModel/MGLDAModel.hpp +7 -8
data/vendor/tomotopy/src/TopicModel/PAModel.hpp +26 -16
data/vendor/tomotopy/src/TopicModel/PT.h +27 -0
data/vendor/tomotopy/src/TopicModel/PTModel.cpp +10 -0
data/vendor/tomotopy/src/TopicModel/PTModel.hpp +273 -0
data/vendor/tomotopy/src/TopicModel/TopicModel.hpp +16 -11
data/vendor/tomotopy/src/Utils/MultiNormalDistribution.hpp +3 -2
data/vendor/tomotopy/src/Utils/Trie.hpp +39 -8
data/vendor/tomotopy/src/Utils/TruncMultiNormal.hpp +36 -38
data/vendor/tomotopy/src/Utils/Utils.hpp +50 -45
data/vendor/tomotopy/src/Utils/math.h +8 -4
data/vendor/tomotopy/src/Utils/tvector.hpp +4 -0
metadata +24 -60

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 370ff6a569a6e476137cda0db349cf1b22ff0e7d54b0df67500ffbbe46846a86
-  data.tar.gz: 8df2fb740a85f8a51485e992dfacd6bef4d3c185d8d08369c72d93b9bb412f6d
+  metadata.gz: b1cb95a96851ccd3d499ed38c9da531ce48588cf44c37ccc92bbfdc9277e0962
+  data.tar.gz: cadee081b1f0ea9cc37b75afd97e8ecebb32796cc335da2ff50e844c955a0e4a
 SHA512:
-  metadata.gz: 17abc53d6923a1fb24bfd040967944884cd7e1595ff4fb82c7af46a4bfae858875b2819b7e05fd2ff92e7fe17eec1350c551aa98bf88eedb344cde00a780f32a
-  data.tar.gz: 8f504f89679cf072fee04ac5b0319e164a509d140e65dd6f1c77e6fc9ecef252ce4ece0ac80087d0d69ddccf2a5b002910db58bb5212c4c2c7fa5d206b60d422
+  metadata.gz: f5154bfb71c0b8891953b97c8edf37a7fb70fcb2ab09c3f51126e14262c729dcdc4b82d2727a8601131e090a05efcd1958851d77b5e8e95b922fc9b1f44cedf6
+  data.tar.gz: f975f505493d41bc425e0d288762e97c83ffdb6c1812792bc2dca517c550f1508efef79a24bdde992d7acd3994d6566c27745b9bed806ea64dfa072d22c692a0

data/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,9 @@
+## 0.1.4 (2021-03-14)
+- Added `docs` method
+- Updated tomoto to 0.10.2
+- Updated `add_doc` to return the index of the document
 ## 0.1.3 (2020-12-19)
 - Updated tomoto to 0.10.0

data/LICENSE.txt CHANGED Viewed

@@ -1,7 +1,7 @@
 MIT License
 Copyright (c) 2019, bab2min
-Copyright (c) 2020 Andrew Kane
+Copyright (c) 2020-2021 Andrew Kane
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

data/README.md CHANGED Viewed

@@ -50,6 +50,13 @@ Load the model from a file
 model = Tomoto::LDA.load("model.bin")
 ```
+Get topic probabilities for a document
+```ruby
+doc = model.docs[0]
+doc.topics
+```
 Get the number of words for each topic
 ```ruby

data/ext/tomoto/ct.cpp ADDED Viewed

@@ -0,0 +1,54 @@
+#include <CT.h>
+#include <rice/Module.hpp>
+#include "utils.h"
+void init_ct(Rice::Module& m) {
+  Rice::define_class_under<tomoto::ICTModel, tomoto::ILDAModel>(m, "CT")
+    .define_singleton_method(
+      "_new",
+      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, int seed) {
+        if (seed < 0) {
+          seed = std::random_device{}();
+        }
+        return tomoto::ICTModel::create((tomoto::TermWeight)tw, k, alpha, eta, seed);
+      })
+    .define_method(
+      "_correlations",
+      *[](tomoto::ICTModel& self, tomoto::Tid topic_id) {
+        return self.getCorrelationTopic(topic_id);
+      })
+    .define_method(
+      "num_beta_sample",
+      *[](tomoto::ICTModel& self) {
+        return self.getNumBetaSample();
+      })
+    .define_method(
+      "num_beta_sample=",
+      *[](tomoto::ICTModel& self, size_t value) {
+        self.setNumBetaSample(value);
+        return value;
+      })
+    .define_method(
+      "num_tmn_sample",
+      *[](tomoto::ICTModel& self) {
+        return self.getNumTMNSample();
+      })
+    .define_method(
+      "num_tmn_sample=",
+      *[](tomoto::ICTModel& self, size_t value) {
+        self.setNumTMNSample(value);
+        return value;
+      })
+    .define_method(
+      "_prior_cov",
+      *[](tomoto::ICTModel& self) {
+        return self.getPriorCov();
+      })
+    .define_method(
+      "prior_mean",
+      *[](tomoto::ICTModel& self) {
+        return self.getPriorMean();
+      });
+}

data/ext/tomoto/dmr.cpp ADDED Viewed

@@ -0,0 +1,62 @@
+#include <DMR.h>
+#include <rice/Class.hpp>
+#include <rice/Module.hpp>
+#include "utils.h"
+void init_dmr(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IDMRModel, tomoto::ILDAModel>(m, "DMR")
+    .define_singleton_method(
+      "_new",
+      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float sigma, tomoto::Float eta, tomoto::Float alpha_epsilon, int seed) {
+        if (seed < 0) {
+          seed = std::random_device{}();
+        }
+        return tomoto::IDMRModel::create((tomoto::TermWeight)tw, k, alpha, sigma, eta, alpha_epsilon, seed);
+      })
+    .define_method(
+      "_add_doc",
+      *[](tomoto::IDMRModel& self, std::vector<std::string> words, std::string metadata) {
+        auto doc = buildDoc(words);
+        doc.misc["metadata"] = metadata;
+        return self.addDoc(doc);
+      })
+    .define_method(
+      "alpha_epsilon",
+      *[](tomoto::IDMRModel& self) {
+        return self.getAlphaEps();
+      })
+    .define_method(
+      "alpha_epsilon=",
+      *[](tomoto::IDMRModel& self, tomoto::Float value) {
+        self.setAlphaEps(value);
+        return value;
+      })
+    .define_method(
+      "f",
+      *[](tomoto::IDMRModel& self) {
+        return self.getF();
+      })
+    .define_method(
+      "_lambdas",
+      *[](tomoto::IDMRModel& self, tomoto::Tid topic_id) {
+        return self.getLambdaByTopic(topic_id);
+      })
+    .define_method(
+      "metadata_dict",
+      *[](tomoto::IDMRModel& self) {
+        auto dict = self.getMetadataDict();
+        Array res;
+        auto utf8 = Rice::Class(rb_cEncoding).call("const_get", "UTF_8");
+        for (size_t i = 0; i < dict.size(); i++) {
+          res.push(to_ruby<std::string>(dict.toWord(i)).call("force_encoding", utf8));
+        }
+        return res;
+      })
+    .define_method(
+      "sigma",
+      *[](tomoto::IDMRModel& self) {
+        return self.getSigma();
+      });
+}

data/ext/tomoto/dt.cpp ADDED Viewed

@@ -0,0 +1,82 @@
+#include <DT.h>
+#include <rice/Module.hpp>
+#include "utils.h"
+void init_dt(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IDTModel, tomoto::ILDAModel>(m, "DT")
+    .define_singleton_method(
+      "_new",
+      *[](size_t tw, size_t k, size_t t, tomoto::Float alphaVar, tomoto::Float etaVar, tomoto::Float phiVar, tomoto::Float shapeA, tomoto::Float shapeB, tomoto::Float shapeC) {
+        // Rice only supports 10 arguments
+        int seed = -1;
+        if (seed < 0) {
+          seed = std::random_device{}();
+        }
+        return tomoto::IDTModel::create((tomoto::TermWeight)tw, k, t, alphaVar, etaVar, phiVar, shapeA, shapeB, shapeC, 0, seed);
+      })
+    .define_method(
+      "_add_doc",
+      *[](tomoto::IDTModel& self, std::vector<std::string> words, uint32_t timepoint) {
+        auto doc = buildDoc(words);
+        doc.misc["timepoint"] = timepoint;
+        return self.addDoc(doc);
+      })
+    .define_method(
+      "alpha",
+      *[](tomoto::IDTModel& self) {
+        Array res;
+        for (size_t i = 0; i < self.getK(); i++) {
+          Array res2;
+          for (size_t j = 0; j < self.getT(); j++) {
+            res2.push(self.getAlpha(i, j));
+          }
+          res.push(res2);
+        }
+        return res;
+      })
+    .define_method(
+      "lr_a",
+      *[](tomoto::IDTModel& self) {
+        return self.getShapeA();
+      })
+    .define_method(
+      "lr_a=",
+      *[](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeA(value);
+        return value;
+      })
+    .define_method(
+      "lr_b",
+      *[](tomoto::IDTModel& self) {
+        return self.getShapeB();
+      })
+    .define_method(
+      "lr_b=",
+      *[](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeB(value);
+        return value;
+      })
+    .define_method(
+      "lr_c",
+      *[](tomoto::IDTModel& self) {
+        return self.getShapeC();
+      })
+    .define_method(
+      "lr_c=",
+      *[](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeC(value);
+        return value;
+      })
+    .define_method(
+      "num_docs_by_timepoint",
+      *[](tomoto::IDTModel& self) {
+        return self.getNumDocsByT();
+      })
+    .define_method(
+      "num_timepoints",
+      *[](tomoto::IDTModel& self) {
+        return self.getT();
+      });
+}

data/ext/tomoto/ext.cpp CHANGED Viewed

@@ -1,111 +1,23 @@
-// stdlib
-#include <fstream>
-#include <iostream>
-// tomoto
-#include <CT.h>
-#include <DMR.h>
-#include <DT.h>
-#include <GDMR.h>
-#include <HDP.h>
-#include <HLDA.h>
-#include <HPA.h>
-#include <LDA.h>
-#include <LLDA.h>
-#include <MGLDA.h>
-#include <PA.h>
-#include <PLDA.h>
-#include <SLDA.h>
-// rice
-#include <rice/Array.hpp>
-#include <rice/Hash.hpp>
 #include <rice/Module.hpp>
-using Rice::Array;
-using Rice::Class;
-using Rice::Hash;
-using Rice::Module;
-using Rice::Object;
-using Rice::define_class_under;
-using Rice::define_module;
-template<>
-Object to_ruby<std::vector<tomoto::Float>>(std::vector<tomoto::Float> const & x)
-{
-  Array res;
-  for (auto const& v : x) {
-    res.push(v);
-  }
-  return res;
-}
-template<>
-Object to_ruby<std::vector<uint32_t>>(std::vector<uint32_t> const & x)
-{
-  Array res;
-  for (auto const& v : x) {
-    res.push(v);
-  }
-  return res;
-}
-template<>
-Object to_ruby<std::vector<uint64_t>>(std::vector<uint64_t> const & x)
-{
-  Array res;
-  for (auto const& v : x) {
-    res.push(v);
-  }
-  return res;
-}
-template<>
-std::vector<std::string> from_ruby<std::vector<std::string>>(Object x)
-{
-  Array a = Array(x);
-  std::vector<std::string> res;
-  res.reserve(a.size());
-  for (auto const& v : a) {
-    res.push_back(from_ruby<std::string>(v));
-  }
-  return res;
-}
-template<>
-std::vector<tomoto::Float> from_ruby<std::vector<tomoto::Float>>(Object x)
-{
-  Array a = Array(x);
-  std::vector<tomoto::Float> res;
-  res.reserve(a.size());
-  for (auto const& v : a) {
-    res.push_back(from_ruby<tomoto::Float>(v));
-  }
-  return res;
-}
-template<>
-std::vector<uint64_t> from_ruby<std::vector<uint64_t>>(Object x)
-{
-  Array a = Array(x);
-  std::vector<uint64_t> res;
-  res.reserve(a.size());
-  for (auto const& v : a) {
-    res.push_back(from_ruby<uint64_t>(v));
-  }
-  return res;
-}
-tomoto::RawDoc buildDoc(std::vector<std::string>& words) {
-  tomoto::RawDoc doc;
-  doc.rawWords = words;
-  return doc;
-}
+void init_lda(Rice::Module& m);
+void init_ct(Rice::Module& m);
+void init_dmr(Rice::Module& m);
+void init_dt(Rice::Module& m);
+void init_gdmr(Rice::Module& m);
+void init_hdp(Rice::Module& m);
+void init_hlda(Rice::Module& m);
+void init_pa(Rice::Module& m);
+void init_hpa(Rice::Module& m);
+void init_mglda(Rice::Module& m);
+void init_llda(Rice::Module& m);
+void init_plda(Rice::Module& m);
+void init_slda(Rice::Module& m);
 extern "C"
 void Init_ext()
 {
-  Module rb_mTomoto = define_module("Tomoto")
+  auto m = Rice::define_module("Tomoto")
     .define_singleton_method(
       "isa",
       *[]() {
@@ -120,675 +32,17 @@ void Init_ext()
         #endif
       });
-  Class rb_cLDA = define_class_under<tomoto::ILDAModel>(rb_mTomoto, "LDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::ILDAModel::create((tomoto::TermWeight)tw, k, alpha, eta, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::ILDAModel& self, std::vector<std::string> words) {
-        self.addDoc(buildDoc(words));
-      })
-    .define_method(
-      "alpha",
-      *[](tomoto::ILDAModel& self) {
-        Array res;
-        for (size_t i = 0; i < self.getK(); i++) {
-          res.push(self.getAlpha(i));
-        }
-        return res;
-      })
-    .define_method(
-      "burn_in",
-      *[](tomoto::ILDAModel& self) {
-        return self.getBurnInIteration();
-      })
-    .define_method(
-      "burn_in=",
-      *[](tomoto::ILDAModel& self, size_t iteration) {
-        self.setBurnInIteration(iteration);
-        return iteration;
-      })
-    .define_method(
-      "_count_by_topics",
-      *[](tomoto::ILDAModel& self) {
-        Array res;
-        for (auto const& v : self.getCountByTopic()) {
-          res.push(v);
-        }
-        return res;
-      })
-    .define_method(
-      "eta",
-      *[](tomoto::ILDAModel& self) {
-        return self.getEta();
-      })
-    .define_method(
-      "global_step",
-      *[](tomoto::ILDAModel& self) {
-        return self.getGlobalStep();
-      })
-    .define_method(
-      "k",
-      *[](tomoto::ILDAModel& self) {
-        return self.getK();
-      })
-    .define_method(
-      "_load",
-      *[](tomoto::ILDAModel& self, const char* filename) {
-        std::ifstream str{ filename, std::ios_base::binary };
-        if (!str) throw std::runtime_error{ std::string("cannot open file '") + filename + std::string("'") };
-        std::vector<uint8_t> extra_data;
-        self.loadModel(str, &extra_data);
-      })
-    .define_method(
-      "ll_per_word",
-      *[](tomoto::ILDAModel& self) {
-        return self.getLLPerWord();
-      })
-    .define_method(
-      "num_docs",
-      *[](tomoto::ILDAModel& self) {
-        return self.getNumDocs();
-      })
-    .define_method(
-      "num_vocabs",
-      *[](tomoto::ILDAModel& self) {
-        return self.getV();
-      })
-    .define_method(
-      "num_words",
-      *[](tomoto::ILDAModel& self) {
-        return self.getN();
-      })
-    .define_method(
-      "optim_interval",
-      *[](tomoto::ILDAModel& self) {
-        return self.getOptimInterval();
-      })
-    .define_method(
-      "optim_interval=",
-      *[](tomoto::ILDAModel& self, size_t value) {
-        self.setOptimInterval(value);
-        return value;
-      })
-    .define_method(
-      "perplexity",
-      *[](tomoto::ILDAModel& self) {
-        return self.getPerplexity();
-      })
-    .define_method(
-      "_prepare",
-      *[](tomoto::ILDAModel& self, size_t minCnt, size_t minDf, size_t rmTop) {
-        self.prepare(true, minCnt, minDf, rmTop);
-      })
-    .define_method(
-      "_removed_top_words",
-      *[](tomoto::ILDAModel& self, size_t rmTop) {
-        Array res;
-        auto dict = self.getVocabDict();
-        size_t size = dict.size();
-        for (size_t i = rmTop; i > 0; i--) {
-          res.push(dict.toWord(size - i));
-        }
-        return res;
-      })
-    .define_method(
-      "_save",
-      *[](tomoto::ILDAModel& self, const char* filename, bool full) {
-        std::ofstream str{ filename, std::ios_base::binary };
-        std::vector<uint8_t> extra_data;
-        self.saveModel(str, full, &extra_data);
-      })
-    .define_method(
-      "_topic_words",
-      *[](tomoto::ILDAModel& self, size_t topicId, size_t topN) {
-        Hash res;
-        for (auto const& v : self.getWordsByTopicSorted(topicId, topN)) {
-          res[v.first] = v.second;
-        }
-        return res;
-      })
-    .define_method(
-      "_train",
-      *[](tomoto::ILDAModel& self, size_t iteration, size_t workers, size_t ps) {
-        self.train(iteration, workers, (tomoto::ParallelScheme)ps);
-      })
-    .define_method(
-      "_tw",
-      *[](tomoto::ILDAModel& self) {
-        return (int)self.getTermWeight();
-      })
-    .define_method(
-      "used_vocab_df",
-      *[](tomoto::ILDAModel& self) {
-        auto vocab = self.getVocabDf();
-        Array res;
-        for (size_t i = 0; i < self.getV(); i++) {
-          res.push(vocab[i]);
-        }
-        return res;
-      })
-    .define_method(
-      "used_vocab_freq",
-      *[](tomoto::ILDAModel& self) {
-        auto vocab = self.getVocabCf();
-        Array res;
-        for (size_t i = 0; i < self.getV(); i++) {
-          res.push(vocab[i]);
-        }
-        return res;
-      })
-    .define_method(
-      "used_vocabs",
-      *[](tomoto::ILDAModel& self) {
-        auto dict = self.getVocabDict();
-        Array res;
-        auto utf8 = Class(rb_cEncoding).call("const_get", "UTF_8");
-        for (size_t i = 0; i < self.getV(); i++) {
-          res.push(to_ruby<std::string>(dict.toWord(i)).call("force_encoding", utf8));
-        }
-        return res;
-      })
-    .define_method(
-      "vocab_df",
-      *[](tomoto::ILDAModel& self) {
-        auto vocab = self.getVocabDf();
-        Array res;
-        for (size_t i = 0; i < vocab.size(); i++) {
-          res.push(vocab[i]);
-        }
-        return res;
-      })
-    .define_method(
-      "vocab_freq",
-      *[](tomoto::ILDAModel& self) {
-        auto vocab = self.getVocabCf();
-        Array res;
-        for (size_t i = 0; i < vocab.size(); i++) {
-          res.push(vocab[i]);
-        }
-        return res;
-      })
-    .define_method(
-      "vocabs",
-      *[](tomoto::ILDAModel& self) {
-        auto dict = self.getVocabDict();
-        Array res;
-        auto utf8 = Class(rb_cEncoding).call("const_get", "UTF_8");
-        for (size_t i = 0; i < dict.size(); i++) {
-          res.push(to_ruby<std::string>(dict.toWord(i)).call("force_encoding", utf8));
-        }
-        return res;
-      });
-  Class rb_cCT = define_class_under<tomoto::ICTModel, tomoto::ILDAModel>(rb_mTomoto, "CT")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::ICTModel::create((tomoto::TermWeight)tw, k, alpha, eta, seed);
-      })
-    .define_method(
-      "_correlations",
-      *[](tomoto::ICTModel& self, tomoto::Tid topic_id) {
-        return self.getCorrelationTopic(topic_id);
-      })
-    .define_method(
-      "num_beta_sample",
-      *[](tomoto::ICTModel& self) {
-        return self.getNumBetaSample();
-      })
-    .define_method(
-      "num_beta_sample=",
-      *[](tomoto::ICTModel& self, size_t value) {
-        self.setNumBetaSample(value);
-        return value;
-      })
-    .define_method(
-      "num_tmn_sample",
-      *[](tomoto::ICTModel& self) {
-        return self.getNumTMNSample();
-      })
-    .define_method(
-      "num_tmn_sample=",
-      *[](tomoto::ICTModel& self, size_t value) {
-        self.setNumTMNSample(value);
-        return value;
-      })
-    .define_method(
-      "_prior_cov",
-      *[](tomoto::ICTModel& self) {
-        return self.getPriorCov();
-      })
-    .define_method(
-      "prior_mean",
-      *[](tomoto::ICTModel& self) {
-        return self.getPriorMean();
-      });
-  Class rb_cDMR = define_class_under<tomoto::IDMRModel, tomoto::ILDAModel>(rb_mTomoto, "DMR")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float sigma, tomoto::Float eta, tomoto::Float alpha_epsilon, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IDMRModel::create((tomoto::TermWeight)tw, k, alpha, sigma, eta, alpha_epsilon, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::IDMRModel& self, std::vector<std::string> words, std::string metadata) {
-        auto doc = buildDoc(words);
-        doc.misc["metadata"] = metadata;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "alpha_epsilon",
-      *[](tomoto::IDMRModel& self) {
-        return self.getAlphaEps();
-      })
-    .define_method(
-      "alpha_epsilon=",
-      *[](tomoto::IDMRModel& self, tomoto::Float value) {
-        self.setAlphaEps(value);
-        return value;
-      })
-    .define_method(
-      "f",
-      *[](tomoto::IDMRModel& self) {
-        return self.getF();
-      })
-    .define_method(
-      "_lambdas",
-      *[](tomoto::IDMRModel& self, tomoto::Tid topic_id) {
-        return self.getLambdaByTopic(topic_id);
-      })
-    .define_method(
-      "metadata_dict",
-      *[](tomoto::IDMRModel& self) {
-        auto dict = self.getMetadataDict();
-        Array res;
-        auto utf8 = Class(rb_cEncoding).call("const_get", "UTF_8");
-        for (size_t i = 0; i < dict.size(); i++) {
-          res.push(to_ruby<std::string>(dict.toWord(i)).call("force_encoding", utf8));
-        }
-        return res;
-      })
-    .define_method(
-      "sigma",
-      *[](tomoto::IDMRModel& self) {
-        return self.getSigma();
-      });
-  Class rb_cDT = define_class_under<tomoto::IDTModel, tomoto::ILDAModel>(rb_mTomoto, "DT")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, size_t t, tomoto::Float alphaVar, tomoto::Float etaVar, tomoto::Float phiVar, tomoto::Float shapeA, tomoto::Float shapeB, tomoto::Float shapeC) {
-        // Rice only supports 10 arguments
-        int seed = -1;
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IDTModel::create((tomoto::TermWeight)tw, k, t, alphaVar, etaVar, phiVar, shapeA, shapeB, shapeC, 0, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::IDTModel& self, std::vector<std::string> words, uint32_t timepoint) {
-        auto doc = buildDoc(words);
-        doc.misc["timepoint"] = timepoint;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "lr_a",
-      *[](tomoto::IDTModel& self) {
-        return self.getShapeA();
-      })
-    .define_method(
-      "lr_a=",
-      *[](tomoto::IDTModel& self, tomoto::Float value) {
-        self.setShapeA(value);
-        return value;
-      })
-    .define_method(
-      "lr_b",
-      *[](tomoto::IDTModel& self) {
-        return self.getShapeB();
-      })
-    .define_method(
-      "lr_b=",
-      *[](tomoto::IDTModel& self, tomoto::Float value) {
-        self.setShapeB(value);
-        return value;
-      })
-    .define_method(
-      "lr_c",
-      *[](tomoto::IDTModel& self) {
-        return self.getShapeC();
-      })
-    .define_method(
-      "lr_c=",
-      *[](tomoto::IDTModel& self, tomoto::Float value) {
-        self.setShapeC(value);
-        return value;
-      })
-    .define_method(
-      "num_docs_by_timepoint",
-      *[](tomoto::IDTModel& self) {
-        return self.getNumDocsByT();
-      })
-    .define_method(
-      "num_timepoints",
-      *[](tomoto::IDTModel& self) {
-        return self.getT();
-      });
-  Class rb_cGDMR = define_class_under<tomoto::IGDMRModel, tomoto::IDMRModel>(rb_mTomoto, "GDMR")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, std::vector<uint64_t> degrees, tomoto::Float alpha, tomoto::Float sigma, tomoto::Float sigma0, tomoto::Float eta, tomoto::Float alpha_epsilon, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IGDMRModel::create((tomoto::TermWeight)tw, k, degrees, alpha, sigma, sigma0, eta, alpha_epsilon, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::IDMRModel& self, std::vector<std::string> words, std::vector<tomoto::Float> metadata) {
-        auto doc = buildDoc(words);
-        doc.misc["metadata"] = metadata;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "degrees",
-      *[](tomoto::IGDMRModel& self) {
-        return self.getFs();
-      })
-    .define_method(
-      "sigma0",
-      *[](tomoto::IGDMRModel& self) {
-        return self.getSigma0();
-      });
-  Class rb_cHDP = define_class_under<tomoto::IHDPModel, tomoto::ILDAModel>(rb_mTomoto, "HDP")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, tomoto::Float gamma, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IHDPModel::create((tomoto::TermWeight)tw, k, alpha, eta, gamma, seed);
-      })
-    .define_method(
-      "alpha",
-      *[](tomoto::IHDPModel& self) {
-        return self.getAlpha();
-      })
-    .define_method(
-      "gamma",
-      *[](tomoto::IHDPModel& self) {
-        return self.getGamma();
-      })
-    .define_method(
-      "live_k",
-      *[](tomoto::IHDPModel& self) {
-        return self.getLiveK();
-      })
-    .define_method(
-      "live_topic?",
-      *[](tomoto::IHDPModel& self, size_t tid) {
-        return self.isLiveTopic(tid);
-      })
-    .define_method(
-      "num_tables",
-      *[](tomoto::IHDPModel& self) {
-        return self.getTotalTables();
-      });
-  Class rb_cHLDA = define_class_under<tomoto::IHLDAModel, tomoto::ILDAModel>(rb_mTomoto, "HLDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t levelDepth, tomoto::Float alpha, tomoto::Float eta, tomoto::Float gamma, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IHLDAModel::create((tomoto::TermWeight)tw, levelDepth, alpha, eta, gamma, seed);
-      })
-    .define_method(
-      "alpha",
-      *[](tomoto::IHLDAModel& self) {
-        Array res;
-        for (size_t i = 0; i < self.getLevelDepth(); i++) {
-          res.push(self.getAlpha(i));
-        }
-        return res;
-      })
-    .define_method(
-      "_children_topics",
-      *[](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
-        return self.getChildTopicId(topic_id);
-      })
-    .define_method(
-      "depth",
-      *[](tomoto::IHLDAModel& self) {
-        return self.getLevelDepth();
-      })
-    .define_method(
-      "gamma",
-      *[](tomoto::IHLDAModel& self) {
-        return self.getGamma();
-      })
-    .define_method(
-      "_level",
-      *[](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
-        return self.getLevelOfTopic(topic_id);
-      })
-    .define_method(
-      "live_k",
-      *[](tomoto::IHLDAModel& self) {
-        return self.getLiveK();
-      })
-    .define_method(
-      "_live_topic?",
-      *[](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
-        return self.isLiveTopic(topic_id);
-      })
-    .define_method(
-      "_num_docs_of_topic",
-      *[](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
-        return self.getNumDocsOfTopic(topic_id);
-      })
-    .define_method(
-      "_parent_topic",
-      *[](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
-        return self.getParentTopicId(topic_id);
-      });
-  Class rb_cPA = define_class_under<tomoto::IPAModel, tomoto::ILDAModel>(rb_mTomoto, "PA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k1, size_t k2, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IPAModel::create((tomoto::TermWeight)tw, k1, k2, alpha, eta, seed);
-      })
-    .define_method(
-      "k1",
-      *[](tomoto::IPAModel& self) {
-        return self.getK();
-      })
-    .define_method(
-      "k2",
-      *[](tomoto::IPAModel& self) {
-        return self.getK2();
-      });
-  Class rb_cHPA = define_class_under<tomoto::IHPAModel, tomoto::IPAModel>(rb_mTomoto, "HPA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k1, size_t k2, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IHPAModel::create((tomoto::TermWeight)tw, false, k1, k2, alpha, eta, seed);
-      })
-    .define_method(
-      "alpha",
-      *[](tomoto::IHPAModel& self) {
-        Array res;
-        // use <= to return k+1 elements
-        for (size_t i = 0; i <= self.getK(); i++) {
-          res.push(self.getAlpha(i));
-        }
-        return res;
-      });
-  Class rb_cMGLDA = define_class_under<tomoto::IMGLDAModel, tomoto::ILDAModel>(rb_mTomoto, "MGLDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k_g, size_t k_l, size_t t, tomoto::Float alpha_g, tomoto::Float alpha_l, tomoto::Float alpha_mg, tomoto::Float alpha_ml, tomoto::Float eta_g) {
-        return tomoto::IMGLDAModel::create((tomoto::TermWeight)tw, k_g, k_l, t, alpha_g, alpha_l, alpha_mg, alpha_ml, eta_g);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::IMGLDAModel& self, std::vector<std::string> words, std::string delimiter) {
-        auto doc = buildDoc(words);
-        doc.misc["delimiter"] = delimiter;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "alpha_g",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getAlpha();
-      })
-    .define_method(
-      "alpha_l",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getAlphaL();
-      })
-    .define_method(
-      "alpha_mg",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getAlphaM();
-      })
-    .define_method(
-      "alpha_ml",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getAlphaML();
-      })
-    .define_method(
-      "eta_g",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getEta();
-      })
-    .define_method(
-      "eta_l",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getEtaL();
-      })
-    .define_method(
-      "gamma",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getGamma();
-      })
-    .define_method(
-      "k_g",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getK();
-      })
-    .define_method(
-      "k_l",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getKL();
-      })
-    .define_method(
-      "t",
-      *[](tomoto::IMGLDAModel& self) {
-        return self.getT();
-      });
-  Class rb_cLLDA = define_class_under<tomoto::ILLDAModel, tomoto::ILDAModel>(rb_mTomoto, "LLDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::ILLDAModel::create((tomoto::TermWeight)tw, k, alpha, eta, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::ILLDAModel& self, std::vector<std::string> words, std::vector<std::string> labels) {
-        auto doc = buildDoc(words);
-        doc.misc["labels"] = labels;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "topics_per_label",
-      *[](tomoto::ILLDAModel& self) {
-        return self.getNumTopicsPerLabel();
-      });
-  Class rb_cPLDA = define_class_under<tomoto::IPLDAModel, tomoto::ILLDAModel>(rb_mTomoto, "PLDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t latent_topics, tomoto::Float alpha, tomoto::Float eta, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        return tomoto::IPLDAModel::create((tomoto::TermWeight)tw, latent_topics, 1, alpha, eta, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::IPLDAModel& self, std::vector<std::string> words, std::vector<std::string> labels) {
-        auto doc = buildDoc(words);
-        doc.misc["labels"] = labels;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "latent_topics",
-      *[](tomoto::IPLDAModel& self) {
-        return self.getNumLatentTopics();
-      });
-  Class rb_cSLDA = define_class_under<tomoto::ISLDAModel, tomoto::ILDAModel>(rb_mTomoto, "SLDA")
-    .define_singleton_method(
-      "_new",
-      *[](size_t tw, size_t k, Array rb_vars, tomoto::Float alpha, tomoto::Float eta, std::vector<tomoto::Float> mu, std::vector<tomoto::Float> nu_sq, std::vector<tomoto::Float> glm_param, int seed) {
-        if (seed < 0) {
-          seed = std::random_device{}();
-        }
-        std::vector<tomoto::ISLDAModel::GLM> vars;
-        vars.reserve(rb_vars.size());
-        for (auto const& v : rb_vars) {
-          vars.push_back((tomoto::ISLDAModel::GLM) from_ruby<int>(v));
-        }
-        return tomoto::ISLDAModel::create((tomoto::TermWeight)tw, k, vars, alpha, eta, mu, nu_sq, glm_param, seed);
-      })
-    .define_method(
-      "_add_doc",
-      *[](tomoto::ISLDAModel& self, std::vector<std::string> words, std::vector<tomoto::Float> y) {
-        auto doc = buildDoc(words);
-        doc.misc["y"] = y;
-        self.addDoc(doc);
-      })
-    .define_method(
-      "f",
-      *[](tomoto::ISLDAModel& self) {
-        return self.getF();
-      })
-    .define_method(
-      "_var_type",
-      *[](tomoto::ISLDAModel& self, size_t var_id) {
-        if (var_id >= self.getF()) throw std::runtime_error{ "'var_id' must be < 'f'" };
-        return self.getTypeOfVar(var_id) == tomoto::ISLDAModel::GLM::linear ? "l" : "b";
-      });
+  init_lda(m);
+  init_ct(m);
+  init_dmr(m);
+  init_dt(m);
+  init_gdmr(m);
+  init_hdp(m);
+  init_hlda(m);
+  init_pa(m);
+  init_hpa(m);
+  init_mglda(m);
+  init_llda(m);
+  init_plda(m);
+  init_slda(m);
 }