RubyGems - tomoto - Versions diffs - 0.3.0-x86_64-darwin - Mend

tomoto 0.3.0-x86_64-darwin

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (97) hide show

checksums.yaml +7 -0
data/CHANGELOG.md +45 -0
data/LICENSE.txt +22 -0
data/README.md +162 -0
data/ext/tomoto/ct.cpp +58 -0
data/ext/tomoto/dmr.cpp +69 -0
data/ext/tomoto/dt.cpp +91 -0
data/ext/tomoto/extconf.rb +34 -0
data/ext/tomoto/gdmr.cpp +42 -0
data/ext/tomoto/hdp.cpp +47 -0
data/ext/tomoto/hlda.cpp +71 -0
data/ext/tomoto/hpa.cpp +32 -0
data/ext/tomoto/lda.cpp +281 -0
data/ext/tomoto/llda.cpp +33 -0
data/ext/tomoto/mglda.cpp +81 -0
data/ext/tomoto/pa.cpp +32 -0
data/ext/tomoto/plda.cpp +33 -0
data/ext/tomoto/slda.cpp +48 -0
data/ext/tomoto/tomoto.cpp +48 -0
data/ext/tomoto/utils.h +30 -0
data/lib/tomoto/2.7/tomoto.bundle +0 -0
data/lib/tomoto/3.0/tomoto.bundle +0 -0
data/lib/tomoto/3.1/tomoto.bundle +0 -0
data/lib/tomoto/ct.rb +24 -0
data/lib/tomoto/dmr.rb +27 -0
data/lib/tomoto/dt.rb +15 -0
data/lib/tomoto/gdmr.rb +15 -0
data/lib/tomoto/hdp.rb +11 -0
data/lib/tomoto/hlda.rb +56 -0
data/lib/tomoto/hpa.rb +11 -0
data/lib/tomoto/lda.rb +181 -0
data/lib/tomoto/llda.rb +15 -0
data/lib/tomoto/mglda.rb +15 -0
data/lib/tomoto/pa.rb +11 -0
data/lib/tomoto/plda.rb +15 -0
data/lib/tomoto/slda.rb +37 -0
data/lib/tomoto/version.rb +3 -0
data/lib/tomoto.rb +27 -0
data/vendor/EigenRand/EigenRand/EigenRand +24 -0
data/vendor/EigenRand/LICENSE +21 -0
data/vendor/EigenRand/README.md +426 -0
data/vendor/eigen/COPYING.APACHE +203 -0
data/vendor/eigen/COPYING.BSD +26 -0
data/vendor/eigen/COPYING.GPL +674 -0
data/vendor/eigen/COPYING.LGPL +502 -0
data/vendor/eigen/COPYING.MINPACK +51 -0
data/vendor/eigen/COPYING.MPL2 +373 -0
data/vendor/eigen/COPYING.README +18 -0
data/vendor/eigen/Eigen/Cholesky +45 -0
data/vendor/eigen/Eigen/CholmodSupport +48 -0
data/vendor/eigen/Eigen/Core +384 -0
data/vendor/eigen/Eigen/Dense +7 -0
data/vendor/eigen/Eigen/Eigen +2 -0
data/vendor/eigen/Eigen/Eigenvalues +60 -0
data/vendor/eigen/Eigen/Geometry +59 -0
data/vendor/eigen/Eigen/Householder +29 -0
data/vendor/eigen/Eigen/IterativeLinearSolvers +48 -0
data/vendor/eigen/Eigen/Jacobi +32 -0
data/vendor/eigen/Eigen/KLUSupport +41 -0
data/vendor/eigen/Eigen/LU +47 -0
data/vendor/eigen/Eigen/MetisSupport +35 -0
data/vendor/eigen/Eigen/OrderingMethods +70 -0
data/vendor/eigen/Eigen/PaStiXSupport +49 -0
data/vendor/eigen/Eigen/PardisoSupport +35 -0
data/vendor/eigen/Eigen/QR +50 -0
data/vendor/eigen/Eigen/QtAlignedMalloc +39 -0
data/vendor/eigen/Eigen/SPQRSupport +34 -0
data/vendor/eigen/Eigen/SVD +50 -0
data/vendor/eigen/Eigen/Sparse +34 -0
data/vendor/eigen/Eigen/SparseCholesky +37 -0
data/vendor/eigen/Eigen/SparseCore +69 -0
data/vendor/eigen/Eigen/SparseLU +50 -0
data/vendor/eigen/Eigen/SparseQR +36 -0
data/vendor/eigen/Eigen/StdDeque +27 -0
data/vendor/eigen/Eigen/StdList +26 -0
data/vendor/eigen/Eigen/StdVector +27 -0
data/vendor/eigen/Eigen/SuperLUSupport +64 -0
data/vendor/eigen/Eigen/UmfPackSupport +40 -0
data/vendor/eigen/README.md +5 -0
data/vendor/eigen/bench/README.txt +55 -0
data/vendor/eigen/bench/btl/COPYING +340 -0
data/vendor/eigen/bench/btl/README +154 -0
data/vendor/eigen/bench/tensors/README +20 -0
data/vendor/eigen/blas/README.txt +6 -0
data/vendor/eigen/ci/README.md +56 -0
data/vendor/eigen/demos/mandelbrot/README +10 -0
data/vendor/eigen/demos/mix_eigen_and_c/README +9 -0
data/vendor/eigen/demos/opengl/README +13 -0
data/vendor/eigen/unsupported/Eigen/CXX11/src/Tensor/README.md +1815 -0
data/vendor/eigen/unsupported/README.txt +50 -0
data/vendor/tomotopy/LICENSE +21 -0
data/vendor/tomotopy/README.kr.rst +512 -0
data/vendor/tomotopy/README.rst +516 -0
data/vendor/variant/LICENSE +25 -0
data/vendor/variant/LICENSE_1_0.txt +23 -0
data/vendor/variant/README.md +102 -0
metadata +140 -0

checksums.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+---
+SHA256:
+  metadata.gz: b23bb72cb63777f22912c00abe475b2ba903b2abd0ab12ef5ebafc0832ef3d4d
+  data.tar.gz: c7a98c977d7864ce142df08380b0ed3cc94b663221af79ddb291393102b9603b
+SHA512:
+  metadata.gz: 378389c5f113de2e5cf0db7b6a433fd189a74afca495e2ecc69cf1ffddb32c5dba0761a98c245ba748e1e8365633958573591d0182af1d2d5b8b23bee9f6a3ba
+  data.tar.gz: 385e48e227645fb6148bea04b6d04157e6cf4b271b23114bc168463886ac167e06315ffa65ce7def5eb9cf3c94cfee5483cf1761208a5fb5323c00e2a3395550

data/CHANGELOG.md ADDED Viewed

@@ -0,0 +1,45 @@
+## 0.3.0 (2022-10-03)
+- Added precompiled gems for Linux and Mac
+- Updated tomoto to 0.12.3
+- Dropped support for Ruby < 2.7
+## 0.2.3 (2021-08-26)
+- Updated to Rice 4
+## 0.2.2 (2021-08-23)
+- Reduced gem size
+## 0.2.1 (2021-08-23)
+- Added support for unseen documents
+## 0.2.0 (2021-05-23)
+- Updated tomoto to 0.12.0
+- Dropped support for Ruby < 2.6
+## 0.1.4 (2021-03-14)
+- Added `docs` method
+- Updated tomoto to 0.10.2
+- Updated `add_doc` to return the index of the document
+## 0.1.3 (2020-12-19)
+- Updated tomoto to 0.10.0
+## 0.1.2 (2020-10-10)
+- Added `summary` method
+- Added `parallel` option to `train` method
+## 0.1.1 (2020-10-10)
+- Added many more models
+## 0.1.0 (2020-10-09)
+- First release

data/LICENSE.txt ADDED Viewed

@@ -0,0 +1,22 @@
+MIT License
+Copyright (c) 2019, bab2min
+Copyright (c) 2020-2021 Andrew Kane
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

data/README.md ADDED Viewed

@@ -0,0 +1,162 @@
+# tomoto.rb
+:tomato: [tomoto](https://github.com/bab2min/tomotopy) - high performance topic modeling - for Ruby
+[![Build Status](https://github.com/ankane/tomoto-ruby/workflows/build/badge.svg?branch=master)](https://github.com/ankane/tomoto-ruby/actions)
+## Installation
+Add this line to your application’s Gemfile:
+```ruby
+gem "tomoto"
+```
+## Getting Started
+Train a model
+```ruby
+model = Tomoto::LDA.new(k: 2)
+model.add_doc("text from document one")
+model.add_doc("text from document two")
+model.add_doc("text from document three")
+model.train(100) # iterations
+```
+Get the summary
+```ruby
+model.summary
+```
+Get topic words
+```ruby
+model.topic_words
+```
+Save the model to a file
+```ruby
+model.save("model.bin")
+```
+Load the model from a file
+```ruby
+model = Tomoto::LDA.load("model.bin")
+```
+Get topic probabilities for a document
+```ruby
+doc = model.docs[0]
+doc.topics
+```
+Get the number of words for each topic
+```ruby
+model.count_by_topics
+```
+Get the vocab
+```ruby
+model.vocabs
+```
+Get the log likelihood per word
+```ruby
+model.ll_per_word
+```
+Perform inference for unseen documents
+```ruby
+doc = model.make_doc("unseen doc")
+topic_dist, ll = model.infer(doc)
+```
+## Models
+Supports:
+- Latent Dirichlet Allocation (`LDA`)
+- Labeled LDA (`LLDA`)
+- Partially Labeled LDA (`PLDA`)
+- Supervised LDA (`SLDA`)
+- Dirichlet Multinomial Regression (`DMR`)
+- Generalized Dirichlet Multinomial Regression (`GDMR`)
+- Hierarchical Dirichlet Process (`HDP`)
+- Hierarchical LDA (`HLDA`)
+- Multi Grain LDA (`MGLDA`)
+- Pachinko Allocation (`PA`)
+- Hierarchical PA (`HPA`)
+- Correlated Topic Model (`CT`)
+- Dynamic Topic Model (`DT`)
+## API
+This library follows the [tomotopy API](https://bab2min.github.io/tomotopy/v0.9.0/en/). There are a few changes to make it more Ruby-like:
+- The `get_` prefix has been removed from methods (`topic_words` instead of `get_topic_words`)
+- Methods that return booleans use `?` instead of `is_` (`live_topic?` instead of `is_live_topic`)
+If a method or option you need isn’t supported, feel free to open an issue.
+## Examples
+- [LDA](examples/lda_basic.rb)
+- [HDP](examples/hdp_basic.rb)
+## Tokenization
+Documents are tokenized by whitespace by default, or you can perform your own tokenization.
+```ruby
+model.add_doc(["tokens", "from", "document", "one"])
+```
+## Performance
+tomoto uses AVX2, AVX, or SSE2 instructions to increase performance on machines that support them. Check which instruction set architecture it’s using with:
+```ruby
+Tomoto.isa
+```
+## Parallelism
+Choose a [parallelism algorithm](https://bab2min.github.io/tomotopy/v0.9.0/en/#parallel-sampling-algorithms) with:
+```ruby
+model.train(parallel: :partition)
+```
+Supported values are `:default`, `:none`, `:copy_merge`, and `:partition`.
+## History
+View the [changelog](https://github.com/ankane/tomoto-ruby/blob/master/CHANGELOG.md)
+## Contributing
+Everyone is encouraged to help improve this project. Here are a few ways you can help:
+- [Report bugs](https://github.com/ankane/tomoto-ruby/issues)
+- Fix bugs and [submit pull requests](https://github.com/ankane/tomoto-ruby/pulls)
+- Write, clarify, or fix documentation
+- Suggest or add new features
+To get started with development:
+```sh
+git clone --recursive https://github.com/ankane/tomoto-ruby.git
+cd tomoto-ruby
+bundle install
+bundle exec rake compile
+bundle exec rake test
+```

data/ext/tomoto/ct.cpp ADDED Viewed

@@ -0,0 +1,58 @@
+#include <CT.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the CT (Correlated Topic Model) class under module `m`, binding
+// tomoto::ICTModel with tomoto::ILDAModel as its parent class.
+void init_ct(Rice::Module& m) {
+  Rice::define_class_under<tomoto::ICTModel, tomoto::ILDAModel>(m, "CT")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw`, topic count `k` and
+      // the alpha/eta hyperparameters; ownership of the result goes to Ruby.
+      [](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, size_t seed) {
+        tomoto::CTArgs args;
+        args.k = k;
+        args.alpha = {alpha};
+        args.eta = eta;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        return tomoto::ICTModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "_correlations",
+      // Forwards to getCorrelationTopic for the given topic id.
+      [](tomoto::ICTModel& self, tomoto::Tid topic_id) {
+        return self.getCorrelationTopic(topic_id);
+      })
+    .define_method(
+      "num_beta_sample",
+      [](tomoto::ICTModel& self) {
+        return self.getNumBetaSample();
+      })
+    .define_method(
+      "num_beta_sample=",
+      // Setter; returns the assigned value.
+      [](tomoto::ICTModel& self, size_t value) {
+        self.setNumBetaSample(value);
+        return value;
+      })
+    .define_method(
+      "num_tmn_sample",
+      [](tomoto::ICTModel& self) {
+        return self.getNumTMNSample();
+      })
+    .define_method(
+      "num_tmn_sample=",
+      // Setter; returns the assigned value.
+      [](tomoto::ICTModel& self, size_t value) {
+        self.setNumTMNSample(value);
+        return value;
+      })
+    .define_method(
+      "_prior_cov",
+      [](tomoto::ICTModel& self) {
+        return self.getPriorCov();
+      })
+    .define_method(
+      "prior_mean",
+      [](tomoto::ICTModel& self) {
+        return self.getPriorMean();
+      });
+}

data/ext/tomoto/dmr.cpp ADDED Viewed

@@ -0,0 +1,69 @@
+#include <DMR.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the DMR (Dirichlet Multinomial Regression) class under module
+// `m`, binding tomoto::IDMRModel with tomoto::ILDAModel as its parent class.
+void init_dmr(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IDMRModel, tomoto::ILDAModel>(m, "DMR")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw` and the DMR
+      // hyperparameters; ownership of the result goes to Ruby.
+      [](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float sigma, tomoto::Float eta, tomoto::Float alpha_epsilon, size_t seed) {
+        tomoto::DMRArgs args;
+        args.k = k;
+        args.alpha = {alpha};
+        args.sigma = sigma;
+        args.eta = eta;
+        args.alphaEps = alpha_epsilon;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        return tomoto::IDMRModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "_add_doc",
+      // Builds a document from `words`, attaches the metadata string under
+      // the "metadata" key and returns whatever addDoc returns.
+      [](tomoto::IDMRModel& self, std::vector<std::string> words, std::string metadata) {
+        auto doc = buildDoc(words);
+        doc.misc["metadata"] = metadata;
+        return self.addDoc(doc);
+      })
+    .define_method(
+      "alpha_epsilon",
+      [](tomoto::IDMRModel& self) {
+        return self.getAlphaEps();
+      })
+    .define_method(
+      "alpha_epsilon=",
+      // Setter; returns the assigned value.
+      [](tomoto::IDMRModel& self, tomoto::Float value) {
+        self.setAlphaEps(value);
+        return value;
+      })
+    .define_method(
+      "f",
+      [](tomoto::IDMRModel& self) {
+        return self.getF();
+      })
+    .define_method(
+      "_lambdas",
+      [](tomoto::IDMRModel& self, tomoto::Tid topic_id) {
+        return self.getLambdaByTopic(topic_id);
+      })
+    .define_method(
+      "metadata_dict",
+      // Returns every word of the metadata dictionary as a Ruby string whose
+      // encoding has been forced to UTF-8.
+      [](tomoto::IDMRModel& self) {
+        auto dict = self.getMetadataDict();
+        Array res;
+        auto utf8 = Rice::Class(rb_cEncoding).call("const_get", "UTF_8");
+        for (size_t i = 0; i < dict.size(); i++) {
+          VALUE value = Rice::detail::To_Ruby<std::string>().convert(dict.toWord(i));
+          Object obj(value);
+          res.push(obj.call("force_encoding", utf8));
+        }
+        return res;
+      })
+    .define_method(
+      "sigma",
+      [](tomoto::IDMRModel& self) {
+        return self.getSigma();
+      });
+}

data/ext/tomoto/dt.cpp ADDED Viewed

@@ -0,0 +1,91 @@
+#include <DT.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the DT (Dynamic Topic Model) class under module `m`, binding
+// tomoto::IDTModel with tomoto::ILDAModel as its parent class.
+void init_dt(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IDTModel, tomoto::ILDAModel>(m, "DT")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw`, topic count `k`,
+      // timepoint count `t` and the DT hyperparameters; ownership of the
+      // result goes to Ruby.
+      [](size_t tw, size_t k, size_t t, tomoto::Float alphaVar, tomoto::Float etaVar, tomoto::Float phiVar, tomoto::Float shapeA, tomoto::Float shapeB, tomoto::Float shapeC) {
+        // Rice only supports 10 arguments, so no seed parameter is taken here.
+        // The previous code set a local `size_t seed = -1` and tested
+        // `seed >= 0`, which is always true for an unsigned value and so
+        // forced args.seed to SIZE_MAX on every call. args.seed is now left
+        // at whatever DTArgs initializes it to.
+        tomoto::DTArgs args;
+        args.k = k;
+        args.t = t;
+        args.alpha = {alphaVar};
+        args.eta = etaVar;
+        args.phi = phiVar;
+        args.shapeA = shapeA;
+        args.shapeB = shapeB;
+        args.shapeC = shapeC;
+        return tomoto::IDTModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "_add_doc",
+      // Builds a document from `words`, attaches the timepoint under the
+      // "timepoint" key and returns whatever addDoc returns.
+      [](tomoto::IDTModel& self, std::vector<std::string> words, uint32_t timepoint) {
+        auto doc = buildDoc(words);
+        doc.misc["timepoint"] = timepoint;
+        return self.addDoc(doc);
+      })
+    .define_method(
+      "alpha",
+      // Returns a nested array: one row per topic (getK), one entry per
+      // timepoint (getT), filled from getAlpha(topic, timepoint).
+      [](tomoto::IDTModel& self) {
+        Array res;
+        for (size_t i = 0; i < self.getK(); i++) {
+          Array res2;
+          for (size_t j = 0; j < self.getT(); j++) {
+            res2.push(self.getAlpha(i, j));
+          }
+          res.push(res2);
+        }
+        return res;
+      })
+    .define_method(
+      "lr_a",
+      [](tomoto::IDTModel& self) {
+        return self.getShapeA();
+      })
+    .define_method(
+      "lr_a=",
+      // Setter; returns the assigned value.
+      [](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeA(value);
+        return value;
+      })
+    .define_method(
+      "lr_b",
+      [](tomoto::IDTModel& self) {
+        return self.getShapeB();
+      })
+    .define_method(
+      "lr_b=",
+      // Setter; returns the assigned value.
+      [](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeB(value);
+        return value;
+      })
+    .define_method(
+      "lr_c",
+      [](tomoto::IDTModel& self) {
+        return self.getShapeC();
+      })
+    .define_method(
+      "lr_c=",
+      // Setter; returns the assigned value.
+      [](tomoto::IDTModel& self, tomoto::Float value) {
+        self.setShapeC(value);
+        return value;
+      })
+    .define_method(
+      "num_docs_by_timepoint",
+      [](tomoto::IDTModel& self) {
+        return self.getNumDocsByT();
+      })
+    .define_method(
+      "num_timepoints",
+      [](tomoto::IDTModel& self) {
+        return self.getT();
+      });
+}

data/ext/tomoto/extconf.rb ADDED Viewed

@@ -0,0 +1,34 @@
+# Build configuration for the tomoto native extension: sets compiler flags,
+# collects the sources and include paths, then writes the Makefile.
+require "mkmf-rice"
+# Compile as C++17 and define EIGEN_MPL2_ONLY for the vendored Eigen headers.
+$CXXFLAGS += " -std=c++17 $(optflags) -DEIGEN_MPL2_ONLY"
+# Only add machine-specific tuning when RUBY_CC_VERSION is unset.
+# NOTE(review): presumably RUBY_CC_VERSION marks a cross-compiled
+# (precompiled gem) build - confirm.
+unless ENV["RUBY_CC_VERSION"]
+  # AVX-512F is not supported yet
+  # https://github.com/bab2min/tomotopy/issues/188
+  $CXXFLAGS << " " << with_config("optflags", "-march=native -mno-avx512f")
+end
+# Warning suppressions differ depending on whether the compiler is Apple clang.
+apple_clang = RbConfig::CONFIG["CC_VERSION_MESSAGE"] =~ /apple clang/i
+if apple_clang
+  # silence rice warnings
+  $CXXFLAGS += " -Wno-deprecated-declarations"
+else
+  # silence eigen warnings
+  $CXXFLAGS += " -Wno-ignored-attributes -Wno-deprecated-copy"
+end
+# silence tomoto warnings
+$CXXFLAGS += " -Wno-unused-variable -Wno-switch"
+# Absolute paths of this extension directory and the vendored libraries.
+ext = File.expand_path(".", __dir__)
+tomoto = File.expand_path("../../vendor/tomotopy/src/TopicModel", __dir__)
+eigen = File.expand_path("../../vendor/eigen", __dir__)
+eigen_rand = File.expand_path("../../vendor/EigenRand", __dir__)
+variant = File.expand_path("../../vendor/variant/include", __dir__)
+# Compile every .cpp file found directly in the extension and tomoto directories.
+$srcs = Dir["{#{ext},#{tomoto}}/*.cpp"]
+$INCFLAGS += " -I#{tomoto} -I#{eigen} -I#{eigen_rand} -I#{variant}"
+# Let make locate the tomoto sources, which live outside the extension directory.
+$VPATH << tomoto
+create_makefile("tomoto/tomoto")

data/ext/tomoto/gdmr.cpp ADDED Viewed

@@ -0,0 +1,42 @@
+#include <GDMR.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the GDMR (Generalized Dirichlet Multinomial Regression) class
+// under module `m`, binding tomoto::IGDMRModel with tomoto::IDMRModel as its
+// parent class.
+void init_gdmr(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IGDMRModel, tomoto::IDMRModel>(m, "GDMR")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw` and the GDMR
+      // hyperparameters; ownership of the result goes to Ruby.
+      [](size_t tw, size_t k, std::vector<uint64_t> degrees, tomoto::Float alpha, tomoto::Float sigma, tomoto::Float sigma0, tomoto::Float eta, tomoto::Float alpha_epsilon, size_t seed) {
+        tomoto::GDMRArgs args;
+        args.k = k;
+        args.degrees = degrees;
+        args.alpha = {alpha};
+        args.sigma = sigma;
+        args.sigma0 = sigma0;
+        args.eta = eta;
+        args.alphaEps = alpha_epsilon;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        return tomoto::IGDMRModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "_add_doc",
+      // Builds a document from `words`, attaches the numeric metadata under
+      // the "numeric_metadata" key and returns whatever addDoc returns.
+      [](tomoto::IGDMRModel& self, std::vector<std::string> words, std::vector<tomoto::Float> numeric_metadata) {
+        auto doc = buildDoc(words);
+        doc.misc["numeric_metadata"] = numeric_metadata;
+        return self.addDoc(doc);
+      })
+    .define_method(
+      "degrees",
+      // Exposed to Ruby as `degrees`; backed by getFs().
+      [](tomoto::IGDMRModel& self) {
+        return self.getFs();
+      })
+    .define_method(
+      "sigma0",
+      [](tomoto::IGDMRModel& self) {
+        return self.getSigma0();
+      });
+}

data/ext/tomoto/hdp.cpp ADDED Viewed

@@ -0,0 +1,47 @@
+#include <HDP.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the HDP (Hierarchical Dirichlet Process) class under module `m`,
+// binding tomoto::IHDPModel with tomoto::ILDAModel as its parent class.
+void init_hdp(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IHDPModel, tomoto::ILDAModel>(m, "HDP")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw`, `k` and the
+      // alpha/eta/gamma hyperparameters; ownership of the result goes to Ruby.
+      [](size_t tw, size_t k, tomoto::Float alpha, tomoto::Float eta, tomoto::Float gamma, size_t seed) {
+        tomoto::HDPArgs args;
+        args.k = k;
+        args.alpha = {alpha};
+        args.eta = eta;
+        args.gamma = gamma;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        return tomoto::IHDPModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "alpha",
+      [](tomoto::IHDPModel& self) {
+        return self.getAlpha();
+      })
+    .define_method(
+      "gamma",
+      [](tomoto::IHDPModel& self) {
+        return self.getGamma();
+      })
+    .define_method(
+      "live_k",
+      [](tomoto::IHDPModel& self) {
+        return self.getLiveK();
+      })
+    .define_method(
+      "live_topic?",
+      // Forwards to isLiveTopic for the given topic id.
+      [](tomoto::IHDPModel& self, size_t tid) {
+        return self.isLiveTopic(tid);
+      })
+    .define_method(
+      "num_tables",
+      // Exposed to Ruby as `num_tables`; backed by getTotalTables().
+      [](tomoto::IHDPModel& self) {
+        return self.getTotalTables();
+      });
+}

data/ext/tomoto/hlda.cpp ADDED Viewed

@@ -0,0 +1,71 @@
+#include <HLDA.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the HLDA (Hierarchical LDA) class under module `m`, binding
+// tomoto::IHLDAModel with tomoto::ILDAModel as its parent class.
+void init_hlda(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IHLDAModel, tomoto::ILDAModel>(m, "HLDA")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw`, the level depth and
+      // the alpha/eta/gamma hyperparameters; ownership of the result goes to
+      // Ruby.
+      [](size_t tw, size_t levelDepth, tomoto::Float alpha, tomoto::Float eta, tomoto::Float gamma, size_t seed) {
+        tomoto::HLDAArgs args;
+        // The level depth is carried in the args' `k` field.
+        args.k = levelDepth;
+        args.alpha = {alpha};
+        args.eta = eta;
+        args.gamma = gamma;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        return tomoto::IHLDAModel::create(static_cast<tomoto::TermWeight>(tw), args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "alpha",
+      // Returns one getAlpha(level) value per level, getLevelDepth() in total.
+      [](tomoto::IHLDAModel& self) {
+        Array res;
+        for (size_t i = 0; i < self.getLevelDepth(); i++) {
+          res.push(self.getAlpha(i));
+        }
+        return res;
+      })
+    .define_method(
+      "_children_topics",
+      [](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
+        return self.getChildTopicId(topic_id);
+      })
+    .define_method(
+      "depth",
+      [](tomoto::IHLDAModel& self) {
+        return self.getLevelDepth();
+      })
+    .define_method(
+      "gamma",
+      [](tomoto::IHLDAModel& self) {
+        return self.getGamma();
+      })
+    .define_method(
+      "_level",
+      [](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
+        return self.getLevelOfTopic(topic_id);
+      })
+    .define_method(
+      "live_k",
+      [](tomoto::IHLDAModel& self) {
+        return self.getLiveK();
+      })
+    .define_method(
+      "_live_topic?",
+      [](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
+        return self.isLiveTopic(topic_id);
+      })
+    .define_method(
+      "_num_docs_of_topic",
+      [](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
+        return self.getNumDocsOfTopic(topic_id);
+      })
+    .define_method(
+      "_parent_topic",
+      [](tomoto::IHLDAModel& self, tomoto::Tid topic_id) {
+        return self.getParentTopicId(topic_id);
+      });
+}

data/ext/tomoto/hpa.cpp ADDED Viewed

@@ -0,0 +1,32 @@
+#include <HPA.h>
+#include <rice/rice.hpp>
+#include "utils.h"
+// Registers the HPA (Hierarchical PA) class under module `m`, binding
+// tomoto::IHPAModel with tomoto::IPAModel as its parent class.
+void init_hpa(Rice::Module& m) {
+  Rice::define_class_under<tomoto::IHPAModel, tomoto::IPAModel>(m, "HPA")
+    .define_singleton_function(
+      "_new",
+      // Builds a model from the term-weight index `tw`, the two topic counts
+      // `k1`/`k2` and the alpha/eta hyperparameters; ownership of the result
+      // goes to Ruby.
+      [](size_t tw, size_t k1, size_t k2, tomoto::Float alpha, tomoto::Float eta, size_t seed) {
+        tomoto::HPAArgs args;
+        args.k = k1;
+        args.k2 = k2;
+        args.alpha = {alpha};
+        args.eta = eta;
+        // `seed` is unsigned, so the previous `seed >= 0` test was always
+        // true and a -1 request ended up stored as SIZE_MAX. Compare against
+        // the wrapped sentinel so args.seed keeps its default in that case.
+        // NOTE(review): assumes callers pass -1 to mean "no seed" - confirm.
+        if (seed != static_cast<size_t>(-1)) {
+          args.seed = seed;
+        }
+        // The second argument to create() is always passed as false here.
+        return tomoto::IHPAModel::create(static_cast<tomoto::TermWeight>(tw), false, args);
+      }, Rice::Return().takeOwnership())
+    .define_method(
+      "alpha",
+      // Returns getAlpha(i) for i in 0..getK() inclusive.
+      [](tomoto::IHPAModel& self) {
+        Array res;
+        // use <= to return k+1 elements
+        for (size_t i = 0; i <= self.getK(); i++) {
+          res.push(self.getAlpha(i));
+        }
+        return res;
+      });
+}