tomoto 0.1.3 → 0.1.4
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -0
- data/LICENSE.txt +1 -1
- data/README.md +7 -0
- data/ext/tomoto/ct.cpp +54 -0
- data/ext/tomoto/dmr.cpp +62 -0
- data/ext/tomoto/dt.cpp +82 -0
- data/ext/tomoto/ext.cpp +27 -773
- data/ext/tomoto/gdmr.cpp +34 -0
- data/ext/tomoto/hdp.cpp +42 -0
- data/ext/tomoto/hlda.cpp +66 -0
- data/ext/tomoto/hpa.cpp +27 -0
- data/ext/tomoto/lda.cpp +250 -0
- data/ext/tomoto/llda.cpp +29 -0
- data/ext/tomoto/mglda.cpp +71 -0
- data/ext/tomoto/pa.cpp +27 -0
- data/ext/tomoto/plda.cpp +29 -0
- data/ext/tomoto/slda.cpp +40 -0
- data/ext/tomoto/utils.h +84 -0
- data/lib/tomoto/tomoto.bundle +0 -0
- data/lib/tomoto/tomoto.so +0 -0
- data/lib/tomoto/version.rb +1 -1
- data/vendor/tomotopy/README.kr.rst +12 -3
- data/vendor/tomotopy/README.rst +12 -3
- data/vendor/tomotopy/src/Labeling/FoRelevance.cpp +47 -2
- data/vendor/tomotopy/src/Labeling/FoRelevance.h +21 -151
- data/vendor/tomotopy/src/Labeling/Labeler.h +5 -3
- data/vendor/tomotopy/src/Labeling/Phraser.hpp +518 -0
- data/vendor/tomotopy/src/TopicModel/CTModel.hpp +6 -3
- data/vendor/tomotopy/src/TopicModel/DT.h +1 -1
- data/vendor/tomotopy/src/TopicModel/DTModel.hpp +8 -23
- data/vendor/tomotopy/src/TopicModel/HDPModel.hpp +9 -18
- data/vendor/tomotopy/src/TopicModel/HLDAModel.hpp +56 -58
- data/vendor/tomotopy/src/TopicModel/HPAModel.hpp +4 -14
- data/vendor/tomotopy/src/TopicModel/LDA.h +69 -17
- data/vendor/tomotopy/src/TopicModel/LDACVB0Model.hpp +1 -1
- data/vendor/tomotopy/src/TopicModel/LDAModel.hpp +108 -61
- data/vendor/tomotopy/src/TopicModel/MGLDAModel.hpp +7 -8
- data/vendor/tomotopy/src/TopicModel/PAModel.hpp +26 -16
- data/vendor/tomotopy/src/TopicModel/PT.h +27 -0
- data/vendor/tomotopy/src/TopicModel/PTModel.cpp +10 -0
- data/vendor/tomotopy/src/TopicModel/PTModel.hpp +273 -0
- data/vendor/tomotopy/src/TopicModel/TopicModel.hpp +16 -11
- data/vendor/tomotopy/src/Utils/MultiNormalDistribution.hpp +3 -2
- data/vendor/tomotopy/src/Utils/Trie.hpp +39 -8
- data/vendor/tomotopy/src/Utils/TruncMultiNormal.hpp +36 -38
- data/vendor/tomotopy/src/Utils/Utils.hpp +50 -45
- data/vendor/tomotopy/src/Utils/math.h +8 -4
- data/vendor/tomotopy/src/Utils/tvector.hpp +4 -0
- metadata +24 -60

**data/vendor/tomotopy/src/TopicModel/MGLDAModel.hpp**

```diff
@@ -107,18 +107,16 @@ namespace tomoto
             e = edd.chunkOffsetByDoc(partitionId + 1, docId);
         }
 
-        size_t vOffset = (_ps == ParallelScheme::partition && partitionId) ? edd.vChunkOffset[partitionId - 1] : 0;
-
         const auto K = this->K;
         for (size_t w = b; w < e; ++w)
         {
             if (doc.words[w] >= this->realV) continue;
-            addWordTo<-1>(ld, doc, w, doc.words[w] - vOffset, doc.Zs[w] - (doc.Zs[w] < K ? 0 : K), doc.sents[w], doc.Vs[w], doc.Zs[w] < K ? 0 : 1);
-            auto dist = getVZLikelihoods(ld, doc, doc.words[w] - vOffset, doc.sents[w]);
+            addWordTo<-1>(ld, doc, w, doc.words[w], doc.Zs[w] - (doc.Zs[w] < K ? 0 : K), doc.sents[w], doc.Vs[w], doc.Zs[w] < K ? 0 : 1);
+            auto dist = getVZLikelihoods(ld, doc, doc.words[w], doc.sents[w]);
             auto vz = sample::sampleFromDiscreteAcc(dist, dist + T * (K + KL), rgs);
             doc.Vs[w] = vz / (K + KL);
             doc.Zs[w] = vz % (K + KL);
-            addWordTo<1>(ld, doc, w, doc.words[w] - vOffset, doc.Zs[w] - (doc.Zs[w] < K ? 0 : K), doc.sents[w], doc.Vs[w], doc.Zs[w] < K ? 0 : 1);
+            addWordTo<1>(ld, doc, w, doc.words[w], doc.Zs[w] - (doc.Zs[w] < K ? 0 : K), doc.sents[w], doc.Vs[w], doc.Zs[w] < K ? 0 : 1);
         }
     }
 
```
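For context, the hunk above shows the MGLDA word sampler drawing a joint (sentence-window, topic) assignment from one flattened distribution of length `T * (K + KL)` and splitting the flat index back into its two parts. A minimal standalone sketch of that decomposition, using `std::discrete_distribution` in place of tomotopy's `sample::sampleFromDiscreteAcc` (which samples from a prefix-summed array):

```cpp
#include <cstddef>
#include <random>
#include <vector>

int main()
{
    const std::size_t T = 3, K = 4, KL = 2;      // windows, global topics, local topics
    std::vector<double> dist(T * (K + KL), 1.0); // flattened joint (window, topic) weights
    std::mt19937 rgs{42};

    // equivalent of sampleFromDiscreteAcc over the accumulated weights
    std::discrete_distribution<std::size_t> draw(dist.begin(), dist.end());
    std::size_t vz = draw(rgs);

    std::size_t v = vz / (K + KL); // window index, stored in doc.Vs[w]
    std::size_t z = vz % (K + KL); // topic index, stored in doc.Zs[w];
                                   // global topic if z < K, local topic otherwise
    (void)v; (void)z;
    return 0;
}
```

The remaining hunks for this file follow below.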
```diff
@@ -294,7 +292,7 @@ namespace tomoto
         doc.Zs = tvector<Tid>(wordSize);
         doc.Vs.resize(wordSize);
         if (_tw != TermWeight::one) doc.wordWeights.resize(wordSize);
-        doc.numByTopic.init(nullptr, this->K + KL);
+        doc.numByTopic.init(nullptr, this->K + KL, 1);
         doc.numBySentWin = Eigen::Matrix<WeightType, -1, -1>::Zero(S, T);
         doc.numByWin = Eigen::Matrix<WeightType, -1, 1>::Zero(S + T - 1);
         doc.numByWinL = Eigen::Matrix<WeightType, -1, 1>::Zero(S + T - 1);
@@ -308,7 +306,8 @@ namespace tomoto
         if (initDocs)
         {
             this->globalState.numByTopic = Eigen::Matrix<WeightType, -1, 1>::Zero(this->K + KL);
-            this->globalState.numByTopicWord = Eigen::Matrix<WeightType, -1, -1>::Zero(this->K + KL, V);
+            //this->globalState.numByTopicWord = Eigen::Matrix<WeightType, -1, -1>::Zero(this->K + KL, V);
+            this->globalState.numByTopicWord.init(nullptr, this->K + KL, V);
         }
     }
 
@@ -533,7 +532,7 @@ namespace tomoto
     template<typename _TopicModel>
     void DocumentMGLDA<_tw>::update(WeightType * ptr, const _TopicModel & mdl)
     {
-        this->numByTopic.init(ptr, mdl.getK() + mdl.getKL());
+        this->numByTopic.init(ptr, mdl.getK() + mdl.getKL(), 1);
         numBySent.resize(*std::max_element(sents.begin(), sents.end()) + 1);
         for (size_t i = 0; i < this->Zs.size(); ++i)
         {
```
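The common thread in these hunks (and in the PAModel.hpp ones below) is that the count matrices stop being plain `Eigen::Matrix` members: the `Zero(...)` initializations are commented out in favor of `init(ptr, rows, cols)`, where a non-null pointer maps external memory (as in `DocumentMGLDA::update` above) and a null pointer apparently means self-owned storage, while writes go through `.matrix()`. The new type itself is defined in the Utils changes, which this page does not show; purely as a hypothetical sketch, a wrapper with that call pattern could look like:

```cpp
#include <Eigen/Dense>
#include <new>

// Hypothetical map-or-own wrapper matching the init()/matrix() call
// pattern in the diff; NOT the actual type tomotopy introduces.
template<typename Scalar>
class MapOrOwnMatrix
{
    using Mat = Eigen::Matrix<Scalar, -1, -1>;
    Mat own;                            // backing storage when ptr == nullptr
    Eigen::Map<Mat> map{nullptr, 0, 0};
public:
    void init(Scalar* ptr, Eigen::Index rows, Eigen::Index cols)
    {
        if (!ptr)
        {
            own.setZero(rows, cols);    // allocate and zero our own buffer
            ptr = own.data();
        }
        // reseat the Eigen::Map onto the chosen buffer (placement-new idiom)
        new (&map) Eigen::Map<Mat>{ptr, rows, cols};
    }
    // write target, e.g. m.matrix() = x.cwiseMax(0)
    Eigen::Map<Mat>& matrix() { return map; }
};
```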
**data/vendor/tomotopy/src/TopicModel/PAModel.hpp**

```diff
@@ -144,7 +144,7 @@ namespace tomoto
         size_t b = partitionId ? edd.vChunkOffset[partitionId - 1] : 0,
             e = edd.vChunkOffset[partitionId];
 
-        localData[partitionId].numByTopicWord = globalState.numByTopicWord.block(0, b, globalState.numByTopicWord.rows(), e - b);
+        localData[partitionId].numByTopicWord.matrix() = globalState.numByTopicWord.block(0, b, globalState.numByTopicWord.rows(), e - b);
         localData[partitionId].numByTopic = globalState.numByTopic;
         localData[partitionId].numByTopic1_2 = globalState.numByTopic1_2;
         localData[partitionId].numByTopic2 = globalState.numByTopic2;
@@ -157,8 +157,6 @@ namespace tomoto
     template<ParallelScheme _ps, typename _ExtraDocData>
     void mergeState(ThreadPool& pool, _ModelState& globalState, _ModelState& tState, _ModelState* localData, _RandGen*, const _ExtraDocData& edd) const
     {
-        std::vector<std::future<void>> res;
-
         if (_ps == ParallelScheme::copy_merge)
         {
             tState = globalState;
@@ -177,19 +175,12 @@ namespace tomoto
                 globalState.numByTopic = globalState.numByTopic.cwiseMax(0);
                 globalState.numByTopic1_2 = globalState.numByTopic1_2.cwiseMax(0);
                 globalState.numByTopic2 = globalState.numByTopic2.cwiseMax(0);
-                globalState.numByTopicWord = globalState.numByTopicWord.cwiseMax(0);
-            }
-
-            for (size_t i = 0; i < pool.getNumWorkers(); ++i)
-            {
-                res.emplace_back(pool.enqueue([&, this, i](size_t threadId)
-                {
-                    localData[i] = globalState;
-                }));
+                globalState.numByTopicWord.matrix() = globalState.numByTopicWord.cwiseMax(0);
             }
         }
         else if (_ps == ParallelScheme::partition)
         {
+            std::vector<std::future<void>> res;
             res = pool.enqueueToAll([&](size_t partitionId)
             {
                 size_t b = partitionId ? edd.vChunkOffset[partitionId - 1] : 0,
@@ -197,7 +188,6 @@ namespace tomoto
                 globalState.numByTopicWord.block(0, b, globalState.numByTopicWord.rows(), e - b) = localData[partitionId].numByTopicWord;
             });
             for (auto& r : res) r.get();
-            res.clear();
 
             tState.numByTopic1_2 = globalState.numByTopic1_2;
             globalState.numByTopic1_2 = localData[0].numByTopic1_2;
@@ -209,11 +199,31 @@ namespace tomoto
             // make all count being positive
             if (_tw != TermWeight::one)
             {
-                globalState.numByTopicWord = globalState.numByTopicWord.cwiseMax(0);
+                globalState.numByTopicWord.matrix() = globalState.numByTopicWord.cwiseMax(0);
             }
             globalState.numByTopic = globalState.numByTopic1_2.rowwise().sum();
             globalState.numByTopic2 = globalState.numByTopicWord.rowwise().sum();
 
+        }
+    }
+
+
+    template<ParallelScheme _ps>
+    void distributeMergedState(ThreadPool& pool, _ModelState& globalState, _ModelState* localData) const
+    {
+        std::vector<std::future<void>> res;
+        if (_ps == ParallelScheme::copy_merge)
+        {
+            for (size_t i = 0; i < pool.getNumWorkers(); ++i)
+            {
+                res.emplace_back(pool.enqueue([&, i](size_t)
+                {
+                    localData[i] = globalState;
+                }));
+            }
+        }
+        else if (_ps == ParallelScheme::partition)
+        {
             res = pool.enqueueToAll([&](size_t threadId)
             {
                 localData[threadId].numByTopic = globalState.numByTopic;
@@ -221,7 +231,6 @@ namespace tomoto
                 localData[threadId].numByTopic2 = globalState.numByTopic2;
             });
         }
-
        for (auto& r : res) r.get();
     }
 
@@ -304,7 +313,8 @@ namespace tomoto
             this->globalState.numByTopic = Eigen::Matrix<WeightType, -1, 1>::Zero(this->K);
             this->globalState.numByTopic2 = Eigen::Matrix<WeightType, -1, 1>::Zero(K2);
             this->globalState.numByTopic1_2 = Eigen::Matrix<WeightType, -1, -1>::Zero(this->K, K2);
-            this->globalState.numByTopicWord = Eigen::Matrix<WeightType, -1, -1>::Zero(K2, V);
+            //this->globalState.numByTopicWord = Eigen::Matrix<WeightType, -1, -1>::Zero(K2, V);
+            this->globalState.numByTopicWord.init(nullptr, K2, V);
         }
     }
 
```
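Taken together, these PAModel.hpp hunks split the old merge-and-redistribute step in two: `mergeState` now only folds per-worker (or per-partition) counts into the global state, and the redistribution that used to run inline moved into the new `distributeMergedState`. A schematic of the two phases; `State` and the plain loops are stand-ins for tomotopy's `_ModelState` and thread-pool dispatch, and the merge arithmetic is simplified:

```cpp
#include <cstddef>
#include <vector>

struct State { std::vector<int> numByTopic; };  // stand-in for _ModelState

// Phase 1 (mergeState): fold per-worker counts into the global state.
void mergeState(State& global, const std::vector<State>& local)
{
    for (const auto& l : local)
        for (std::size_t k = 0; k < global.numByTopic.size(); ++k)
            global.numByTopic[k] += l.numByTopic[k];
}

// Phase 2 (distributeMergedState): copy the merged state back out to every
// worker, as the new copy_merge branch does via pool.enqueue.
void distributeMergedState(const State& global, std::vector<State>& local)
{
    for (auto& l : local) l = global;
}

int main()
{
    State global{std::vector<int>(4, 0)};
    std::vector<State> local(2, State{std::vector<int>(4, 1)});
    mergeState(global, local);            // global now holds the summed counts
    distributeMergedState(global, local); // every worker sees the same state
    return 0;
}
```

Keeping the phases separate lets the caller decide when redistribution happens, which is presumably why `res` and the worker loop left `mergeState`.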
**data/vendor/tomotopy/src/TopicModel/PT.h** (new file)

```diff
@@ -0,0 +1,27 @@
+#pragma once
+#include "LDA.h"
+
+namespace tomoto
+{
+    template<TermWeight _tw>
+    struct DocumentPTM : public DocumentLDA<_tw>
+    {
+        using BaseDocument = DocumentLDA<_tw>;
+        using DocumentLDA<_tw>::DocumentLDA;
+        using WeightType = typename DocumentLDA<_tw>::WeightType;
+
+        uint64_t pseudoDoc = 0;
+
+        DEFINE_SERIALIZER_AFTER_BASE_WITH_VERSION(BaseDocument, 0, pseudoDoc);
+        DEFINE_TAGGED_SERIALIZER_AFTER_BASE_WITH_VERSION(BaseDocument, 1, 0x00010001, pseudoDoc);
+    };
+
+    class IPTModel : public ILDAModel
+    {
+    public:
+        using DefaultDocType = DocumentPTM<TermWeight::one>;
+        static IPTModel* create(TermWeight _weight, size_t _K = 1, size_t _P = 100,
+            Float alpha = 0.1, Float eta = 0.01, Float lambda = 0.01, size_t seed = std::random_device{}(),
+            bool scalarRng = false);
+    };
+}
```
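PT.h is the new public header for the pseudo-document topic model (PTM). A hypothetical construction sketch against the factory declared above; the calls for adding documents and training belong to the inherited `ILDAModel`/`ITopicModel` interfaces, which this diff does not show, so they are left as a comment:

```cpp
#include "PT.h"

int main()
{
    // Defaults per the declaration above: _K = 1, _P = 100, alpha = 0.1,
    // eta = 0.01, lambda = 0.01.
    tomoto::IPTModel* model = tomoto::IPTModel::create(
        tomoto::TermWeight::one,
        10,     // _K: number of topics
        1000,   // _P: number of pseudo-documents
        0.1f,   // alpha: pseudo-document/topic prior
        0.01f,  // eta: topic/word prior
        0.01f); // lambda: prior on pseudo-document assignment
    // ... add documents and train via the base interface ...
    delete model;  // assumes the interface has a virtual destructor
    return 0;
}
```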
**data/vendor/tomotopy/src/TopicModel/PTModel.cpp** (new file)

```diff
@@ -0,0 +1,10 @@
+#include "PTModel.hpp"
+
+namespace tomoto
+{
+
+    IPTModel* IPTModel::create(TermWeight _weight, size_t _K, size_t _P, Float _alpha, Float _eta, Float _lambda, size_t seed, bool scalarRng)
+    {
+        TMT_SWITCH_TW(_weight, scalarRng, PTModel, _K, _P, _alpha, _eta, _lambda, seed);
+    }
+}
```
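`TMT_SWITCH_TW` is defined elsewhere in tomotopy; judging from its arguments, it dispatches on the runtime `TermWeight` (and on `scalarRng` for the generator type) to the matching `PTModel` template instantiation. Roughly, and only as an illustration of the term-weight half of that dispatch (the RNG switch is omitted):

```cpp
#include "PTModel.hpp"

namespace tomoto
{
    // Hypothetical hand-written equivalent of the term-weight switch.
    template<typename _RandGen>
    IPTModel* createPT(TermWeight _weight, size_t _K, size_t _P,
        Float _alpha, Float _eta, Float _lambda, size_t seed)
    {
        switch (_weight)
        {
        case TermWeight::one:
            return new PTModel<TermWeight::one, _RandGen>(_K, _P, _alpha, _eta, _lambda, seed);
        case TermWeight::idf:
            return new PTModel<TermWeight::idf, _RandGen>(_K, _P, _alpha, _eta, _lambda, seed);
        case TermWeight::pmi:
            return new PTModel<TermWeight::pmi, _RandGen>(_K, _P, _alpha, _eta, _lambda, seed);
        }
        return nullptr;
    }
}
```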
**data/vendor/tomotopy/src/TopicModel/PTModel.hpp** (new file)

```diff
@@ -0,0 +1,273 @@
+#pragma once
+#include "LDAModel.hpp"
+#include "PT.h"
+
+/*
+Implementation of Pseudo-document topic model using Gibbs sampling by bab2min
+
+Zuo, Y., Wu, J., Zhang, H., Lin, H., Wang, F., Xu, K., & Xiong, H. (2016, August). Topic modeling of short texts: A pseudo-document view. In Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining (pp. 2105-2114).
+*/
+
+namespace tomoto
+{
+    template<TermWeight _tw>
+    struct ModelStatePTM : public ModelStateLDA<_tw>
+    {
+        using WeightType = typename ModelStateLDA<_tw>::WeightType;
+
+        Eigen::Array<Float, -1, 1> pLikelihood;
+        Eigen::ArrayXi numDocsByPDoc;
+        Eigen::Matrix<WeightType, -1, -1> numByTopicPDoc;
+
+        //DEFINE_SERIALIZER_AFTER_BASE(ModelStateLDA<_tw>);
+    };
+
+    template<TermWeight _tw, typename _RandGen,
+        typename _Interface = IPTModel,
+        typename _Derived = void,
+        typename _DocType = DocumentPTM<_tw>,
+        typename _ModelState = ModelStatePTM<_tw>>
+    class PTModel : public LDAModel<_tw, _RandGen, flags::continuous_doc_data | flags::partitioned_multisampling, _Interface,
+        typename std::conditional<std::is_same<_Derived, void>::value, PTModel<_tw, _RandGen>, _Derived>::type,
+        _DocType, _ModelState>
+    {
+    protected:
+        using DerivedClass = typename std::conditional<std::is_same<_Derived, void>::value, PTModel<_tw, _RandGen>, _Derived>::type;
+        using BaseClass = LDAModel<_tw, _RandGen, flags::continuous_doc_data | flags::partitioned_multisampling, _Interface, DerivedClass, _DocType, _ModelState>;
+        friend BaseClass;
+        friend typename BaseClass::BaseClass;
+        using WeightType = typename BaseClass::WeightType;
+
+        static constexpr char TMID[] = "PTM";
+
+        uint64_t numPDocs;
+        Float lambda;
+        uint32_t pseudoDocSamplingInterval = 10;
+
+        void optimizeParameters(ThreadPool& pool, _ModelState* localData, _RandGen* rgs)
+        {
+            const auto K = this->K;
+            for (size_t i = 0; i < 10; ++i)
+            {
+                Float denom = this->calcDigammaSum(&pool, [&](size_t i) { return this->globalState.numByTopicPDoc.col(i).sum(); }, numPDocs, this->alphas.sum());
+                for (size_t k = 0; k < K; ++k)
+                {
+                    Float nom = this->calcDigammaSum(&pool, [&](size_t i) { return this->globalState.numByTopicPDoc(k, i);}, numPDocs, this->alphas(k));
+                    this->alphas(k) = std::max(nom / denom * this->alphas(k), 1e-5f);
+                }
+            }
+        }
+
+        void samplePseudoDoc(ThreadPool* pool, _ModelState& ld, _RandGen& rgs, _DocType& doc) const
+        {
+            if (doc.getSumWordWeight() == 0) return;
+            Eigen::Array<WeightType, -1, 1> docTopicDist = Eigen::Array<WeightType, -1, 1>::Zero(this->K);
+            for (size_t i = 0; i < doc.words.size(); ++i)
+            {
+                if (doc.words[i] >= this->realV) continue;
+                this->template addWordTo<-1>(ld, doc, i, doc.words[i], doc.Zs[i]);
+                typename std::conditional<_tw != TermWeight::one, float, int32_t>::type weight
+                    = _tw != TermWeight::one ? doc.wordWeights[i] : 1;
+                docTopicDist[doc.Zs[i]] += weight;
+            }
+            --ld.numDocsByPDoc[doc.pseudoDoc];
+
+            if (pool)
+            {
+                std::vector<std::future<void>> futures;
+                for (size_t w = 0; w < pool->getNumWorkers(); ++w)
+                {
+                    futures.emplace_back(pool->enqueue([&](size_t, size_t w)
+                    {
+                        for (size_t p = w; p < numPDocs; p += pool->getNumWorkers())
+                        {
+                            Float ax = math::lgammaSubt(ld.numByTopicPDoc.col(p).array().template cast<Float>() + this->alphas.array(), docTopicDist.template cast<Float>()).sum();
+                            Float bx = math::lgammaSubt(ld.numByTopicPDoc.col(p).sum() + this->alphas.sum(), docTopicDist.sum());
+                            ld.pLikelihood[p] = ax - bx;
+                        }
+                    }, w));
+                }
+                for (auto& f : futures) f.get();
+            }
+            else
+            {
+                for (size_t p = 0; p < numPDocs; ++p)
+                {
+                    Float ax = math::lgammaSubt(ld.numByTopicPDoc.col(p).array().template cast<Float>() + this->alphas.array(), docTopicDist.template cast<Float>()).sum();
+                    Float bx = math::lgammaSubt(ld.numByTopicPDoc.col(p).sum() + this->alphas.sum(), docTopicDist.sum());
+                    ld.pLikelihood[p] = ax - bx;
+                }
+            }
+            ld.pLikelihood = (ld.pLikelihood - ld.pLikelihood.maxCoeff()).exp();
+            ld.pLikelihood *= ld.numDocsByPDoc.template cast<Float>() + lambda;
+
+            sample::prefixSum(ld.pLikelihood.data(), numPDocs);
+            doc.pseudoDoc = sample::sampleFromDiscreteAcc(ld.pLikelihood.data(), ld.pLikelihood.data() + numPDocs, rgs);
+
+            ++ld.numDocsByPDoc[doc.pseudoDoc];
+            doc.numByTopic.init(ld.numByTopicPDoc.col(doc.pseudoDoc).data(), this->K, 1);
+            for (size_t i = 0; i < doc.words.size(); ++i)
+            {
+                if (doc.words[i] >= this->realV) continue;
+                this->template addWordTo<1>(ld, doc, i, doc.words[i], doc.Zs[i]);
+            }
+        }
+
+        template<ParallelScheme _ps, bool _infer, typename _DocIter>
+        void performSamplingGlobal(ThreadPool* pool, _ModelState& globalState, _RandGen* rgs,
+            _DocIter docFirst, _DocIter docLast) const
+        {
+            if (this->globalStep % pseudoDocSamplingInterval) return;
+            for (; docFirst != docLast; ++docFirst)
+            {
+                samplePseudoDoc(pool, globalState, rgs[0], *docFirst);
+            }
+        }
+
+        template<typename _DocIter>
+        double getLLDocs(_DocIter _first, _DocIter _last) const
+        {
+            double ll = 0;
+            // doc-topic distribution
+            for (; _first != _last; ++_first)
+            {
+                auto& doc = *_first;
+            }
+            return ll;
+        }
+
+        double getLLRest(const _ModelState& ld) const
+        {
+            double ll = BaseClass::getLLRest(ld);
+            const size_t V = this->realV;
+            ll -= math::lgammaT(ld.numDocsByPDoc.sum() + lambda * numPDocs) - math::lgammaT(lambda * numPDocs);
+            // pseudo_doc-topic distribution
+            for (size_t p = 0; p < numPDocs; ++p)
+            {
+                ll += math::lgammaT(ld.numDocsByPDoc[p] + lambda) - math::lgammaT(lambda);
+                ll -= math::lgammaT(ld.numByTopicPDoc.col(p).sum() + this->alphas.sum()) - math::lgammaT(this->alphas.sum());
+                for (Tid k = 0; k < this->K; ++k)
+                {
+                    ll += math::lgammaT(ld.numByTopicPDoc(k, p) + this->alphas[k]) - math::lgammaT(this->alphas[k]);
+                }
+            }
+            return ll;
+        }
+
+        void prepareDoc(_DocType& doc, size_t docId, size_t wordSize) const
+        {
+            sortAndWriteOrder(doc.words, doc.wOrder);
+            doc.numByTopic.init((WeightType*)this->globalState.numByTopicPDoc.col(0).data(), this->K, 1);
+            doc.Zs = tvector<Tid>(wordSize);
+            if (_tw != TermWeight::one) doc.wordWeights.resize(wordSize);
+        }
+
+        void initGlobalState(bool initDocs)
+        {
+            this->alphas.resize(this->K);
+            this->alphas.array() = this->alpha;
+            this->globalState.pLikelihood = Eigen::Matrix<Float, -1, 1>::Zero(numPDocs);
+            this->globalState.numDocsByPDoc = Eigen::ArrayXi::Zero(numPDocs);
+            this->globalState.numByTopicPDoc = Eigen::Matrix<WeightType, -1, -1>::Zero(this->K, numPDocs);
+            BaseClass::initGlobalState(initDocs);
+        }
+
+        struct Generator
+        {
+            std::uniform_int_distribution<uint64_t> psi;
+            std::uniform_int_distribution<Tid> theta;
+        };
+
+        Generator makeGeneratorForInit(const _DocType*) const
+        {
+            return Generator{
+                std::uniform_int_distribution<uint64_t>{0, numPDocs - 1},
+                std::uniform_int_distribution<Tid>{0, (Tid)(this->K - 1)}
+            };
+        }
+
+        template<bool _Infer>
+        void updateStateWithDoc(Generator& g, _ModelState& ld, _RandGen& rgs, _DocType& doc, size_t i) const
+        {
+            if (i == 0)
+            {
+                doc.pseudoDoc = g.psi(rgs);
+                ++ld.numDocsByPDoc[doc.pseudoDoc];
+                doc.numByTopic.init(ld.numByTopicPDoc.col(doc.pseudoDoc).data(), this->K, 1);
+            }
+            auto& z = doc.Zs[i];
+            auto w = doc.words[i];
+            if (this->etaByTopicWord.size())
+            {
+                auto col = this->etaByTopicWord.col(w);
+                z = sample::sampleFromDiscrete(col.data(), col.data() + col.size(), rgs);
+            }
+            else
+            {
+                z = g.theta(rgs);
+            }
+            this->template addWordTo<1>(ld, doc, i, w, z);
+        }
+
+        template<ParallelScheme _ps, bool _infer, typename _DocIter, typename _ExtraDocData>
+        void performSampling(ThreadPool& pool, _ModelState* localData, _RandGen* rgs, std::vector<std::future<void>>& res,
+            _DocIter docFirst, _DocIter docLast, const _ExtraDocData& edd) const
+        {
+            // single-threaded sampling
+            if (_ps == ParallelScheme::none)
+            {
+                forShuffled((size_t)std::distance(docFirst, docLast), rgs[0](), [&](size_t id)
+                {
+                    static_cast<const DerivedClass*>(this)->presampleDocument(docFirst[id], id, *localData, *rgs, this->globalStep);
+                    static_cast<const DerivedClass*>(this)->template sampleDocument<_ps, _infer>(
+                        docFirst[id], edd, id,
+                        *localData, *rgs, this->globalStep, 0);
+
+                });
+            }
+            // multi-threaded sampling on partition and update into global
+            else if (_ps == ParallelScheme::partition)
+            {
+                const size_t chStride = pool.getNumWorkers();
+                for (size_t i = 0; i < chStride; ++i)
+                {
+                    res = pool.enqueueToAll([&, i, chStride](size_t partitionId)
+                    {
+                        forShuffled((size_t)std::distance(docFirst, docLast), rgs[partitionId](), [&](size_t id)
+                        {
+                            if ((docFirst[id].pseudoDoc + partitionId) % chStride != i) return;
+                            static_cast<const DerivedClass*>(this)->template sampleDocument<_ps, _infer>(
+                                docFirst[id], edd, id,
+                                localData[partitionId], rgs[partitionId], this->globalStep, partitionId
+                            );
+                        });
+                    });
+                    for (auto& r : res) r.get();
+                    res.clear();
+                }
+            }
+            else
+            {
+                throw std::runtime_error{ "Unsupported ParallelScheme" };
+            }
+        }
+
+    public:
+        DEFINE_SERIALIZER_AFTER_BASE_WITH_VERSION(BaseClass, 0, numPDocs, lambda);
+        DEFINE_TAGGED_SERIALIZER_AFTER_BASE_WITH_VERSION(BaseClass, 1, 0x00010001, numPDocs, lambda);
+
+        PTModel(size_t _K = 1, size_t _P = 100, Float _alpha = 1.0, Float _eta = 0.01, Float _lambda = 0.01,
+            size_t _rg = std::random_device{}())
+            : BaseClass(_K, _alpha, _eta, _rg), numPDocs(_P), lambda(_lambda)
+        {
+        }
+
+        void updateDocs()
+        {
+            for (auto& doc : this->docs)
+            {
+                doc.template update<>(this->getTopicDocPtr(doc.pseudoDoc), *static_cast<DerivedClass*>(this));
+            }
+        }
+    };
+}
```
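Reading `samplePseudoDoc` above, and assuming `math::lgammaSubt(x, d)` computes `lgamma(x + d) - lgamma(x)`, the collapsed Gibbs update that reassigns document d to pseudo-document p (with d's words first removed from the counts) is:

```latex
P(p_d = p \mid \cdot) \propto (N_p + \lambda)
  \cdot \frac{\Gamma\left(n_{p} + \sum_k \alpha_k\right)}
             {\Gamma\left(n_{p} + \sum_k \alpha_k + m_{d}\right)}
  \cdot \prod_{k=1}^{K}
        \frac{\Gamma\left(n_{p,k} + \alpha_k + m_{d,k}\right)}
             {\Gamma\left(n_{p,k} + \alpha_k\right)}
```

Here N_p is the number of documents currently assigned to pseudo-document p (`numDocsByPDoc`), n_{p,k} its topic-k count with the document removed (`numByTopicPDoc`), m_{d,k} the document's own topic counts (`docTopicDist`), and n_p, m_d the corresponding sums over topics. In the code, `ax` is the log of the product term, `bx` the log of the denominator ratio, subtracting `maxCoeff()` before `exp()` is the usual overflow guard, and `prefixSum` plus `sampleFromDiscreteAcc` draw the new assignment.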