PyPI - unike - Versions diffs - 3.0.1__py3-none-any.whl - Mend

unike 3.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

unike/__init__.py +5 -0
unike/config/HPOTrainer.py +305 -0
unike/config/Tester.py +385 -0
unike/config/Trainer.py +519 -0
unike/config/TrainerAccelerator.py +39 -0
unike/config/__init__.py +37 -0
unike/data/BernSampler.py +168 -0
unike/data/CompGCNSampler.py +140 -0
unike/data/CompGCNTestSampler.py +84 -0
unike/data/KGEDataLoader.py +315 -0
unike/data/KGReader.py +138 -0
unike/data/RGCNSampler.py +261 -0
unike/data/RGCNTestSampler.py +208 -0
unike/data/RevSampler.py +78 -0
unike/data/TestSampler.py +189 -0
unike/data/TradSampler.py +122 -0
unike/data/TradTestSampler.py +87 -0
unike/data/UniSampler.py +145 -0
unike/data/__init__.py +47 -0
unike/module/BaseModule.py +130 -0
unike/module/__init__.py +20 -0
unike/module/loss/CompGCNLoss.py +96 -0
unike/module/loss/Loss.py +26 -0
unike/module/loss/MarginLoss.py +148 -0
unike/module/loss/RGCNLoss.py +117 -0
unike/module/loss/SigmoidLoss.py +145 -0
unike/module/loss/SoftplusLoss.py +145 -0
unike/module/loss/__init__.py +35 -0
unike/module/model/Analogy.py +237 -0
unike/module/model/CompGCN.py +562 -0
unike/module/model/ComplEx.py +235 -0
unike/module/model/DistMult.py +276 -0
unike/module/model/HolE.py +308 -0
unike/module/model/Model.py +107 -0
unike/module/model/RESCAL.py +309 -0
unike/module/model/RGCN.py +304 -0
unike/module/model/RotatE.py +303 -0
unike/module/model/SimplE.py +237 -0
unike/module/model/TransD.py +458 -0
unike/module/model/TransE.py +290 -0
unike/module/model/TransH.py +322 -0
unike/module/model/TransR.py +402 -0
unike/module/model/__init__.py +60 -0
unike/module/strategy/CompGCNSampling.py +140 -0
unike/module/strategy/NegativeSampling.py +138 -0
unike/module/strategy/RGCNSampling.py +134 -0
unike/module/strategy/Strategy.py +26 -0
unike/module/strategy/__init__.py +29 -0
unike/utils/EarlyStopping.py +94 -0
unike/utils/Timer.py +74 -0
unike/utils/WandbLogger.py +46 -0
unike/utils/__init__.py +26 -0
unike/utils/tools.py +118 -0
unike/version.py +1 -0
unike-3.0.1.dist-info/METADATA +101 -0
unike-3.0.1.dist-info/RECORD +59 -0
unike-3.0.1.dist-info/WHEEL +4 -0
unike-3.0.1.dist-info/entry_points.txt +2 -0
unike-3.0.1.dist-info/licenses/LICENSE +21 -0

unike/module/loss/SoftplusLoss.py ADDED Viewed

@@ -0,0 +1,145 @@
+# coding:utf-8
+#
+# unike/module/loss/SoftplusLoss.py
+#
+# git pull from OpenKE-PyTorch by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on May 7, 2023
+# updated by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on Jan 6, 2023
+#
+# 该脚本定义了 regularized logistic loss 损失函数.
+"""
+SoftplusLoss - 损失函数类，DistMult 经常应用这种损失函数完成模型学习。
+"""
+import torch
+import numpy as np
+import torch.nn as nn
+from typing import Any
+import torch.nn.functional as F
+from .Loss import Loss
+class SoftplusLoss(Loss):
+	"""
+	Softplus (regularized logistic) loss.
+
+	The original ``ComplEx`` paper :cite:`ComplEx` trains its model with this loss.
+
+	.. Note:: In :py:meth:`forward`, the scores of positive samples are expected to be larger than the scores of negative samples.
+
+	Example::
+
+		from unike.module.loss import SoftplusLoss
+		from unike.module.strategy import NegativeSampling
+		# define the loss function
+		model = NegativeSampling(
+			model = distmult,
+			loss = SoftplusLoss(),
+			batch_size = train_dataloader.get_batch_size(),
+			regul_rate = 1.0
+		)
+	"""
+	def __init__(
+		self,
+		adv_temperature: float | None = None):
+		"""Create a SoftplusLoss object.
+
+		:param adv_temperature: Temperature of the self-adversarial negative sampling proposed by RotatE. ``None`` (the default) disables self-adversarial weighting.
+		:type adv_temperature: float | None
+		"""
+		super().__init__()
+		#: Used in place of the logistic function; a :py:class:`torch.nn.Softplus`, which is a smooth approximation of ReLU.
+		self.criterion: torch.nn.Softplus = nn.Softplus()
+		#: Whether the self-adversarial negative sampling proposed by RotatE is enabled.
+		# Identity test: only ``None`` disables the feature, a temperature of 0.0 still enables it.
+		self.adv_flag: bool = adv_temperature is not None
+		if self.adv_flag:
+			#: Temperature of the self-adversarial negative sampling proposed by RotatE.
+			# Kept as a frozen Parameter (not a plain float), so it stays part of the module's parameters.
+			self.adv_temperature: torch.nn.parameter.Parameter = nn.Parameter(torch.Tensor([adv_temperature]), requires_grad = False)
+	def get_weights(
+		self,
+		n_score: torch.Tensor) -> torch.Tensor:
+		"""Compute the self-adversarial sampling distribution over negative samples (RotatE).
+
+		Reads ``self.adv_temperature``, which only exists when the object was created with a non-``None`` ``adv_temperature``.
+
+		:param n_score: Scores of the negative samples.
+		:type n_score: torch.Tensor
+		:returns: Softmax of ``n_score * adv_temperature`` over the last dimension, detached from the autograd graph.
+		:rtype: torch.Tensor
+		"""
+		return F.softmax(n_score * self.adv_temperature, dim = -1).detach()
+	def forward(
+		self,
+		p_score: torch.Tensor,
+		n_score: torch.Tensor) -> torch.Tensor:
+		"""Compute the softplus loss. Defines the computation performed at every call.
+
+		:py:class:`torch.nn.Module` subclasses must override :py:meth:`torch.nn.Module.forward`.
+
+		:param p_score: Scores of the positive samples.
+		:type p_score: torch.Tensor
+		:param n_score: Scores of the negative samples.
+		:type n_score: torch.Tensor
+		:returns: The loss value: the average of the positive term and the negative term.
+		:rtype: torch.Tensor
+		"""
+		positive_term = self.criterion(-p_score).mean()
+		negative_term = self.criterion(n_score)
+		if self.adv_flag:
+			# Weighted sum over the last dimension, then mean over the remaining ones.
+			negative_term = (self.get_weights(n_score) * negative_term).sum(dim = -1).mean()
+		else:
+			negative_term = negative_term.mean()
+		return (positive_term + negative_term) / 2
+	def predict(
+		self,
+		p_score: torch.Tensor,
+		n_score: torch.Tensor) -> np.ndarray:
+		"""Inference helper of SoftplusLoss.
+
+		:param p_score: Scores of the positive samples.
+		:type p_score: torch.Tensor
+		:param n_score: Scores of the negative samples.
+		:type n_score: torch.Tensor
+		:returns: The value returned by :py:meth:`forward`, moved to the CPU and converted to NumPy.
+		:rtype: numpy.ndarray
+		"""
+		score = self.forward(p_score, n_score)
+		# ``detach()`` is the supported replacement for the legacy ``.data`` attribute.
+		return score.detach().cpu().numpy()
+def get_softplus_loss_hpo_config() -> dict[str, dict[str, Any]]:
+	"""Return the default hyper-parameter optimization configuration of :py:class:`SoftplusLoss`.
+
+	The default configuration is::
+
+		parameters_dict = {
+			'loss': {
+				'value': 'SoftplusLoss'
+			},
+			'adv_temperature': {
+				'values': [1.0, 3.0, 6.0]
+			}
+		}
+
+	:returns: The default hyper-parameter optimization configuration of :py:class:`SoftplusLoss`; a new dictionary is built on every call.
+	:rtype: dict[str, dict[str, typing.Any]]
+	"""
+	loss_entry = {'value': 'SoftplusLoss'}
+	temperature_entry = {'values': [1.0, 3.0, 6.0]}
+	return {
+		'loss': loss_entry,
+		'adv_temperature': temperature_entry
+	}

unike/module/loss/__init__.py ADDED Viewed

@@ -0,0 +1,35 @@
+# coding:utf-8
+#
+# unike/module/loss/__init__.py
+#
+# git pull from OpenKE-PyTorch by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on May 7, 2023
+# updated by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on May 28, 2023
+#
+# This module defines the public interface of the loss sub-package.
+"""损失函数部分。"""
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+from .Loss import Loss
+from .MarginLoss import MarginLoss, get_margin_loss_hpo_config
+from .SigmoidLoss import SigmoidLoss, get_sigmoid_loss_hpo_config
+from .SoftplusLoss import SoftplusLoss, get_softplus_loss_hpo_config
+from .RGCNLoss import RGCNLoss, get_rgcn_loss_hpo_config
+from .CompGCNLoss import CompGCNLoss, get_compgcn_loss_hpo_config
+# Names exported by ``from unike.module.loss import *``: each loss class
+# followed by the helper returning its default HPO configuration.
+__all__ = [
+    'Loss',
+    'MarginLoss',
+    'get_margin_loss_hpo_config',
+    'SigmoidLoss',
+    'get_sigmoid_loss_hpo_config',
+    'SoftplusLoss',
+    'get_softplus_loss_hpo_config',
+    'RGCNLoss',
+    'get_rgcn_loss_hpo_config',
+    'CompGCNLoss',
+    'get_compgcn_loss_hpo_config'
+]

unike/module/model/Analogy.py ADDED Viewed

@@ -0,0 +1,237 @@
+# coding:utf-8
+#
+# unike/module/model/Analogy.py
+#
+# git pull from OpenKE-PyTorch by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on May 7, 2023
+# updated by LuYF-Lemon-love <luyanfeng_nlp@qq.com> on Jan 31, 2024
+#
+# This module defines the Analogy model.
+"""
+Analogy 类 - DistMult、HolE 和 ComplEx 的集大成者，效果与 HolE、ComplEx 差不多。
+"""
+import torch
+import typing
+import torch.nn as nn
+from .Model import Model
+from typing_extensions import override
+class Analogy(Model):
+	r"""
+	``Analogy`` :cite:`ANALOGY` was proposed in 2017. It unifies :py:class:`unike.module.model.DistMult`, :py:class:`unike.module.model.HolE` and :py:class:`unike.module.model.ComplEx`,
+	and performs about as well as :py:class:`unike.module.model.HolE` and :py:class:`unike.module.model.ComplEx`.
+
+	The scoring function is:
+
+	.. math::
+
+	    <\operatorname{Re}(\mathbf{h_c}),\operatorname{Re}(\mathbf{r_c}),\operatorname{Re}(\mathbf{t_c})>
+	        +<\operatorname{Re}(\mathbf{h_c}),\operatorname{Im}(\mathbf{r_c}),\operatorname{Im}(\mathbf{t_c})>
+	        +<\operatorname{Im}(\mathbf{h_c}),\operatorname{Re}(\mathbf{r_c}),\operatorname{Im}(\mathbf{t_c})>
+	        -<\operatorname{Im}(\mathbf{h_c}),\operatorname{Im}(\mathbf{r_c}),\operatorname{Re}(\mathbf{t_c})>
+	        +<\mathbf{h_d}, \mathbf{r_d}, \mathbf{t_d}>
+
+	The scoring function is the sum of the scoring functions of :py:class:`unike.module.model.DistMult` and :py:class:`unike.module.model.ComplEx`. :math:`< \mathbf{a}, \mathbf{b}, \mathbf{c} >` is the element-wise multi-linear dot product.
+	The score of a positive triple should be as large as possible and the score of a negative triple as small as possible. See :ref:`ANALOGY <analogy>` for more details.
+
+	Example::
+
+		from unike.config import Trainer, Tester
+		from unike.module.model import Analogy
+		from unike.module.loss import SoftplusLoss
+		from unike.module.strategy import NegativeSampling
+		# define the model
+		analogy = Analogy(
+			ent_tol = train_dataloader.get_ent_tol(),
+			rel_tol = train_dataloader.get_rel_tol(),
+			dim = 200
+		)
+		# define the loss function
+		model = NegativeSampling(
+			model = analogy,
+			loss = SoftplusLoss(),
+			batch_size = train_dataloader.get_batch_size(),
+			regul_rate = 1.0
+		)
+		# test the model
+		tester = Tester(model = analogy, data_loader = test_dataloader, use_gpu = True, device = 'cuda:1')
+		# train the model
+		trainer = Trainer(model = model, data_loader = train_dataloader,
+			epochs = 2000, lr = 0.5, opt_method = "adagrad", use_gpu = True, device = 'cuda:1',
+			tester = tester, test = True, valid_interval = 100,
+			log_interval = 100, save_interval = 100,
+			save_path = '../../checkpoint/analogy.pth', delta = 0.01)
+		trainer.run()
+	"""
+	def __init__(
+		self,
+		ent_tol: int,
+		rel_tol: int,
+		dim: int = 100):
+		"""Create an Analogy object.
+
+		:param ent_tol: Number of entities.
+		:type ent_tol: int
+		:param rel_tol: Number of relations.
+		:type rel_tol: int
+		:param dim: Base dimension of the entity and relation embeddings; the embedding tables are allocated with width ``dim * 4``.
+		:type dim: int
+		"""
+		super().__init__(ent_tol, rel_tol)
+		#: Base dimension of the entity and relation embeddings.
+		self.dim: int = dim
+		# Width dim * 4: _calc splits each vector into a ComplEx half (real + imaginary
+		# parts, dim each) and a DistMult half (dim * 2).
+		#: Entity embeddings, one row per entity.
+		self.ent_embeddings: torch.nn.Embedding = nn.Embedding(self.ent_tol, self.dim * 4)
+		#: Relation embeddings, one row per relation.
+		self.rel_embeddings: torch.nn.Embedding = nn.Embedding(self.rel_tol, self.dim * 4)
+		nn.init.xavier_uniform_(self.ent_embeddings.weight.data)
+		nn.init.xavier_uniform_(self.rel_embeddings.weight.data)
+	@override
+	def forward(
+		self,
+		triples: torch.Tensor,
+		negs: typing.Optional[torch.Tensor] = None,
+		mode: str = 'single') -> torch.Tensor:
+		"""
+		Define the computation performed at every call.
+
+		:py:class:`torch.nn.Module` subclasses must override :py:meth:`torch.nn.Module.forward`.
+
+		:param triples: The correct (positive) triples.
+		:type triples: torch.Tensor
+		:param negs: Negative samples, forwarded unchanged to ``tri2emb``; ``None`` when there are none.
+		:type negs: torch.Tensor | None
+		:param mode: Mode, forwarded unchanged to ``tri2emb``.
+		:type mode: str
+		:returns: Scores of the triples.
+		:rtype: torch.Tensor
+		"""
+		head_emb, relation_emb, tail_emb = self.tri2emb(triples, negs, mode)
+		return self._calc(head_emb, relation_emb, tail_emb)
+	def _calc(
+		self,
+		head_emb: torch.Tensor,
+		relation_emb: torch.Tensor,
+		tail_emb: torch.Tensor) -> torch.Tensor:
+		"""Compute the Analogy scoring function.
+
+		Each embedding is split in two along the last dimension: the first half is
+		split again into real and imaginary parts for the ComplEx term, the second
+		half feeds the DistMult term.
+
+		:param head_emb: Embeddings of the head entities.
+		:type head_emb: torch.Tensor
+		:param relation_emb: Embeddings of the relations.
+		:type relation_emb: torch.Tensor
+		:param tail_emb: Embeddings of the tail entities.
+		:type tail_emb: torch.Tensor
+		:returns: Scores of the triples (the last dimension is summed out).
+		:rtype: torch.Tensor
+		"""
+		head_complex, head_dist = torch.chunk(head_emb, 2, dim=-1)
+		h_re, h_im = torch.chunk(head_complex, 2, dim=-1)
+		relation_complex, relation_dist = torch.chunk(relation_emb, 2, dim=-1)
+		r_re, r_im = torch.chunk(relation_complex, 2, dim=-1)
+		tail_complex, tail_dist = torch.chunk(tail_emb, 2, dim=-1)
+		t_re, t_im = torch.chunk(tail_complex, 2, dim=-1)
+		complex_score = torch.sum(r_re * h_re * t_re +
+						  r_re * h_im * t_im +
+						  r_im * h_re * t_im -
+						  r_im * h_im * t_re, -1)
+		distmult_score = torch.sum(head_dist * tail_dist * relation_dist, -1)
+		return complex_score + distmult_score
+	@override
+	def predict(
+		self,
+		data: dict[str, typing.Union[torch.Tensor,str]],
+		mode: str) -> torch.Tensor:
+		"""Inference method of Analogy.
+
+		:param data: Batch data; only ``data["positive_sample"]`` is read.
+		:type data: dict[str, typing.Union[torch.Tensor,str]]
+		:param mode: Mode, forwarded unchanged to ``tri2emb``.
+		:type mode: str
+		:returns: Scores of the triples.
+		:rtype: torch.Tensor
+		"""
+		triples = data["positive_sample"]
+		head_emb, relation_emb, tail_emb = self.tri2emb(triples, mode=mode)
+		return self._calc(head_emb, relation_emb, tail_emb)
+	def regularization(
+		self,
+		data: dict[str, typing.Union[torch.Tensor, str]]) -> torch.Tensor:
+		"""L2 regularization (also known as weight decay), used in the loss function.
+
+		:param data: Batch data; the keys ``"positive_sample"``, ``"negative_sample"`` and ``"mode"`` are read.
+		:type data: dict[str, typing.Union[torch.Tensor, str]]
+		:returns: Regularization loss: the average of the mean squared embeddings of the positive and of the negative samples.
+		:rtype: torch.Tensor
+		"""
+		pos_sample = data["positive_sample"]
+		neg_sample = data["negative_sample"]
+		mode = data["mode"]
+		pos_head_emb, pos_relation_emb, pos_tail_emb = self.tri2emb(pos_sample)
+		if mode == "bern":
+			# In "bern" mode the negative sample is passed to tri2emb on its own.
+			neg_head_emb, neg_relation_emb, neg_tail_emb = self.tri2emb(neg_sample)
+		else:
+			# Otherwise it is passed together with the positive sample and the mode.
+			neg_head_emb, neg_relation_emb, neg_tail_emb = self.tri2emb(pos_sample, neg_sample, mode)
+		pos_regul = (torch.mean(pos_head_emb ** 2) +
+					 torch.mean(pos_relation_emb ** 2) +
+					 torch.mean(pos_tail_emb ** 2)) / 3
+		neg_regul = (torch.mean(neg_head_emb ** 2) +
+					 torch.mean(neg_relation_emb ** 2) +
+					 torch.mean(neg_tail_emb ** 2)) / 3
+		return (pos_regul + neg_regul) / 2
+def get_analogy_hpo_config() -> dict[str, dict[str, typing.Any]]:
+	"""Return the default hyper-parameter optimization configuration of :py:class:`Analogy`.
+
+	The default configuration is::
+
+		parameters_dict = {
+			'model': {
+				'value': 'Analogy'
+			},
+			'dim': {
+				'values': [50, 100, 200]
+			}
+		}
+
+	:returns: The default hyper-parameter optimization configuration of :py:class:`Analogy`; a new dictionary is built on every call.
+	:rtype: dict[str, dict[str, typing.Any]]
+	"""
+	model_entry = {'value': 'Analogy'}
+	dim_entry = {'values': [50, 100, 200]}
+	return {
+		'model': model_entry,
+		'dim': dim_entry
+	}