torch-rechub 0.0.1__py3-none-any.whl → 0.0.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- torch_rechub/__init__.py +14 -0
- torch_rechub/basic/activation.py +3 -1
- torch_rechub/basic/callback.py +2 -2
- torch_rechub/basic/features.py +38 -8
- torch_rechub/basic/initializers.py +92 -0
- torch_rechub/basic/layers.py +800 -46
- torch_rechub/basic/loss_func.py +223 -0
- torch_rechub/basic/metaoptimizer.py +76 -0
- torch_rechub/basic/metric.py +251 -0
- torch_rechub/models/generative/__init__.py +6 -0
- torch_rechub/models/generative/hllm.py +249 -0
- torch_rechub/models/generative/hstu.py +189 -0
- torch_rechub/models/matching/__init__.py +13 -0
- torch_rechub/models/matching/comirec.py +193 -0
- torch_rechub/models/matching/dssm.py +72 -0
- torch_rechub/models/matching/dssm_facebook.py +77 -0
- torch_rechub/models/matching/dssm_senet.py +87 -0
- torch_rechub/models/matching/gru4rec.py +85 -0
- torch_rechub/models/matching/mind.py +103 -0
- torch_rechub/models/matching/narm.py +82 -0
- torch_rechub/models/matching/sasrec.py +143 -0
- torch_rechub/models/matching/sine.py +148 -0
- torch_rechub/models/matching/stamp.py +81 -0
- torch_rechub/models/matching/youtube_dnn.py +75 -0
- torch_rechub/models/matching/youtube_sbc.py +98 -0
- torch_rechub/models/multi_task/__init__.py +5 -2
- torch_rechub/models/multi_task/aitm.py +83 -0
- torch_rechub/models/multi_task/esmm.py +19 -8
- torch_rechub/models/multi_task/mmoe.py +18 -12
- torch_rechub/models/multi_task/ple.py +41 -29
- torch_rechub/models/multi_task/shared_bottom.py +3 -2
- torch_rechub/models/ranking/__init__.py +13 -2
- torch_rechub/models/ranking/afm.py +65 -0
- torch_rechub/models/ranking/autoint.py +102 -0
- torch_rechub/models/ranking/bst.py +61 -0
- torch_rechub/models/ranking/dcn.py +38 -0
- torch_rechub/models/ranking/dcn_v2.py +59 -0
- torch_rechub/models/ranking/deepffm.py +131 -0
- torch_rechub/models/ranking/deepfm.py +8 -7
- torch_rechub/models/ranking/dien.py +191 -0
- torch_rechub/models/ranking/din.py +31 -19
- torch_rechub/models/ranking/edcn.py +101 -0
- torch_rechub/models/ranking/fibinet.py +42 -0
- torch_rechub/models/ranking/widedeep.py +6 -6
- torch_rechub/trainers/__init__.py +4 -2
- torch_rechub/trainers/ctr_trainer.py +191 -0
- torch_rechub/trainers/match_trainer.py +239 -0
- torch_rechub/trainers/matching.md +3 -0
- torch_rechub/trainers/mtl_trainer.py +137 -23
- torch_rechub/trainers/seq_trainer.py +293 -0
- torch_rechub/utils/__init__.py +0 -0
- torch_rechub/utils/data.py +492 -0
- torch_rechub/utils/hstu_utils.py +198 -0
- torch_rechub/utils/match.py +457 -0
- torch_rechub/utils/mtl.py +136 -0
- torch_rechub/utils/onnx_export.py +353 -0
- torch_rechub-0.0.4.dist-info/METADATA +391 -0
- torch_rechub-0.0.4.dist-info/RECORD +62 -0
- {torch_rechub-0.0.1.dist-info → torch_rechub-0.0.4.dist-info}/WHEEL +1 -2
- {torch_rechub-0.0.1.dist-info → torch_rechub-0.0.4.dist-info/licenses}/LICENSE +1 -1
- torch_rechub/basic/utils.py +0 -168
- torch_rechub/trainers/trainer.py +0 -111
- torch_rechub-0.0.1.dist-info/METADATA +0 -105
- torch_rechub-0.0.1.dist-info/RECORD +0 -26
- torch_rechub-0.0.1.dist-info/top_level.txt +0 -1
torch_rechub/__init__.py
CHANGED
torch_rechub/basic/activation.py
CHANGED
@@ -30,7 +30,7 @@ def activation_layer(act_name):
 
     Args:
         act_name: str or nn.Module, name of activation function
-
+
     Returns:
         act_layer: activation layer
     """
@@ -45,6 +45,8 @@ def activation_layer(act_name):
            act_layer = nn.PReLU()
        elif act_name.lower() == "softmax":
            act_layer = nn.Softmax(dim=1)
+        elif act_name.lower() == 'leakyrelu':
+            act_layer = nn.LeakyReLU()
    elif issubclass(act_name, nn.Module):
        act_layer = act_name()
    else:
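
In practice, the new branch lets the layer factory resolve the string 'leakyrelu'; a minimal usage sketch (assuming activation_layer is imported from torch_rechub.basic.activation):

# Hedged usage sketch of the newly supported activation name.
from torch_rechub.basic.activation import activation_layer

act = activation_layer("leakyrelu")  # after this change, returns nn.LeakyReLU()
print(act)                           # LeakyReLU(negative_slope=0.01)
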
torch_rechub/basic/callback.py
CHANGED
@@ -3,7 +3,7 @@ import copy
 
 class EarlyStopper(object):
     """Early stops the training if validation loss doesn't improve after a given patience.
-
+
     Args:
         patience (int): How long to wait after last time validation auc improved.
     """
@@ -30,4 +30,4 @@ class EarlyStopper(object):
             self.trial_counter += 1
             return False
         else:
-            return True
+            return True
torch_rechub/basic/features.py
CHANGED
@@ -1,4 +1,5 @@
-from .
+from ..utils.data import get_auto_embedding_dim
+from .initializers import RandomNormal
 
 
 class SequenceFeature(object):
@@ -13,17 +14,29 @@ class SequenceFeature(object):
         embed_dim (int): embedding vector's length
         pooling (str): pooling method, support `["mean", "sum", "concat"]` (default=`"mean"`)
         shared_with (str): the another feature name which this feature will shared with embedding.
+        padding_idx (int, optional): If specified, the entries at padding_idx will be masked 0 in InputMask Layer.
+        initializer(Initializer): Initializer the embedding layer weight.
     """
 
-    def __init__(self, name, vocab_size, embed_dim=None, pooling="mean", shared_with=None):
+    def __init__(self, name, vocab_size, embed_dim=None, pooling="mean", shared_with=None, padding_idx=None, initializer=RandomNormal(0, 0.0001)):
         self.name = name
         self.vocab_size = vocab_size
-        if embed_dim
+        if embed_dim is None:
             self.embed_dim = get_auto_embedding_dim(vocab_size)
         else:
             self.embed_dim = embed_dim
         self.pooling = pooling
         self.shared_with = shared_with
+        self.padding_idx = padding_idx
+        self.initializer = initializer
+
+    def __repr__(self):
+        return f'<SequenceFeature {self.name} with Embedding shape ({self.vocab_size}, {self.embed_dim})>'
+
+    def get_embedding_layer(self):
+        if not hasattr(self, 'embed'):
+            self.embed = self.initializer(self.vocab_size, self.embed_dim)
+        return self.embed
 
 
 class SparseFeature(object):
@@ -33,15 +46,29 @@ class SparseFeature(object):
         name (str): feature's name.
         vocab_size (int): vocabulary size of embedding table.
         embed_dim (int): embedding vector's length
+        shared_with (str): the another feature name which this feature will shared with embedding.
+        padding_idx (int, optional): If specified, the entries at padding_idx will be masked 0 in InputMask Layer.
+        initializer(Initializer): Initializer the embedding layer weight.
     """
 
-    def __init__(self, name, vocab_size, embed_dim=None):
+    def __init__(self, name, vocab_size, embed_dim=None, shared_with=None, padding_idx=None, initializer=RandomNormal(0, 0.0001)):
         self.name = name
         self.vocab_size = vocab_size
-        if embed_dim
+        if embed_dim is None:
             self.embed_dim = get_auto_embedding_dim(vocab_size)
         else:
             self.embed_dim = embed_dim
+        self.shared_with = shared_with
+        self.padding_idx = padding_idx
+        self.initializer = initializer
+
+    def __repr__(self):
+        return f'<SparseFeature {self.name} with Embedding shape ({self.vocab_size}, {self.embed_dim})>'
+
+    def get_embedding_layer(self):
+        if not hasattr(self, 'embed'):
+            self.embed = self.initializer(self.vocab_size, self.embed_dim)
+        return self.embed
 
 
 class DenseFeature(object):
@@ -49,9 +76,12 @@ class DenseFeature(object):
 
     Args:
         name (str): feature's name.
-        embed_dim (int): embedding vector's length, the value fixed `1`.
+        embed_dim (int): embedding vector's length, the value fixed `1`. If you put a vector (torch.tensor) , replace the embed_dim with your vector dimension.
     """
 
-    def __init__(self, name):
+    def __init__(self, name, embed_dim=1):
         self.name = name
-        self.embed_dim =
+        self.embed_dim = embed_dim
+
+    def __repr__(self):
+        return f'<DenseFeature {self.name}>'
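
A minimal sketch of the extended feature constructors after this change; the feature names, vocabulary sizes and dimensions below are hypothetical, not taken from the package:

# Hedged usage sketch; 'user_id' / 'hist_item_ids' and all sizes are made-up examples.
from torch_rechub.basic.features import DenseFeature, SparseFeature, SequenceFeature
from torch_rechub.basic.initializers import XavierUniform

age = DenseFeature("age")  # embed_dim now defaults to 1 instead of being hard-coded
user_id = SparseFeature("user_id", vocab_size=10000, embed_dim=16, initializer=XavierUniform())
hist = SequenceFeature("hist_item_ids", vocab_size=5000, embed_dim=16, pooling="mean", padding_idx=0)
embedding = user_id.get_embedding_layer()  # lazily builds and caches an nn.Embedding(10000, 16)
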
torch_rechub/basic/initializers.py
ADDED
@@ -0,0 +1,92 @@
+import torch
+
+
+class RandomNormal(object):
+    """Returns an embedding initialized with a normal distribution.
+
+    Args:
+        mean (float): the mean of the normal distribution
+        std (float): the standard deviation of the normal distribution
+    """
+
+    def __init__(self, mean=0.0, std=1.0):
+        self.mean = mean
+        self.std = std
+
+    def __call__(self, vocab_size, embed_dim):
+        embed = torch.nn.Embedding(vocab_size, embed_dim)
+        torch.nn.init.normal_(embed.weight, self.mean, self.std)
+        return embed
+
+
+class RandomUniform(object):
+    """Returns an embedding initialized with a uniform distribution.
+
+    Args:
+        minval (float): Lower bound of the range of random values of the uniform distribution.
+        maxval (float): Upper bound of the range of random values of the uniform distribution.
+    """
+
+    def __init__(self, minval=0.0, maxval=1.0):
+        self.minval = minval
+        self.maxval = maxval
+
+    def __call__(self, vocab_size, embed_dim):
+        embed = torch.nn.Embedding(vocab_size, embed_dim)
+        torch.nn.init.uniform_(embed.weight, self.minval, self.maxval)
+        return embed
+
+
+class XavierNormal(object):
+    """Returns an embedding initialized with the method described in
+    `Understanding the difficulty of training deep feedforward neural networks`
+    - Glorot, X. & Bengio, Y. (2010), using a uniform distribution.
+
+    Args:
+        gain (float): stddev = gain*sqrt(2 / (fan_in + fan_out))
+    """
+
+    def __init__(self, gain=1.0):
+        self.gain = gain
+
+    def __call__(self, vocab_size, embed_dim):
+        embed = torch.nn.Embedding(vocab_size, embed_dim)
+        torch.nn.init.xavier_normal_(embed.weight, self.gain)
+        return embed
+
+
+class XavierUniform(object):
+    """Returns an embedding initialized with the method described in
+    `Understanding the difficulty of training deep feedforward neural networks`
+    - Glorot, X. & Bengio, Y. (2010), using a uniform distribution.
+
+    Args:
+        gain (float): stddev = gain*sqrt(6 / (fan_in + fan_out))
+    """
+
+    def __init__(self, gain=1.0):
+        self.gain = gain
+
+    def __call__(self, vocab_size, embed_dim):
+        embed = torch.nn.Embedding(vocab_size, embed_dim)
+        torch.nn.init.xavier_uniform_(embed.weight, self.gain)
+        return embed
+
+
+class Pretrained(object):
+    """Creates Embedding instance from given 2-dimensional FloatTensor.
+
+    Args:
+        embedding_weight(Tensor or ndarray or List[List[int]]): FloatTensor containing weights for the Embedding.
+            First dimension is being passed to Embedding as ``num_embeddings``, second as ``embedding_dim``.
+        freeze (boolean, optional): If ``True``, the tensor does not get updated in the learning process.
+    """
+
+    def __init__(self, embedding_weight, freeze=True):
+        self.embedding_weight = torch.FloatTensor(embedding_weight)
+        self.freeze = freeze
+
+    def __call__(self, vocab_size, embed_dim):
+        assert vocab_size == self.embedding_weight.shape[0] and embed_dim == self.embedding_weight.shape[1]
+        embed = torch.nn.Embedding.from_pretrained(self.embedding_weight, freeze=self.freeze)
+        return embed
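
Each initializer added above is a callable that builds a torch.nn.Embedding of the requested shape; a short, hedged usage sketch (sizes and weight values are illustrative only):

# Hedged usage sketch of the initializer classes.
from torch_rechub.basic.initializers import RandomNormal, Pretrained

emb = RandomNormal(mean=0.0, std=0.0001)(vocab_size=100, embed_dim=8)    # weights drawn from N(0, 1e-4)
weights = [[0.01] * 8 for _ in range(100)]                               # hypothetical pretrained table, shape (100, 8)
frozen = Pretrained(weights, freeze=True)(vocab_size=100, embed_dim=8)   # weights copied and not trained
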