PyPI - nextrec - Versions diffs - 0.4.22__py3-none-any.whl → 0.4.24__py3-none-any.whl - Mend

nextrec 0.4.22__py3-none-any.whl → 0.4.24__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50)

nextrec/__version__.py +1 -1
nextrec/basic/layers.py +96 -46
nextrec/basic/metrics.py +128 -114
nextrec/basic/model.py +94 -91
nextrec/basic/summary.py +36 -2
nextrec/data/dataloader.py +2 -0
nextrec/data/preprocessor.py +137 -5
nextrec/loss/listwise.py +19 -6
nextrec/loss/pairwise.py +6 -4
nextrec/loss/pointwise.py +8 -6
nextrec/models/multi_task/aitm.py +0 -0
nextrec/models/multi_task/apg.py +0 -0
nextrec/models/multi_task/cross_stitch.py +0 -0
nextrec/models/multi_task/esmm.py +5 -28
nextrec/models/multi_task/mmoe.py +6 -28
nextrec/models/multi_task/pepnet.py +335 -0
nextrec/models/multi_task/ple.py +21 -40
nextrec/models/multi_task/poso.py +17 -39
nextrec/models/multi_task/share_bottom.py +5 -28
nextrec/models/multi_task/snr_trans.py +0 -0
nextrec/models/ranking/afm.py +3 -27
nextrec/models/ranking/autoint.py +5 -38
nextrec/models/ranking/dcn.py +1 -26
nextrec/models/ranking/dcn_v2.py +6 -34
nextrec/models/ranking/deepfm.py +2 -29
nextrec/models/ranking/dien.py +2 -28
nextrec/models/ranking/din.py +2 -27
nextrec/models/ranking/eulernet.py +3 -30
nextrec/models/ranking/ffm.py +0 -26
nextrec/models/ranking/fibinet.py +8 -32
nextrec/models/ranking/fm.py +0 -29
nextrec/models/ranking/lr.py +0 -30
nextrec/models/ranking/masknet.py +4 -30
nextrec/models/ranking/pnn.py +4 -28
nextrec/models/ranking/widedeep.py +0 -32
nextrec/models/ranking/xdeepfm.py +0 -30
nextrec/models/retrieval/dssm.py +4 -28
nextrec/models/retrieval/dssm_v2.py +4 -28
nextrec/models/retrieval/mind.py +2 -22
nextrec/models/retrieval/sdm.py +4 -24
nextrec/models/retrieval/youtube_dnn.py +4 -25
nextrec/models/sequential/hstu.py +0 -18
nextrec/utils/model.py +91 -4
nextrec/utils/types.py +35 -0
{nextrec-0.4.22.dist-info → nextrec-0.4.24.dist-info}/METADATA +8 -6
nextrec-0.4.24.dist-info/RECORD +86 -0
nextrec-0.4.22.dist-info/RECORD +0 -81
{nextrec-0.4.22.dist-info → nextrec-0.4.24.dist-info}/WHEEL +0 -0
{nextrec-0.4.22.dist-info → nextrec-0.4.24.dist-info}/entry_points.txt +0 -0
{nextrec-0.4.22.dist-info → nextrec-0.4.24.dist-info}/licenses/LICENSE +0 -0

nextrec/loss/listwise.py CHANGED Viewed

@@ -2,10 +2,11 @@
 Listwise loss functions for ranking and contrastive training.
 Date: create on 27/10/2025
-Checkpoint: edit on 29/11/2025
+Checkpoint: edit on 29/12/2025
 Author: Yang Zhou, zyaztec@gmail.com
 """
+from typing import Literal
 import torch
 import torch.nn as nn
 import torch.nn.functional as F
@@ -16,7 +17,7 @@ class SampledSoftmaxLoss(nn.Module):
     Softmax over one positive and multiple sampled negatives.
     """
-    def __init__(self, reduction: str = "mean"):
+    def __init__(self, reduction: Literal["mean", "sum", "none"] = "mean"):
         super().__init__()
         self.reduction = reduction
@@ -37,7 +38,11 @@ class InfoNCELoss(nn.Module):
     InfoNCE loss for contrastive learning with one positive and many negatives.
     """
-    def __init__(self, temperature: float = 0.07, reduction: str = "mean"):
+    def __init__(
+        self,
+        temperature: float = 0.07,
+        reduction: Literal["mean", "sum", "none"] = "mean",
+    ):
         super().__init__()
         self.temperature = temperature
         self.reduction = reduction
@@ -61,7 +66,11 @@ class ListNetLoss(nn.Module):
     Reference: Cao et al. (ICML 2007)
     """
-    def __init__(self, temperature: float = 1.0, reduction: str = "mean"):
+    def __init__(
+        self,
+        temperature: float = 1.0,
+        reduction: Literal["mean", "sum", "none"] = "mean",
+    ):
         super().__init__()
         self.temperature = temperature
         self.reduction = reduction
@@ -84,7 +93,7 @@ class ListMLELoss(nn.Module):
     Reference: Xia et al. (ICML 2008)
     """
-    def __init__(self, reduction: str = "mean"):
+    def __init__(self, reduction: Literal["mean", "sum", "none"] = "mean"):
         super().__init__()
         self.reduction = reduction
@@ -117,7 +126,11 @@ class ApproxNDCGLoss(nn.Module):
     Reference: Qin et al. (2010)
     """
-    def __init__(self, temperature: float = 1.0, reduction: str = "mean"):
+    def __init__(
+        self,
+        temperature: float = 1.0,
+        reduction: Literal["mean", "sum", "none"] = "mean",
+    ):
         super().__init__()
         self.temperature = temperature
         self.reduction = reduction

nextrec/loss/pairwise.py CHANGED Viewed

@@ -2,7 +2,7 @@
 Pairwise loss functions for learning-to-rank and matching tasks.
 Date: create on 27/10/2025
-Checkpoint: edit on 29/11/2025
+Checkpoint: edit on 29/12/2025
 Author: Yang Zhou, zyaztec@gmail.com
 """
@@ -18,7 +18,7 @@ class BPRLoss(nn.Module):
     Bayesian Personalized Ranking loss with support for multiple negatives.
     """
-    def __init__(self, reduction: str = "mean"):
+    def __init__(self, reduction: Literal["mean", "sum", "none"] = "mean"):
         super().__init__()
         self.reduction = reduction
@@ -42,7 +42,9 @@ class HingeLoss(nn.Module):
     Hinge loss for pairwise ranking.
     """
-    def __init__(self, margin: float = 1.0, reduction: str = "mean"):
+    def __init__(
+        self, margin: float = 1.0, reduction: Literal["mean", "sum", "none"] = "mean"
+    ):
         super().__init__()
         self.margin = margin
         self.reduction = reduction
@@ -69,7 +71,7 @@ class TripletLoss(nn.Module):
     def __init__(
         self,
         margin: float = 1.0,
-        reduction: str = "mean",
+        reduction: Literal["mean", "sum", "none"] = "mean",
         distance: Literal["euclidean", "cosine"] = "euclidean",
     ):
         super().__init__()

nextrec/loss/pointwise.py CHANGED Viewed

@@ -2,11 +2,11 @@
 Pointwise loss functions, including imbalance-aware variants.
 Date: create on 27/10/2025
-Checkpoint: edit on 29/11/2025
+Checkpoint: edit on 29/12/2025
 Author: Yang Zhou, zyaztec@gmail.com
 """
-from typing import Optional, Sequence
+from typing import Optional, Sequence, Literal
 import torch
 import torch.nn as nn
@@ -18,7 +18,9 @@ class CosineContrastiveLoss(nn.Module):
     Contrastive loss using cosine similarity for positive/negative pairs.
     """
-    def __init__(self, margin: float = 0.5, reduction: str = "mean"):
+    def __init__(
+        self, margin: float = 0.5, reduction: Literal["mean", "sum", "none"] = "mean"
+    ):
         super().__init__()
         self.margin = margin
         self.reduction = reduction
@@ -50,7 +52,7 @@ class WeightedBCELoss(nn.Module):
     def __init__(
         self,
         pos_weight: float | torch.Tensor | None = None,
-        reduction: str = "mean",
+        reduction: Literal["mean", "sum", "none"] = "mean",
         logits: bool = False,
         auto_balance: bool = False,
     ):
@@ -110,7 +112,7 @@ class FocalLoss(nn.Module):
         self,
         gamma: float = 2.0,
         alpha: Optional[float | Sequence[float] | torch.Tensor] = None,
-        reduction: str = "mean",
+        reduction: Literal["mean", "sum", "none"] = "mean",
         logits: bool = False,
     ):
         super().__init__()
@@ -187,7 +189,7 @@ class ClassBalancedFocalLoss(nn.Module):
         class_counts: Sequence[int] | torch.Tensor,
         beta: float = 0.9999,
         gamma: float = 2.0,
-        reduction: str = "mean",
+        reduction: Literal["mean", "sum", "none"] = "mean",
     ):
         super().__init__()
         self.gamma = gamma

nextrec/models/multi_task/aitm.py ADDED Viewed

File without changes

nextrec/models/multi_task/apg.py ADDED Viewed

File without changes

nextrec/models/multi_task/cross_stitch.py ADDED Viewed

File without changes

nextrec/models/multi_task/esmm.py CHANGED Viewed

@@ -42,12 +42,12 @@ CVR 预测 P(conversion|click)，二者相乘得到 CTCVR 并在曝光标签上
 """
 import torch
-import torch.nn as nn
 from nextrec.basic.features import DenseFeature, SequenceFeature, SparseFeature
 from nextrec.basic.layers import MLP, EmbeddingLayer
 from nextrec.basic.heads import TaskHead
 from nextrec.basic.model import BaseModel
+from nextrec.utils.types import TaskTypeName
 class ESMM(BaseModel):
@@ -77,23 +77,12 @@ class ESMM(BaseModel):
         sequence_features: list[SequenceFeature],
         ctr_params: dict,
         cvr_params: dict,
+        task: TaskTypeName | list[TaskTypeName] | None = None,
         target: list[str] | None = None,  # Note: ctcvr = ctr * cvr
-        task: list[str] | None = None,
-        optimizer: str = "adam",
-        optimizer_params: dict | None = None,
-        loss: str | nn.Module | list[str | nn.Module] | None = "bce",
-        loss_params: dict | list[dict] | None = None,
-        embedding_l1_reg=0.0,
-        dense_l1_reg=0.0,
-        embedding_l2_reg=0.0,
-        dense_l2_reg=0.0,
         **kwargs,
     ):
         target = target or ["ctr", "ctcvr"]
-        optimizer_params = optimizer_params or {}
-        if loss is None:
-            loss = "bce"
         if len(target) != 2:
             raise ValueError(
@@ -120,35 +109,23 @@ class ESMM(BaseModel):
             sequence_features=sequence_features,
             target=target,
             task=resolved_task,  # Both CTR and CTCVR are binary classification
-            embedding_l1_reg=embedding_l1_reg,
-            dense_l1_reg=dense_l1_reg,
-            embedding_l2_reg=embedding_l2_reg,
-            dense_l2_reg=dense_l2_reg,
             **kwargs,
         )
-        self.loss = loss
         self.embedding = EmbeddingLayer(features=self.all_features)
         input_dim = self.embedding.input_dim
         # CTR tower
-        self.ctr_tower = MLP(input_dim=input_dim, output_layer=True, **ctr_params)
+        self.ctr_tower = MLP(input_dim=input_dim, output_dim=1, **ctr_params)
         # CVR tower
-        self.cvr_tower = MLP(input_dim=input_dim, output_layer=True, **cvr_params)
+        self.cvr_tower = MLP(input_dim=input_dim, output_dim=1, **cvr_params)
         self.grad_norm_shared_modules = ["embedding"]
-        self.prediction_layer = TaskHead(task_type=self.default_task, task_dims=[1, 1])
+        self.prediction_layer = TaskHead(task_type=self.task, task_dims=[1, 1])
         # Register regularization weights
         self.register_regularization_weights(
             embedding_attr="embedding", include_modules=["ctr_tower", "cvr_tower"]
         )
-        self.compile(
-            optimizer=optimizer,
-            optimizer_params=optimizer_params,
-            loss=loss,
-            loss_params=loss_params,
-        )
     def forward(self, x):
         # Get all embeddings and flatten

nextrec/models/multi_task/mmoe.py CHANGED Viewed

@@ -82,14 +82,6 @@ class MMOE(BaseModel):
         tower_params_list: list[dict] | None = None,
         target: list[str] | str | None = None,
         task: str | list[str] = "binary",
-        optimizer: str = "adam",
-        optimizer_params: dict | None = None,
-        loss: str | nn.Module | list[str | nn.Module] | None = "bce",
-        loss_params: dict | list[dict] | None = None,
-        embedding_l1_reg=0.0,
-        dense_l1_reg=0.0,
-        embedding_l2_reg=0.0,
-        dense_l2_reg=0.0,
         **kwargs,
     ):
@@ -98,9 +90,7 @@ class MMOE(BaseModel):
         sequence_features = sequence_features or []
         expert_params = expert_params or {}
         tower_params_list = tower_params_list or []
-        optimizer_params = optimizer_params or {}
-        if loss is None:
-            loss = "bce"
         if target is None:
             target = []
         elif isinstance(target, str):
@@ -126,15 +116,9 @@ class MMOE(BaseModel):
             sequence_features=sequence_features,
             target=target,
             task=resolved_task,
-            embedding_l1_reg=embedding_l1_reg,
-            dense_l1_reg=dense_l1_reg,
-            embedding_l2_reg=embedding_l2_reg,
-            dense_l2_reg=dense_l2_reg,
             **kwargs,
         )
-        self.loss = loss
         # Number of tasks and experts
         self.nums_task = len(target)
         self.num_experts = num_experts
@@ -150,12 +134,12 @@ class MMOE(BaseModel):
         # Expert networks (shared by all tasks)
         self.experts = nn.ModuleList()
         for _ in range(num_experts):
-            expert = MLP(input_dim=input_dim, output_layer=False, **expert_params)
+            expert = MLP(input_dim=input_dim, output_dim=None, **expert_params)
             self.experts.append(expert)
         # Get expert output dimension
-        if "dims" in expert_params and len(expert_params["dims"]) > 0:
-            expert_output_dim = expert_params["dims"][-1]
+        if "hidden_dims" in expert_params and len(expert_params["hidden_dims"]) > 0:
+            expert_output_dim = expert_params["hidden_dims"][-1]
         else:
             expert_output_dim = input_dim
@@ -169,21 +153,15 @@ class MMOE(BaseModel):
         # Task-specific towers
         self.towers = nn.ModuleList()
         for tower_params in tower_params_list:
-            tower = MLP(input_dim=expert_output_dim, output_layer=True, **tower_params)
+            tower = MLP(input_dim=expert_output_dim, output_dim=1, **tower_params)
             self.towers.append(tower)
         self.prediction_layer = TaskHead(
-            task_type=self.default_task, task_dims=[1] * self.nums_task
+            task_type=self.task, task_dims=[1] * self.nums_task
         )
         # Register regularization weights
         self.register_regularization_weights(
             embedding_attr="embedding", include_modules=["experts", "gates", "towers"]
         )
-        self.compile(
-            optimizer=optimizer,
-            optimizer_params=optimizer_params,
-            loss=self.loss,
-            loss_params=loss_params,
-        )
     def forward(self, x):
         # Get all embeddings and flatten

nextrec/models/multi_task/pepnet.py ADDED Viewed

@@ -0,0 +1,335 @@
+"""
+Date: create on 09/11/2025
+Checkpoint: edit on 30/12/2025
+Author: Yang Zhou, zyaztec@gmail.com
+Reference:
+[1] Yang et al. "PEPNet: Parameter and Embedding Personalized Network for Multi-Task Learning", 2021.
+[2] MMLRec-A-Unified-Multi-Task-and-Multi-Scenario-Learning-Benchmark-for-Recommendation:
+https://github.com/alipay/MMLRec-A-Unified-Multi-Task-and-Multi-Scenario-Learning-Benchmark-for-Recommendation/blob/main/model/pepnet.py
+PEPNet (Parameter and Embedding Personalized Network) is a multi-task learning
+model that personalizes both input features and layer transformations with
+context (scene/domain, user, item). It applies a shared feature gate to the
+backbone embedding and then uses per-task gated MLP blocks (PPNet blocks) whose
+gates are conditioned on task-specific context. This enables task-aware routing
+at both feature and layer levels, improving adaptation across scenarios/tasks.
+Workflow:
+  (1) Embed all features and build the backbone input
+  (2) Build task context embedding from domain/user/item features
+  (3) Feature gate masks backbone input using domain context
+  (4) Each task tower applies layer-wise gates conditioned on context + backbone embedding output
+  (5) Task heads produce per-task predictions
+Key Advantages:
+- Two-level personalization: feature gate + layer gates
+- Context-driven routing for multi-scenario/multi-task recommendation
+- Task towers share embeddings while adapting via gates
+- Gate input uses stop-grad on backbone embedding output for stable training
+- Compatible with heterogeneous features via unified embeddings
+PEPNet（Parameter and Embedding Personalized Network）通过场景/用户/物品等上下文
+对输入特征与网络层进行双层门控个性化。先用共享特征门控调整主干输入，再在每个
+任务塔中使用条件门控的 MLP 层（PPNet block），实现任务与场景感知的逐层路由。
+流程：
+  (1) 对全部特征做 embedding，得到主干输入
+  (2) 由场景/用户/物品特征构建任务上下文向量
+  (3) 共享特征门控按场景调制主干输入
+  (4) 任务塔逐层门控，结合上下文与主干 embedding 输出进行路由
+  (5) 任务头输出各任务预测结果
+主要优点：
+- 特征级与层级双重个性化
+- 上下文驱动的多场景/多任务适配
+- 共享 embedding 的同时通过门控实现任务定制
+- 对主干 embedding 输出 stop-grad，提高训练稳定性
+- 统一 embedding 支持多类特征
+"""
+from __future__ import annotations
+import torch
+import torch.nn as nn
+from nextrec.basic.activation import activation_layer
+from nextrec.basic.features import DenseFeature, SequenceFeature, SparseFeature
+from nextrec.basic.layers import EmbeddingLayer, GateMLP
+from nextrec.basic.heads import TaskHead
+from nextrec.basic.model import BaseModel
+from nextrec.utils.model import select_features
+from nextrec.utils.types import ActivationName, TaskTypeName
+class PPNetBlock(nn.Module):
+    """
+    PEPNet block with per-layer gates conditioned on task context.
+    """
+    def __init__(
+        self,
+        input_dim: int,
+        output_dim: int,
+        gate_input_dim: int,
+        gate_hidden_dim: int | None,
+        hidden_units: list[int] | None = None,
+        hidden_activations: ActivationName | list[ActivationName] = "relu",
+        dropout_rates: float | list[float] = 0.0,
+        batch_norm: bool = False,
+        use_bias: bool = True,
+        gate_activation: ActivationName = "relu",
+        gate_dropout: float = 0.0,
+        gate_use_bn: bool = False,
+    ) -> None:
+        super().__init__()
+        hidden_units = hidden_units or []
+        if isinstance(dropout_rates, list):
+            if len(dropout_rates) != len(hidden_units):
+                raise ValueError("dropout_rates length must match hidden_units length.")
+            dropout_list = dropout_rates
+        else:
+            dropout_list = [dropout_rates] * len(hidden_units)
+        if isinstance(hidden_activations, list):
+            if len(hidden_activations) != len(hidden_units):
+                raise ValueError(
+                    "hidden_activations length must match hidden_units length."
+                )
+            activation_list = hidden_activations
+        else:
+            activation_list = [hidden_activations] * len(hidden_units)
+        self.gate_layers = nn.ModuleList()
+        self.mlp_layers = nn.ModuleList()
+        layer_units = [input_dim] + hidden_units
+        for idx in range(len(layer_units) - 1):
+            dense_layers: list[nn.Module] = [
+                nn.Linear(layer_units[idx], layer_units[idx + 1], bias=use_bias)
+            ]
+            if batch_norm:
+                dense_layers.append(nn.BatchNorm1d(layer_units[idx + 1]))
+            dense_layers.append(activation_layer(activation_list[idx]))
+            if dropout_list[idx] > 0:
+                dense_layers.append(nn.Dropout(p=dropout_list[idx]))
+            self.gate_layers.append(
+                GateMLP(
+                    input_dim=gate_input_dim,
+                    hidden_dim=gate_hidden_dim,
+                    output_dim=layer_units[idx],
+                    activation=gate_activation,
+                    dropout=gate_dropout,
+                    use_bn=gate_use_bn,
+                    scale_factor=2.0,
+                )
+            )
+            self.mlp_layers.append(nn.Sequential(*dense_layers))
+        self.gate_layers.append(
+            GateMLP(
+                input_dim=gate_input_dim,
+                hidden_dim=gate_hidden_dim,
+                output_dim=layer_units[-1],
+                activation=gate_activation,
+                dropout=gate_dropout,
+                use_bn=gate_use_bn,
+                scale_factor=1.0,
+            )
+        )
+        self.mlp_layers.append(nn.Linear(layer_units[-1], output_dim, bias=use_bias))
+    def forward(self, o_ep: torch.Tensor, o_prior: torch.Tensor) -> torch.Tensor:
+        """
+        o_ep: EPNet output embedding (will be stop-grad in gate input)
+        o_prior: prior/task context embedding
+        """
+        gate_input = torch.cat([o_prior, o_ep.detach()], dim=-1)
+        hidden = o_ep
+        for gate, mlp in zip(self.gate_layers, self.mlp_layers):
+            gw = gate(gate_input)
+            hidden = mlp(hidden * gw)
+        return hidden
+class PEPNet(BaseModel):
+    """
+    PEPNet: feature-gated multi-task tower with task-conditioned gates.
+    """
+    @property
+    def model_name(self) -> str:
+        return "PepNet"
+    @property
+    def default_task(self) -> TaskTypeName | list[TaskTypeName]:
+        nums_task = self.nums_task if hasattr(self, "nums_task") else None
+        if nums_task is not None and nums_task > 0:
+            return ["binary"] * nums_task
+        return ["binary"]
+    def __init__(
+        self,
+        dense_features: list[DenseFeature] | None = None,
+        sparse_features: list[SparseFeature] | None = None,
+        sequence_features: list[SequenceFeature] | None = None,
+        target: list[str] | str | None = None,
+        task: TaskTypeName | list[TaskTypeName] | None = None,
+        dnn_hidden_units: list[int] | None = None,
+        dnn_activation: ActivationName = "relu",
+        dnn_dropout: float | list[float] = 0.0,
+        dnn_use_bn: bool = False,
+        feature_gate_hidden_dim: int = 128,
+        gate_hidden_dim: int | None = None,
+        gate_activation: ActivationName = "relu",
+        gate_dropout: float = 0.0,
+        gate_use_bn: bool = False,
+        domain_features: list[str] | str | None = None,
+        user_features: list[str] | str | None = None,
+        item_features: list[str] | str | None = None,
+        use_bias: bool = True,
+        **kwargs,
+    ) -> None:
+        dense_features = dense_features or []
+        sparse_features = sparse_features or []
+        sequence_features = sequence_features or []
+        dnn_hidden_units = dnn_hidden_units or [256, 128]
+        if target is None:
+            target = []
+        elif isinstance(target, str):
+            target = [target]
+        self.nums_task = len(target) if target else 1
+        resolved_task = task
+        if resolved_task is None:
+            resolved_task = self.default_task
+        elif isinstance(resolved_task, str):
+            resolved_task = [resolved_task] * self.nums_task
+        elif len(resolved_task) == 1 and self.nums_task > 1:
+            resolved_task = resolved_task * self.nums_task
+        elif len(resolved_task) != self.nums_task:
+            raise ValueError(
+                f"Length of task ({len(resolved_task)}) must match number of targets ({self.nums_task})."
+            )
+        super().__init__(
+            dense_features=dense_features,
+            sparse_features=sparse_features,
+            sequence_features=sequence_features,
+            target=target,
+            task=resolved_task,
+            **kwargs,
+        )
+        if isinstance(domain_features, str):
+            domain_features = [domain_features]
+        if isinstance(user_features, str):
+            user_features = [user_features]
+        if isinstance(item_features, str):
+            item_features = [item_features]
+        self.scene_feature_names = list(domain_features or [])
+        self.user_feature_names = list(user_features or [])
+        self.item_feature_names = list(item_features or [])
+        if not self.scene_feature_names:
+            raise ValueError("PepNet requires at least one scene feature name.")
+        self.domain_features = select_features(
+            self.all_features, self.scene_feature_names, "domain_features"
+        )
+        self.user_features = select_features(
+            self.all_features, self.user_feature_names, "user_features"
+        )
+        self.item_features = select_features(
+            self.all_features, self.item_feature_names, "item_features"
+        )
+        if not self.all_features:
+            raise ValueError("PepNet requires at least one input feature.")
+        self.embedding = EmbeddingLayer(features=self.all_features)
+        input_dim = self.embedding.get_input_dim(self.all_features)
+        domain_dim = self.embedding.get_input_dim(self.domain_features)
+        user_dim = (
+            self.embedding.get_input_dim(self.user_features)
+            if self.user_features
+            else 0
+        )
+        item_dim = (
+            self.embedding.get_input_dim(self.item_features)
+            if self.item_features
+            else 0
+        )
+        task_dim = domain_dim + user_dim + item_dim
+        self.feature_gate = GateMLP(
+            input_dim=input_dim + domain_dim,
+            hidden_dim=feature_gate_hidden_dim,
+            output_dim=input_dim,
+            activation=gate_activation,
+            dropout=gate_dropout,
+            use_bn=gate_use_bn,
+        )
+        self.ppn_blocks = nn.ModuleList(
+            [
+                PPNetBlock(
+                    input_dim=input_dim,
+                    output_dim=1,
+                    gate_input_dim=input_dim + task_dim,
+                    gate_hidden_dim=gate_hidden_dim,
+                    hidden_units=dnn_hidden_units,
+                    hidden_activations=dnn_activation,
+                    dropout_rates=dnn_dropout,
+                    batch_norm=dnn_use_bn,
+                    use_bias=use_bias,
+                    gate_activation=gate_activation,
+                    gate_dropout=gate_dropout,
+                    gate_use_bn=gate_use_bn,
+                )
+                for _ in range(self.nums_task)
+            ]
+        )
+        self.prediction_layer = TaskHead(
+            task_type=self.task, task_dims=[1] * self.nums_task
+        )
+        self.grad_norm_shared_modules = ["embedding", "feature_gate"]
+        self.register_regularization_weights(
+            embedding_attr="embedding", include_modules=["feature_gate", "ppn_blocks"]
+        )
+    def forward(self, x: dict[str, torch.Tensor]) -> torch.Tensor:
+        dnn_input = self.embedding(x=x, features=self.all_features, squeeze_dim=True)
+        domain_emb = self.embedding(
+            x=x, features=self.domain_features, squeeze_dim=True
+        ).detach()
+        task_parts = [domain_emb]
+        if self.user_features:
+            task_parts.append(
+                self.embedding(
+                    x=x, features=self.user_features, squeeze_dim=True
+                ).detach()
+            )
+        if self.item_features:
+            task_parts.append(
+                self.embedding(
+                    x=x, features=self.item_features, squeeze_dim=True
+                ).detach()
+            )
+        task_sf_emb = torch.cat(task_parts, dim=-1)
+        gate_input = torch.cat([dnn_input.detach(), domain_emb], dim=-1)
+        dnn_input = self.feature_gate(gate_input) * dnn_input
+        task_logits = []
+        for block in self.ppn_blocks:
+            task_logits.append(block(o_ep=dnn_input, o_prior=task_sf_emb))
+        y = torch.cat(task_logits, dim=1)
+        return self.prediction_layer(y)

nextrec 0.4.22__py3-none-any.whl → 0.4.24__py3-none-any.whl

nextrec 0.4.22__py3-none-any.whl → 0.4.24__py3-none-any.whl