nextrec 0.1.1-py3-none-any.whl → 0.1.2-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- nextrec/__init__.py +4 -4
- nextrec/__version__.py +1 -1
- nextrec/basic/activation.py +10 -9
- nextrec/basic/callback.py +1 -0
- nextrec/basic/dataloader.py +168 -127
- nextrec/basic/features.py +24 -27
- nextrec/basic/layers.py +328 -159
- nextrec/basic/loggers.py +50 -37
- nextrec/basic/metrics.py +255 -147
- nextrec/basic/model.py +817 -462
- nextrec/data/__init__.py +5 -5
- nextrec/data/data_utils.py +16 -12
- nextrec/data/preprocessor.py +276 -252
- nextrec/loss/__init__.py +12 -12
- nextrec/loss/loss_utils.py +30 -22
- nextrec/loss/match_losses.py +116 -83
- nextrec/models/match/__init__.py +5 -5
- nextrec/models/match/dssm.py +70 -61
- nextrec/models/match/dssm_v2.py +61 -51
- nextrec/models/match/mind.py +89 -71
- nextrec/models/match/sdm.py +93 -81
- nextrec/models/match/youtube_dnn.py +62 -53
- nextrec/models/multi_task/esmm.py +49 -43
- nextrec/models/multi_task/mmoe.py +65 -56
- nextrec/models/multi_task/ple.py +92 -65
- nextrec/models/multi_task/share_bottom.py +48 -42
- nextrec/models/ranking/__init__.py +7 -7
- nextrec/models/ranking/afm.py +39 -30
- nextrec/models/ranking/autoint.py +70 -57
- nextrec/models/ranking/dcn.py +43 -35
- nextrec/models/ranking/deepfm.py +34 -28
- nextrec/models/ranking/dien.py +115 -79
- nextrec/models/ranking/din.py +84 -60
- nextrec/models/ranking/fibinet.py +51 -35
- nextrec/models/ranking/fm.py +28 -26
- nextrec/models/ranking/masknet.py +31 -31
- nextrec/models/ranking/pnn.py +30 -31
- nextrec/models/ranking/widedeep.py +36 -31
- nextrec/models/ranking/xdeepfm.py +46 -39
- nextrec/utils/__init__.py +9 -9
- nextrec/utils/embedding.py +1 -1
- nextrec/utils/initializer.py +23 -15
- nextrec/utils/optimizer.py +14 -10
- {nextrec-0.1.1.dist-info → nextrec-0.1.2.dist-info}/METADATA +6 -40
- nextrec-0.1.2.dist-info/RECORD +51 -0
- nextrec-0.1.1.dist-info/RECORD +0 -51
- {nextrec-0.1.1.dist-info → nextrec-0.1.2.dist-info}/WHEEL +0 -0
- {nextrec-0.1.1.dist-info → nextrec-0.1.2.dist-info}/licenses/LICENSE +0 -0
nextrec/loss/__init__.py
CHANGED
@@ -18,18 +18,18 @@ from nextrec.loss.loss_utils import (
 
 __all__ = [
     # Match losses
-
-
-
-
-
-
+    "BPRLoss",
+    "HingeLoss",
+    "TripletLoss",
+    "SampledSoftmaxLoss",
+    "CosineContrastiveLoss",
+    "InfoNCELoss",
     # Listwise losses
-
-
-
+    "ListNetLoss",
+    "ListMLELoss",
+    "ApproxNDCGLoss",
     # Utilities
-
-
-
+    "get_loss_fn",
+    "validate_training_mode",
+    "VALID_TASK_TYPES",
 ]
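With the `__all__` list now populated, the public loss API can be imported straight from the package namespace. A minimal sketch, assuming the imports inside `__init__.py` re-export exactly the names listed above:

```python
# Hypothetical usage of the nextrec.loss public API (names taken from __all__ above).
from nextrec.loss import BPRLoss, InfoNCELoss, get_loss_fn, VALID_TASK_TYPES

print(VALID_TASK_TYPES)  # the task types accepted by get_loss_fn
```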
nextrec/loss/loss_utils.py
CHANGED
@@ -5,42 +5,52 @@ Date: create on 09/11/2025
 Author:
     Yang Zhou,zyaztec@gmail.com
 """
+
 import torch
 import torch.nn as nn
 from typing import Literal
 
 from nextrec.loss.match_losses import (
-    BPRLoss,
-    HingeLoss,
-    TripletLoss,
+    BPRLoss,
+    HingeLoss,
+    TripletLoss,
     SampledSoftmaxLoss,
-    CosineContrastiveLoss,
-    InfoNCELoss
+    CosineContrastiveLoss,
+    InfoNCELoss,
 )
 
 # Valid task types for validation
-VALID_TASK_TYPES = [
+VALID_TASK_TYPES = [
+    "binary",
+    "multiclass",
+    "regression",
+    "multivariate_regression",
+    "match",
+    "ranking",
+    "multitask",
+    "multilabel",
+]
 
 
 def get_loss_fn(
     task_type: str = "binary",
     training_mode: str | None = None,
     loss: str | nn.Module | None = None,
-    **loss_kwargs
+    **loss_kwargs,
 ) -> nn.Module:
     """
     Get loss function based on task type and training mode.
-
+
     Examples:
         # Ranking task (binary classification)
         >>> loss_fn = get_loss_fn(task_type="binary", loss="bce")
-
+
         # Match task with pointwise training
         >>> loss_fn = get_loss_fn(task_type="match", training_mode="pointwise")
-
+
         # Match task with pairwise training
         >>> loss_fn = get_loss_fn(task_type="match", training_mode="pairwise", loss="bpr")
-
+
         # Match task with listwise training
        >>> loss_fn = get_loss_fn(task_type="match", training_mode="listwise", loss="sampled_softmax")
     """
@@ -57,7 +67,7 @@ def get_loss_fn(
                 return CosineContrastiveLoss(**loss_kwargs)
             elif isinstance(loss, str):
                 raise ValueError(f"Unsupported pointwise loss: {loss}")
-
+
         elif training_mode == "pairwise":
             if loss is None or loss == "bpr":
                 return BPRLoss(**loss_kwargs)
@@ -67,7 +77,7 @@ def get_loss_fn(
                 return TripletLoss(**loss_kwargs)
             elif isinstance(loss, str):
                 raise ValueError(f"Unsupported pairwise loss: {loss}")
-
+
         elif training_mode == "listwise":
             if loss is None or loss == "sampled_softmax" or loss == "softmax":
                 return SampledSoftmaxLoss(**loss_kwargs)
@@ -77,7 +87,7 @@ def get_loss_fn(
                 return nn.CrossEntropyLoss(**loss_kwargs)
             elif isinstance(loss, str):
                 raise ValueError(f"Unsupported listwise loss: {loss}")
-
+
         else:
             raise ValueError(f"Unknown training_mode: {training_mode}")
 
@@ -98,7 +108,7 @@ def get_loss_fn(
             return nn.CrossEntropyLoss(**loss_kwargs)
         elif isinstance(loss, str):
             raise ValueError(f"Unsupported multiclass loss: {loss}")
-
+
     elif task_type == "regression":
         if loss is None or loss == "mse":
             return nn.MSELoss(**loss_kwargs)
@@ -106,26 +116,24 @@ def get_loss_fn(
             return nn.L1Loss(**loss_kwargs)
         elif isinstance(loss, str):
             raise ValueError(f"Unsupported regression loss: {loss}")
-
+
     else:
         raise ValueError(f"Unsupported task_type: {task_type}")
-
+
     return loss
 
 
 def validate_training_mode(
-    training_mode: str,
-    support_training_modes: list[str],
-    model_name: str = "Model"
+    training_mode: str, support_training_modes: list[str], model_name: str = "Model"
 ) -> None:
     """
     Validate that the requested training mode is supported by the model.
-
+
     Args:
         training_mode: Requested training mode
         support_training_modes: List of supported training modes
         model_name: Name of the model (for error messages)
-
+
     Raises:
         ValueError: If training mode is not supported
     """
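The docstring examples above map directly onto the dispatch branches visible in this diff. A hedged usage sketch (only the branches shown in these hunks are relied on; anything else is an assumption):

```python
from nextrec.loss.loss_utils import get_loss_fn, VALID_TASK_TYPES

assert "match" in VALID_TASK_TYPES and "regression" in VALID_TASK_TYPES

# String shortcuts resolve per task_type / training_mode, as in the branches above.
bce_fn = get_loss_fn(task_type="binary", loss="bce")                            # docstring example
bpr_fn = get_loss_fn(task_type="match", training_mode="pairwise", loss="bpr")   # returns BPRLoss per the pairwise branch
mse_fn = get_loss_fn(task_type="regression", loss="mse")                        # returns nn.MSELoss per the regression branch

# A string that no branch recognizes falls through to the ValueError raises shown above,
# e.g. get_loss_fn(task_type="regression", loss="not-a-loss") raises ValueError.
```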
nextrec/loss/match_losses.py
CHANGED
@@ -13,149 +13,167 @@ from typing import Optional
 
 
 class BPRLoss(nn.Module):
-    def __init__(self, reduction: str =
+    def __init__(self, reduction: str = "mean"):
         super(BPRLoss, self).__init__()
         self.reduction = reduction
-
+
     def forward(self, pos_score: torch.Tensor, neg_score: torch.Tensor) -> torch.Tensor:
         if neg_score.dim() == 2:
             pos_score = pos_score.unsqueeze(1)  # [batch_size, 1]
             diff = pos_score - neg_score  # [batch_size, num_neg]
             loss = -torch.log(torch.sigmoid(diff) + 1e-8)
-            if self.reduction ==
+            if self.reduction == "mean":
                 return loss.mean()
-            elif self.reduction ==
+            elif self.reduction == "sum":
                 return loss.sum()
             else:
                 return loss
         else:
             diff = pos_score - neg_score
             loss = -torch.log(torch.sigmoid(diff) + 1e-8)
-            if self.reduction ==
+            if self.reduction == "mean":
                 return loss.mean()
-            elif self.reduction ==
+            elif self.reduction == "sum":
                 return loss.sum()
             else:
                 return loss
 
 
-class HingeLoss(nn.Module):
-    def __init__(self, margin: float = 1.0, reduction: str =
+class HingeLoss(nn.Module):
+    def __init__(self, margin: float = 1.0, reduction: str = "mean"):
         super(HingeLoss, self).__init__()
         self.margin = margin
         self.reduction = reduction
-
+
     def forward(self, pos_score: torch.Tensor, neg_score: torch.Tensor) -> torch.Tensor:
         if neg_score.dim() == 2:
             pos_score = pos_score.unsqueeze(1)  # [batch_size, 1]
-
+
         diff = pos_score - neg_score
         loss = torch.clamp(self.margin - diff, min=0)
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss.mean()
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss.sum()
         else:
             return loss
 
 
 class TripletLoss(nn.Module):
-    def __init__(
+    def __init__(
+        self, margin: float = 1.0, reduction: str = "mean", distance: str = "euclidean"
+    ):
         super(TripletLoss, self).__init__()
         self.margin = margin
         self.reduction = reduction
         self.distance = distance
-
-    def forward(
-
+
+    def forward(
+        self, anchor: torch.Tensor, positive: torch.Tensor, negative: torch.Tensor
+    ) -> torch.Tensor:
+        if self.distance == "euclidean":
             pos_dist = torch.sum((anchor - positive) ** 2, dim=-1)
-
+
             if negative.dim() == 3:
                 anchor_expanded = anchor.unsqueeze(1)  # [batch_size, 1, dim]
-                neg_dist = torch.sum(
+                neg_dist = torch.sum(
+                    (anchor_expanded - negative) ** 2, dim=-1
+                )  # [batch_size, num_neg]
             else:
                 neg_dist = torch.sum((anchor - negative) ** 2, dim=-1)
-
+
             if neg_dist.dim() == 2:
                 pos_dist = pos_dist.unsqueeze(1)  # [batch_size, 1]
-
-        elif self.distance ==
+
+        elif self.distance == "cosine":
             pos_dist = 1 - F.cosine_similarity(anchor, positive, dim=-1)
-
+
             if negative.dim() == 3:
                 anchor_expanded = anchor.unsqueeze(1)  # [batch_size, 1, dim]
                 neg_dist = 1 - F.cosine_similarity(anchor_expanded, negative, dim=-1)
             else:
                 neg_dist = 1 - F.cosine_similarity(anchor, negative, dim=-1)
-
+
             if neg_dist.dim() == 2:
                 pos_dist = pos_dist.unsqueeze(1)
         else:
             raise ValueError(f"Unsupported distance: {self.distance}")
-
+
         loss = torch.clamp(pos_dist - neg_dist + self.margin, min=0)
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss.mean()
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss.sum()
         else:
             return loss
 
 
 class SampledSoftmaxLoss(nn.Module):
-    def __init__(self, reduction: str =
+    def __init__(self, reduction: str = "mean"):
         super(SampledSoftmaxLoss, self).__init__()
         self.reduction = reduction
-
-    def forward(
+
+    def forward(
+        self, pos_logits: torch.Tensor, neg_logits: torch.Tensor
+    ) -> torch.Tensor:
         pos_logits = pos_logits.unsqueeze(1)  # [batch_size, 1]
-        all_logits = torch.cat(
-
+        all_logits = torch.cat(
+            [pos_logits, neg_logits], dim=1
+        )  # [batch_size, 1 + num_neg]
+        targets = torch.zeros(
+            all_logits.size(0), dtype=torch.long, device=all_logits.device
+        )
         loss = F.cross_entropy(all_logits, targets, reduction=self.reduction)
-
+
         return loss
 
 
 class CosineContrastiveLoss(nn.Module):
-    def __init__(self, margin: float = 0.5, reduction: str =
+    def __init__(self, margin: float = 0.5, reduction: str = "mean"):
         super(CosineContrastiveLoss, self).__init__()
         self.margin = margin
         self.reduction = reduction
-
-    def forward(
+
+    def forward(
+        self, user_emb: torch.Tensor, item_emb: torch.Tensor, labels: torch.Tensor
+    ) -> torch.Tensor:
         similarity = F.cosine_similarity(user_emb, item_emb, dim=-1)
         pos_loss = (1 - similarity) * labels
 
         neg_loss = torch.clamp(similarity - self.margin, min=0) * (1 - labels)
-
+
         loss = pos_loss + neg_loss
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss.mean()
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss.sum()
         else:
             return loss
 
 
 class InfoNCELoss(nn.Module):
-    def __init__(self, temperature: float = 0.07, reduction: str =
+    def __init__(self, temperature: float = 0.07, reduction: str = "mean"):
         super(InfoNCELoss, self).__init__()
         self.temperature = temperature
         self.reduction = reduction
-
-    def forward(
+
+    def forward(
+        self, query: torch.Tensor, pos_key: torch.Tensor, neg_keys: torch.Tensor
+    ) -> torch.Tensor:
         pos_sim = torch.sum(query * pos_key, dim=-1) / self.temperature  # [batch_size]
         pos_sim = pos_sim.unsqueeze(1)  # [batch_size, 1]
         query_expanded = query.unsqueeze(1)  # [batch_size, 1, dim]
-        neg_sim =
+        neg_sim = (
+            torch.sum(query_expanded * neg_keys, dim=-1) / self.temperature
+        )  # [batch_size, num_neg]
         logits = torch.cat([pos_sim, neg_sim], dim=1)  # [batch_size, 1 + num_neg]
         labels = torch.zeros(logits.size(0), dtype=torch.long, device=logits.device)
 
         loss = F.cross_entropy(logits, labels, reduction=self.reduction)
-
+
         return loss
 
 
@@ -164,22 +182,23 @@ class ListNetLoss(nn.Module):
     ListNet loss using top-1 probability distribution
     Reference: Cao et al. Learning to Rank: From Pairwise Approach to Listwise Approach (ICML 2007)
     """
-
+
+    def __init__(self, temperature: float = 1.0, reduction: str = "mean"):
         super(ListNetLoss, self).__init__()
         self.temperature = temperature
         self.reduction = reduction
-
+
     def forward(self, scores: torch.Tensor, labels: torch.Tensor) -> torch.Tensor:
         # Convert scores and labels to probability distributions
         pred_probs = F.softmax(scores / self.temperature, dim=1)
         true_probs = F.softmax(labels / self.temperature, dim=1)
-
+
         # Cross entropy between two distributions
         loss = -torch.sum(true_probs * torch.log(pred_probs + 1e-10), dim=1)
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss.mean()
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss.sum()
         else:
             return loss
@@ -190,19 +209,24 @@ class ListMLELoss(nn.Module):
     ListMLE (Maximum Likelihood Estimation) loss
     Reference: Xia et al. Listwise approach to learning to rank: theory and algorithm (ICML 2008)
     """
-
+
+    def __init__(self, reduction: str = "mean"):
         super(ListMLELoss, self).__init__()
         self.reduction = reduction
-
+
     def forward(self, scores: torch.Tensor, labels: torch.Tensor) -> torch.Tensor:
         # Sort by labels in descending order to get ground truth ranking
         sorted_labels, sorted_indices = torch.sort(labels, descending=True, dim=1)
-
+
         # Reorder scores according to ground truth ranking
         batch_size, list_size = scores.shape
-        batch_indices =
+        batch_indices = (
+            torch.arange(batch_size, device=scores.device)
+            .unsqueeze(1)
+            .expand(-1, list_size)
+        )
         sorted_scores = scores[batch_indices, sorted_indices]
-
+
         # Compute log likelihood
         # For each position, compute log(exp(score_i) / sum(exp(score_j) for j >= i))
         loss = torch.tensor(0.0, device=scores.device)
@@ -211,10 +235,10 @@ class ListMLELoss(nn.Module):
             remaining_scores = sorted_scores[:, i:]
             log_sum_exp = torch.logsumexp(remaining_scores, dim=1)
             loss = loss + (log_sum_exp - sorted_scores[:, i]).sum()
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss / batch_size
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss
         else:
             return loss / batch_size
@@ -223,72 +247,81 @@ class ListMLELoss(nn.Module):
 class ApproxNDCGLoss(nn.Module):
     """
     Approximate NDCG loss for learning to rank
-    Reference: Qin et al. A General Approximation Framework for Direct Optimization of 
+    Reference: Qin et al. A General Approximation Framework for Direct Optimization of
     Information Retrieval Measures (Information Retrieval 2010)
     """
-
+
+    def __init__(self, temperature: float = 1.0, reduction: str = "mean"):
         super(ApproxNDCGLoss, self).__init__()
         self.temperature = temperature
         self.reduction = reduction
-
+
     def _dcg(self, relevance: torch.Tensor, k: Optional[int] = None) -> torch.Tensor:
         if k is not None:
             relevance = relevance[:, :k]
-
+
         # DCG = sum(rel_i / log2(i + 2)) for i in range(list_size)
-        positions = torch.arange(
+        positions = torch.arange(
+            1, relevance.size(1) + 1, device=relevance.device, dtype=torch.float32
+        )
         discounts = torch.log2(positions + 1.0)
         dcg = torch.sum(relevance / discounts, dim=1)
-
+
         return dcg
-
-    def forward(
+
+    def forward(
+        self, scores: torch.Tensor, labels: torch.Tensor, k: Optional[int] = None
+    ) -> torch.Tensor:
         """
         Args:
             scores: Predicted scores [batch_size, list_size]
             labels: Ground truth relevance labels [batch_size, list_size]
             k: Top-k items for NDCG@k (if None, use all items)
-
+
         Returns:
             Approximate NDCG loss (1 - NDCG)
         """
         batch_size = scores.size(0)
-
+
         # Use differentiable sorting approximation with softmax
         # Create pairwise comparison matrix
         scores_expanded = scores.unsqueeze(2)  # [batch_size, list_size, 1]
-        scores_tiled = scores.unsqueeze(1)
-
+        scores_tiled = scores.unsqueeze(1)  # [batch_size, 1, list_size]
+
         # Compute pairwise probabilities using sigmoid
         pairwise_diff = (scores_expanded - scores_tiled) / self.temperature
-        pairwise_probs = torch.sigmoid(
-
+        pairwise_probs = torch.sigmoid(
+            pairwise_diff
+        )  # [batch_size, list_size, list_size]
+
         # Approximate ranking positions
         # ranking_probs[i, j] ≈ probability that item i is ranked at position j
         # We use softmax approximation for differentiable ranking
         ranking_weights = F.softmax(scores / self.temperature, dim=1)
-
+
         # Sort labels to get ideal DCG
         ideal_labels, _ = torch.sort(labels, descending=True, dim=1)
         ideal_dcg = self._dcg(ideal_labels, k)
-
+
         # Compute approximate DCG using soft ranking
         # Weight each item's relevance by its soft ranking position
-        positions = torch.arange(
+        positions = torch.arange(
+            1, scores.size(1) + 1, device=scores.device, dtype=torch.float32
+        )
         discounts = 1.0 / torch.log2(positions + 1.0)
-
+
         # Approximate DCG by weighting relevance with ranking probabilities
         approx_dcg = torch.sum(labels * ranking_weights * discounts, dim=1)
-
+
         # Normalize by ideal DCG to get NDCG
         ndcg = approx_dcg / (ideal_dcg + 1e-10)
-
+
         # Loss is 1 - NDCG (we want to maximize NDCG, so minimize 1 - NDCG)
         loss = 1.0 - ndcg
-
-        if self.reduction ==
+
+        if self.reduction == "mean":
             return loss.mean()
-        elif self.reduction ==
+        elif self.reduction == "sum":
             return loss.sum()
         else:
             return loss
nextrec/models/match/__init__.py
CHANGED