nextrec-0.3.6-py3-none-any.whl → nextrec-0.4.2-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- nextrec/__init__.py +1 -1
- nextrec/__version__.py +1 -1
- nextrec/basic/activation.py +10 -5
- nextrec/basic/callback.py +1 -0
- nextrec/basic/features.py +30 -22
- nextrec/basic/layers.py +244 -113
- nextrec/basic/loggers.py +62 -43
- nextrec/basic/metrics.py +268 -119
- nextrec/basic/model.py +1373 -443
- nextrec/basic/session.py +10 -3
- nextrec/cli.py +498 -0
- nextrec/data/__init__.py +19 -25
- nextrec/data/batch_utils.py +11 -3
- nextrec/data/data_processing.py +42 -24
- nextrec/data/data_utils.py +26 -15
- nextrec/data/dataloader.py +303 -96
- nextrec/data/preprocessor.py +320 -199
- nextrec/loss/listwise.py +17 -9
- nextrec/loss/loss_utils.py +7 -8
- nextrec/loss/pairwise.py +2 -0
- nextrec/loss/pointwise.py +30 -12
- nextrec/models/generative/hstu.py +106 -40
- nextrec/models/match/dssm.py +82 -69
- nextrec/models/match/dssm_v2.py +72 -58
- nextrec/models/match/mind.py +175 -108
- nextrec/models/match/sdm.py +104 -88
- nextrec/models/match/youtube_dnn.py +73 -60
- nextrec/models/multi_task/esmm.py +53 -39
- nextrec/models/multi_task/mmoe.py +70 -47
- nextrec/models/multi_task/ple.py +107 -50
- nextrec/models/multi_task/poso.py +121 -41
- nextrec/models/multi_task/share_bottom.py +54 -38
- nextrec/models/ranking/afm.py +172 -45
- nextrec/models/ranking/autoint.py +84 -61
- nextrec/models/ranking/dcn.py +59 -42
- nextrec/models/ranking/dcn_v2.py +64 -23
- nextrec/models/ranking/deepfm.py +36 -26
- nextrec/models/ranking/dien.py +158 -102
- nextrec/models/ranking/din.py +88 -60
- nextrec/models/ranking/fibinet.py +55 -35
- nextrec/models/ranking/fm.py +32 -26
- nextrec/models/ranking/masknet.py +95 -34
- nextrec/models/ranking/pnn.py +34 -31
- nextrec/models/ranking/widedeep.py +37 -29
- nextrec/models/ranking/xdeepfm.py +63 -41
- nextrec/utils/__init__.py +61 -32
- nextrec/utils/config.py +490 -0
- nextrec/utils/device.py +52 -12
- nextrec/utils/distributed.py +141 -0
- nextrec/utils/embedding.py +1 -0
- nextrec/utils/feature.py +1 -0
- nextrec/utils/file.py +32 -11
- nextrec/utils/initializer.py +61 -16
- nextrec/utils/optimizer.py +25 -9
- nextrec/utils/synthetic_data.py +531 -0
- nextrec/utils/tensor.py +24 -13
- {nextrec-0.3.6.dist-info → nextrec-0.4.2.dist-info}/METADATA +15 -5
- nextrec-0.4.2.dist-info/RECORD +69 -0
- nextrec-0.4.2.dist-info/entry_points.txt +2 -0
- nextrec-0.3.6.dist-info/RECORD +0 -64
- {nextrec-0.3.6.dist-info → nextrec-0.4.2.dist-info}/WHEEL +0 -0
- {nextrec-0.3.6.dist-info → nextrec-0.4.2.dist-info}/licenses/LICENSE +0 -0
nextrec/utils/synthetic_data.py
ADDED
@@ -0,0 +1,531 @@

```python
"""
Synthetic Data Generation Utilities

This module provides utilities for generating synthetic datasets for testing
and tutorial purposes in the NextRec framework.

Date: create on 06/12/2025
Author: Yang Zhou, zyaztec@gmail.com
"""

import numpy as np
import pandas as pd
from typing import Optional, Dict, List, Tuple


def generate_ranking_data(
    n_samples: int = 10000,
    n_dense: int = 5,
    n_sparse: int = 8,
    n_sequences: int = 2,
    user_vocab_size: int = 1000,
    item_vocab_size: int = 500,
    sparse_vocab_size: int = 50,
    sequence_max_len: int = 20,
    embedding_dim: int = 16,
    seed: int = 42,
    custom_sparse_features: Optional[Dict[str, int]] = None,
    use_simple_names: bool = True,
) -> Tuple[pd.DataFrame, List, List, List]:
    """
    Generate synthetic data for ranking tasks (CTR prediction)

    Returns:
        tuple: (dataframe, dense_features, sparse_features, sequence_features)
    """
    print(f"Generating {n_samples} synthetic ranking samples...")

    np.random.seed(seed)
    data = {}

    for i in range(n_dense):
        data[f"dense_{i}"] = np.random.randn(n_samples).astype(np.float32)

    # Generate basic sparse features (always include user_id and item_id)
    data["user_id"] = np.random.randint(1, user_vocab_size, n_samples)
    data["item_id"] = np.random.randint(1, item_vocab_size, n_samples)

    # Generate additional sparse features
    if custom_sparse_features:
        for feat_name, vocab_size in custom_sparse_features.items():
            data[feat_name] = np.random.randint(0, vocab_size, n_samples)
    else:
        for i in range(n_sparse - 2):
            data[f"sparse_{i}"] = np.random.randint(1, sparse_vocab_size, n_samples)

    # Generate sequence features (list of IDs)
    sequence_names = []
    sequence_vocabs = []

    for i in range(n_sequences):
        sequences = []
        for _ in range(n_samples):
            seq_len = np.random.randint(5, sequence_max_len + 1)
            if i == 0:
                # First sequence uses item vocabulary
                seq = np.random.randint(0, item_vocab_size, seq_len).tolist()
                seq_vocab = item_vocab_size
                if custom_sparse_features:
                    seq_name = "hist_items"
                else:
                    seq_name = "sequence_0"
            else:
                # Other sequences use category vocabulary
                if custom_sparse_features and "category" in custom_sparse_features:
                    seq_vocab = custom_sparse_features["category"]
                    seq = np.random.randint(0, seq_vocab, seq_len).tolist()
                    seq_name = "hist_categories" if i == 1 else f"sequence_{i}"
                else:
                    seq_vocab = sparse_vocab_size
                    seq = np.random.randint(0, seq_vocab, seq_len).tolist()
                    seq_name = f"sequence_{i}"

            # Padding
            seq = seq + [0] * (sequence_max_len - len(seq))
            sequences.append(seq)

        data[seq_name] = sequences
        sequence_names.append(seq_name)
        sequence_vocabs.append(seq_vocab)

    if "gender" in data and "dense_0" in data:
        # Complex label generation with feature correlation
        label_probs = 1 / (
            1
            + np.exp(
                -(
                    data["dense_0"] * 0.3
                    + data["dense_1"] * 0.2
                    + (data["gender"] - 0.5) * 0.5
                    + np.random.randn(n_samples) * 0.1
                )
            )
        )
        data["label"] = (label_probs > 0.5).astype(np.float32)
    else:
        data["label"] = np.random.randint(0, 2, n_samples).astype(np.float32)

    df = pd.DataFrame(data)
    print(f"Generated data shape: {df.shape}")
    if "gender" in data:
        print(f"Positive rate: {data['label'].mean():.4f}")

    # Import here to avoid circular import
    from nextrec.basic.features import DenseFeature, SparseFeature, SequenceFeature

    # Create feature definitions
    # Use input_dim for dense features to be compatible with both simple and complex scenarios
    dense_features = [
        DenseFeature(name=f"dense_{i}", input_dim=1) for i in range(n_dense)
    ]

    # Create sparse features
    sparse_features = [
        SparseFeature(
            name="user_id",
            embedding_name="user_emb",
            vocab_size=user_vocab_size,
            embedding_dim=embedding_dim,
        ),
        SparseFeature(
            name="item_id",
            embedding_name="item_emb",
            vocab_size=item_vocab_size,
            embedding_dim=embedding_dim,
        ),
    ]

    if custom_sparse_features:
        # Add custom sparse features with proper vocab sizes
        for feat_name, vocab_size in custom_sparse_features.items():
            sparse_features.append(
                SparseFeature(
                    name=feat_name,
                    embedding_name=f"{feat_name}_emb",
                    vocab_size=vocab_size,
                    embedding_dim=embedding_dim,
                )
            )
    else:
        # Add generic sparse features
        sparse_features.extend(
            [
                SparseFeature(
                    name=f"sparse_{i}",
                    embedding_name=f"sparse_{i}_emb",
                    vocab_size=sparse_vocab_size,
                    embedding_dim=embedding_dim,
                )
                for i in range(n_sparse - 2)
            ]
        )

    # Create sequence features
    sequence_features = []
    for i, (seq_name, seq_vocab) in enumerate(zip(sequence_names, sequence_vocabs)):
        if i == 0:
            # First sequence shares embedding with item_id
            embedding_name = "item_emb"
        elif (
            custom_sparse_features
            and "category" in custom_sparse_features
            and seq_name == "hist_categories"
        ):
            # hist_categories shares embedding with category
            embedding_name = "category_emb"
        else:
            # Other sequences share with sparse_0
            embedding_name = "sparse_0_emb"
        sequence_features.append(
            SequenceFeature(
                name=seq_name,
                vocab_size=seq_vocab,
                max_len=sequence_max_len,
                embedding_dim=embedding_dim,
                padding_idx=0,
                embedding_name=embedding_name,
            )
        )
    return df, dense_features, sparse_features, sequence_features
```
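To make the new generator concrete, here is a minimal usage sketch; it is not part of the diff and assumes nextrec 0.4.2 is installed with the signatures exactly as above:

```python
# Usage sketch (not from the package): default path, no custom_sparse_features.
from nextrec.utils.synthetic_data import generate_ranking_data

df, dense_feats, sparse_feats, seq_feats = generate_ranking_data(
    n_samples=1_000,
    n_dense=3,
    n_sparse=5,      # yields user_id, item_id and sparse_0..sparse_2
    n_sequences=2,   # yields sequence_0 (item vocab) and sequence_1 (generic vocab)
    seed=7,
)
print(df.shape)  # (1000, 11): 3 dense + 5 sparse + 2 sequence columns + label
```

The module continues with a two-tower generator for retrieval tasks: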
```python
def generate_match_data(
    n_samples: int = 10000,
    user_vocab_size: int = 1000,
    item_vocab_size: int = 5000,
    category_vocab_size: int = 100,
    brand_vocab_size: int = 200,
    city_vocab_size: int = 100,
    user_feature_vocab_size: int = 50,
    item_feature_vocab_size: int = 50,
    sequence_max_len: int = 50,
    user_embedding_dim: int = 32,
    item_embedding_dim: int = 32,
    seed: int = 42,
) -> Tuple[pd.DataFrame, List, List, List, List, List, List]:
    """
    Generate synthetic data for match/retrieval tasks

    Returns:
        tuple: (dataframe, user_dense_features, user_sparse_features, user_sequence_features,
                item_dense_features, item_sparse_features, item_sequence_features)
    """
    print(f"Generating {n_samples} synthetic match samples...")

    np.random.seed(seed)
    data = {}

    # User features
    data["user_id"] = np.random.randint(1, user_vocab_size, n_samples)
    data["user_age"] = np.random.randn(n_samples).astype(np.float32)
    data["user_gender"] = np.random.randint(0, 2, n_samples)
    data["user_city"] = np.random.randint(0, city_vocab_size, n_samples)

    for i in range(3):
        data[f"user_feature_{i}"] = np.random.randint(
            1, user_feature_vocab_size, n_samples
        )

    # User behavior sequences
    user_hist_items = []
    user_hist_categories = []
    for _ in range(n_samples):
        seq_len = np.random.randint(10, sequence_max_len + 1)
        hist_items = np.random.randint(1, item_vocab_size, seq_len).tolist()
        hist_items = hist_items + [0] * (sequence_max_len - len(hist_items))
        user_hist_items.append(hist_items)

        hist_cats = np.random.randint(1, category_vocab_size, seq_len).tolist()
        hist_cats = hist_cats + [0] * (sequence_max_len - len(hist_cats))
        user_hist_categories.append(hist_cats)

    data["user_hist_items"] = user_hist_items
    data["user_hist_categories"] = user_hist_categories

    # Item features
    data["item_id"] = np.random.randint(1, item_vocab_size, n_samples)
    data["item_price"] = np.random.randn(n_samples).astype(np.float32)
    data["item_category"] = np.random.randint(1, category_vocab_size, n_samples)
    data["item_brand"] = np.random.randint(1, brand_vocab_size, n_samples)

    for i in range(3):
        data[f"item_feature_{i}"] = np.random.randint(
            1, item_feature_vocab_size, n_samples
        )

    # Generate labels with some correlation to features
    label_probs = 1 / (
        1
        + np.exp(
            -(
                data["user_age"] * 0.2
                + (data["user_gender"] - 0.5) * 0.3
                + data["item_price"] * 0.15
                + np.random.randn(n_samples) * 0.5
            )
        )
    )
    data["label"] = (label_probs > 0.5).astype(np.float32)

    df = pd.DataFrame(data)
    print(f"Generated data shape: {df.shape}")
    print(f"Positive rate: {data['label'].mean():.4f}")

    # Import here to avoid circular import
    from nextrec.basic.features import DenseFeature, SparseFeature, SequenceFeature

    # User dense features
    user_dense_features = [DenseFeature(name="user_age", input_dim=1)]

    # User sparse features
    user_sparse_features = [
        SparseFeature(
            name="user_id", vocab_size=user_vocab_size, embedding_dim=user_embedding_dim
        ),
        SparseFeature(name="user_gender", vocab_size=2, embedding_dim=8),
        SparseFeature(name="user_city", vocab_size=city_vocab_size, embedding_dim=16),
    ]
    user_sparse_features.extend(
        [
            SparseFeature(
                name=f"user_feature_{i}",
                vocab_size=user_feature_vocab_size,
                embedding_dim=8,
            )
            for i in range(3)
        ]
    )

    # User sequence features
    user_sequence_features = [
        SequenceFeature(
            name="user_hist_items",
            vocab_size=item_vocab_size,
            max_len=sequence_max_len,
            embedding_dim=user_embedding_dim,
            padding_idx=0,
        ),
        SequenceFeature(
            name="user_hist_categories",
            vocab_size=category_vocab_size,
            max_len=sequence_max_len,
            embedding_dim=16,
            padding_idx=0,
        ),
    ]

    # Item dense features
    item_dense_features = [DenseFeature(name="item_price", input_dim=1)]

    # Item sparse features
    item_sparse_features = [
        SparseFeature(
            name="item_id", vocab_size=item_vocab_size, embedding_dim=item_embedding_dim
        ),
        SparseFeature(
            name="item_category", vocab_size=category_vocab_size, embedding_dim=16
        ),
        SparseFeature(name="item_brand", vocab_size=brand_vocab_size, embedding_dim=16),
    ]
    item_sparse_features.extend(
        [
            SparseFeature(
                name=f"item_feature_{i}",
                vocab_size=item_feature_vocab_size,
                embedding_dim=8,
            )
            for i in range(3)
        ]
    )

    # Item sequence features (empty for most match models)
    item_sequence_features = []

    return (
        df,
        user_dense_features,
        user_sparse_features,
        user_sequence_features,
        item_dense_features,
        item_sparse_features,
        item_sequence_features,
    )
```
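The seven-element return value maps directly onto a user tower and an item tower; a sketch of unpacking it (again not part of the diff, assuming the code above):

```python
# Usage sketch (not from the package): split features by tower for a DSSM-style model.
from nextrec.utils.synthetic_data import generate_match_data

(
    df,
    user_dense, user_sparse, user_seq,
    item_dense, item_sparse, item_seq,
) = generate_match_data(n_samples=2_000, seed=7)

assert item_seq == []  # the item tower carries no sequence features here
assert {"user_hist_items", "user_hist_categories", "label"}.issubset(df.columns)
```

Next comes the multi-task generator: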
```python
def generate_multitask_data(
    n_samples: int = 10000,
    n_dense: int = 5,
    n_sparse: int = 8,
    n_sequences: int = 2,
    user_vocab_size: int = 1000,
    item_vocab_size: int = 500,
    sparse_vocab_size: int = 50,
    sequence_max_len: int = 20,
    embedding_dim: int = 16,
    seed: int = 42,
) -> Tuple[pd.DataFrame, List, List, List]:
    """
    Generate synthetic data for multi-task learning

    Returns:
        tuple: (dataframe, dense_features, sparse_features, sequence_features)
    """
    print(f"Generating {n_samples} synthetic multi-task samples...")

    np.random.seed(seed)
    data = {}

    # Generate dense features
    for i in range(n_dense):
        data[f"dense_{i}"] = np.random.randn(n_samples).astype(np.float32)

    # Generate sparse features
    data["user_id"] = np.random.randint(1, user_vocab_size, n_samples)
    data["item_id"] = np.random.randint(1, item_vocab_size, n_samples)

    for i in range(n_sparse - 2):
        data[f"sparse_{i}"] = np.random.randint(1, sparse_vocab_size, n_samples)

    # Generate sequence features
    sequence_names = []
    sequence_vocabs = []

    for i in range(n_sequences):
        sequences = []
        for _ in range(n_samples):
            seq_len = np.random.randint(5, sequence_max_len + 1)
            if i == 0:
                seq = np.random.randint(0, item_vocab_size, seq_len).tolist()
                seq_vocab = item_vocab_size
                seq_name = "sequence_0"
            else:
                seq = np.random.randint(0, sparse_vocab_size, seq_len).tolist()
                seq_vocab = sparse_vocab_size
                seq_name = f"sequence_{i}"

            seq = seq + [0] * (sequence_max_len - len(seq))
            sequences.append(seq)

        data[seq_name] = sequences
        sequence_names.append(seq_name)
        sequence_vocabs.append(seq_vocab)

    # Generate multi-task labels with correlation
    # CTR (click) is relatively easier to predict
    ctr_logits = (
        data["dense_0"] * 0.3 + data["dense_1"] * 0.2 + np.random.randn(n_samples) * 0.5
    )
    data["click"] = (1 / (1 + np.exp(-ctr_logits)) > 0.5).astype(np.float32)

    # CVR (conversion) depends on click and is harder
    cvr_logits = (
        data["dense_2"] * 0.2
        + data["dense_3"] * 0.15
        + data["click"] * 1.5  # Strong dependency on click
        + np.random.randn(n_samples) * 0.8
    )
    data["conversion"] = (1 / (1 + np.exp(-cvr_logits)) > 0.3).astype(np.float32)

    # CTCVR = click AND conversion
    data["ctcvr"] = (data["click"] * data["conversion"]).astype(np.float32)

    df = pd.DataFrame(data)
    print(f"Generated data shape: {df.shape}")
    print(f"Click rate: {data['click'].mean():.4f}")
    print(f"Conversion rate (overall): {data['conversion'].mean():.4f}")
    if data["click"].sum() > 0:
        print(
            f"Conversion rate (given click): {data['conversion'][data['click'] == 1].mean():.4f}"
        )
    print(f"CTCVR rate: {data['ctcvr'].mean():.4f}")

    # Import here to avoid circular import
    from nextrec.basic.features import DenseFeature, SparseFeature, SequenceFeature

    # Create feature definitions
    dense_features = [
        DenseFeature(name=f"dense_{i}", input_dim=1) for i in range(n_dense)
    ]

    # Create sparse features
    sparse_features = [
        SparseFeature(
            name="user_id",
            embedding_name="user_emb",
            vocab_size=user_vocab_size,
            embedding_dim=embedding_dim,
        ),
        SparseFeature(
            name="item_id",
            embedding_name="item_emb",
            vocab_size=item_vocab_size,
            embedding_dim=embedding_dim,
        ),
    ]
    sparse_features.extend(
        [
            SparseFeature(
                name=f"sparse_{i}",
                embedding_name=f"sparse_{i}_emb",
                vocab_size=sparse_vocab_size,
                embedding_dim=embedding_dim,
            )
            for i in range(n_sparse - 2)
        ]
    )

    # Create sequence features
    sequence_features = []
    for i, (seq_name, seq_vocab) in enumerate(zip(sequence_names, sequence_vocabs)):
        if i == 0:
            embedding_name = "item_emb"
        else:
            embedding_name = "sparse_0_emb"
        sequence_features.append(
            SequenceFeature(
                name=seq_name,
                vocab_size=seq_vocab,
                max_len=sequence_max_len,
                embedding_dim=embedding_dim,
                padding_idx=0,
                embedding_name=embedding_name,
            )
        )

    return df, dense_features, sparse_features, sequence_features
```
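The three targets follow the ESMM convention, where CTCVR is the conjunction of click and conversion; a quick sanity check of that invariant (sketch only, not part of the diff):

```python
# Usage sketch (not from the package): verify the ESMM-style label structure.
from nextrec.utils.synthetic_data import generate_multitask_data

df, dense_feats, sparse_feats, seq_feats = generate_multitask_data(n_samples=5_000)
assert (df["ctcvr"] == df["click"] * df["conversion"]).all()
assert df["ctcvr"].mean() <= df["click"].mean()  # CTCVR can never exceed CTR
```

The file closes with a convenience wrapper for the distributed-training examples: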
```python
def generate_distributed_ranking_data(
    num_samples: int = 100000,
    num_users: int = 10000,
    num_items: int = 5000,
    num_categories: int = 20,
    num_cities: int = 100,
    max_seq_len: int = 50,
    embedding_dim: int = 32,
    seed: int = 42,
) -> Tuple[pd.DataFrame, List, List, List]:
    """
    Generate synthetic data for distributed training scenarios

    Returns:
        tuple: (dataframe, dense_features, sparse_features, sequence_features)
    """
    return generate_ranking_data(
        n_samples=num_samples,
        n_dense=5,
        n_sparse=6,  # user_id, item_id + 4 custom features
        n_sequences=2,
        user_vocab_size=num_users + 1,
        item_vocab_size=num_items + 1,
        sequence_max_len=max_seq_len,
        embedding_dim=embedding_dim,
        seed=seed,
        custom_sparse_features={
            "gender": 2,
            "age_group": 7,
            "category": num_categories,
            "city": num_cities,
        },
        use_simple_names=False,
    )
```
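Because the wrapper fixes `custom_sparse_features`, the named demographic columns and the `hist_*` sequences are guaranteed to appear; a sketch (not part of the diff):

```python
# Usage sketch (not from the package): the wrapper delegates to generate_ranking_data.
from nextrec.utils.synthetic_data import generate_distributed_ranking_data

df, dense_feats, sparse_feats, seq_feats = generate_distributed_ranking_data(
    num_samples=10_000, num_users=500, num_items=300
)
assert {"gender", "age_group", "category", "city"}.issubset(df.columns)
assert {"hist_items", "hist_categories"}.issubset(df.columns)
```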
nextrec/utils/tensor.py
CHANGED

```diff
@@ -6,56 +6,67 @@ Author: Yang Zhou, zyaztec@gmail.com
 """
 
 import torch
-import numpy as np
 from typing import Any
 
 
 def to_tensor(
-    value: Any,
-    dtype: torch.dtype,
-    device: torch.device | str | None = None
+    value: Any, dtype: torch.dtype, device: torch.device | str | None = None
 ) -> torch.Tensor:
     if value is None:
         raise ValueError("[Tensor Utils Error] Cannot convert None to tensor.")
     tensor = value if isinstance(value, torch.Tensor) else torch.as_tensor(value)
     if tensor.dtype != dtype:
         tensor = tensor.to(dtype=dtype)
-
+
     if device is not None:
-        target_device = device if isinstance(device, torch.device) else torch.device(device)
+        target_device = (
+            device if isinstance(device, torch.device) else torch.device(device)
+        )
         if tensor.device != target_device:
             tensor = tensor.to(target_device)
     return tensor
 
+
 def stack_tensors(tensors: list[torch.Tensor], dim: int = 0) -> torch.Tensor:
     if not tensors:
         raise ValueError("[Tensor Utils Error] Cannot stack empty list of tensors.")
     return torch.stack(tensors, dim=dim)
 
+
 def concat_tensors(tensors: list[torch.Tensor], dim: int = 0) -> torch.Tensor:
     if not tensors:
-        raise ValueError("[Tensor Utils Error] Cannot concatenate empty list of tensors.")
+        raise ValueError(
+            "[Tensor Utils Error] Cannot concatenate empty list of tensors."
+        )
     return torch.cat(tensors, dim=dim)
 
+
 def pad_sequence_tensors(
     tensors: list[torch.Tensor],
     max_len: int | None = None,
     padding_value: float = 0.0,
-    padding_side: str = 'right',
+    padding_side: str = "right",
 ) -> torch.Tensor:
     if not tensors:
         raise ValueError("[Tensor Utils Error] Cannot pad empty list of tensors.")
     if max_len is None:
         max_len = max(t.size(0) for t in tensors)
     batch_size = len(tensors)
-    padded = torch.full(
-        (batch_size, max_len), padding_value, dtype=tensors[0].dtype, device=tensors[0].device)
+    padded = torch.full(
+        (batch_size, max_len),
+        padding_value,
+        dtype=tensors[0].dtype,
+        device=tensors[0].device,
+    )
+
     for i, tensor in enumerate(tensors):
         length = min(tensor.size(0), max_len)
-        if padding_side == 'right':
+        if padding_side == "right":
             padded[i, :length] = tensor[:length]
-        elif padding_side == 'left':
+        elif padding_side == "left":
             padded[i, -length:] = tensor[:length]
         else:
-            raise ValueError(f"[Tensor Utils Error] padding_side must be 'right' or 'left', got {padding_side}")
+            raise ValueError(
+                f"[Tensor Utils Error] padding_side must be 'right' or 'left', got {padding_side}"
+            )
     return padded
```
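The tensor.py changes are formatting-only, apart from dropping the apparently unused numpy import, so behavior is unchanged; for reference, a sketch of the padding helper (not part of the diff, assuming the module path matches the file location):

```python
# Usage sketch (not from the package): right- vs. left-padding with pad_sequence_tensors.
import torch
from nextrec.utils.tensor import pad_sequence_tensors, to_tensor

seqs = [torch.tensor([1, 2, 3]), torch.tensor([4])]
print(pad_sequence_tensors(seqs, max_len=4))                       # [[1, 2, 3, 0], [4, 0, 0, 0]]
print(pad_sequence_tensors(seqs, max_len=4, padding_side="left"))  # [[0, 1, 2, 3], [0, 0, 0, 4]]

x = to_tensor([1, 2], dtype=torch.float32, device="cpu")  # coerces dtype and device
```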
{nextrec-0.3.6.dist-info → nextrec-0.4.2.dist-info}/METADATA
CHANGED

````diff
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: nextrec
-Version: 0.3.6
+Version: 0.4.2
 Summary: A comprehensive recommendation library with match, ranking, and multi-task learning models
 Project-URL: Homepage, https://github.com/zerolovesea/NextRec
 Project-URL: Repository, https://github.com/zerolovesea/NextRec
@@ -55,7 +55,7 @@ Requires-Dist: seaborn>=0.12.0; extra == 'dev'
 Description-Content-Type: text/markdown
 
 <p align="center">
-  <img align="center" src="
+  <img align="center" src="assets/logo.png" width="40%">
 <p>
 
 <div align="center">
@@ -63,7 +63,7 @@ Description-Content-Type: text/markdown
 
 
 
-
 
 English | [中文文档](README_zh.md)
 
@@ -86,7 +86,7 @@ NextRec is a modern recommendation framework built on PyTorch, delivering a unif
 
 NextRec adopts a modular and low-coupling engineering design, enabling full-pipeline reusability and scalability across data processing → model construction → training & evaluation → inference & deployment. Its core components include: a Feature-Spec-driven Embedding architecture, the BaseModel abstraction, a set of independent reusable Layers, a unified DataLoader for both training and inference, and a ready-to-use Model Zoo.
 
-
 
 > The project borrows ideas from excellent open-source rec libraries. Early layers referenced [torch-rechub](https://github.com/datawhalechina/torch-rechub) but have been replaced with in-house implementations. torch-rechub remains mature in architecture and models; the author contributed a bit there—feel free to check it out.
 
@@ -110,7 +110,7 @@ To dive deeper, Jupyter notebooks are available:
 - [Hands on the NextRec framework](/tutorials/notebooks/en/Hands%20on%20nextrec.ipynb)
 - [Using the data processor for preprocessing](/tutorials/notebooks/en/Hands%20on%20dataprocessor.ipynb)
 
-> Current version [0.3.6]:
+> Current version [0.4.2]: the matching module is not fully polished yet and may have compatibility issues or unexpected errors. Please raise an issue if you run into problems.
@@ -196,6 +196,16 @@ metrics = model.evaluate(
 )
 ```
 
+## Platform Compatibility
+
+The current version is 0.4.2. All models and test code have been validated on the following platforms. If you encounter compatibility issues, please report them in the issue tracker with your system version:
+
+| Platform | Configuration |
+|----------|---------------|
+| MacOS latest | MacBook Pro M4 Pro 24GB RAM |
+| Ubuntu latest | AutoDL 4070D Dual GPU |
+| CentOS 7 | Intel Xeon 5138Y 96 cores 377GB RAM |
+
 ---
 
 ## Supported Models
````