replay_rec-0.20.1rc0-py3-none-any.whl → replay_rec-0.20.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (61)
  1. replay/__init__.py +1 -1
  2. {replay_rec-0.20.1rc0.dist-info → replay_rec-0.20.2.dist-info}/METADATA +18 -12
  3. {replay_rec-0.20.1rc0.dist-info → replay_rec-0.20.2.dist-info}/RECORD +6 -61
  4. replay/experimental/__init__.py +0 -0
  5. replay/experimental/metrics/__init__.py +0 -62
  6. replay/experimental/metrics/base_metric.py +0 -603
  7. replay/experimental/metrics/coverage.py +0 -97
  8. replay/experimental/metrics/experiment.py +0 -175
  9. replay/experimental/metrics/hitrate.py +0 -26
  10. replay/experimental/metrics/map.py +0 -30
  11. replay/experimental/metrics/mrr.py +0 -18
  12. replay/experimental/metrics/ncis_precision.py +0 -31
  13. replay/experimental/metrics/ndcg.py +0 -49
  14. replay/experimental/metrics/precision.py +0 -22
  15. replay/experimental/metrics/recall.py +0 -25
  16. replay/experimental/metrics/rocauc.py +0 -49
  17. replay/experimental/metrics/surprisal.py +0 -90
  18. replay/experimental/metrics/unexpectedness.py +0 -76
  19. replay/experimental/models/__init__.py +0 -50
  20. replay/experimental/models/admm_slim.py +0 -257
  21. replay/experimental/models/base_neighbour_rec.py +0 -200
  22. replay/experimental/models/base_rec.py +0 -1386
  23. replay/experimental/models/base_torch_rec.py +0 -234
  24. replay/experimental/models/cql.py +0 -454
  25. replay/experimental/models/ddpg.py +0 -932
  26. replay/experimental/models/dt4rec/__init__.py +0 -0
  27. replay/experimental/models/dt4rec/dt4rec.py +0 -189
  28. replay/experimental/models/dt4rec/gpt1.py +0 -401
  29. replay/experimental/models/dt4rec/trainer.py +0 -127
  30. replay/experimental/models/dt4rec/utils.py +0 -264
  31. replay/experimental/models/extensions/spark_custom_models/__init__.py +0 -0
  32. replay/experimental/models/extensions/spark_custom_models/als_extension.py +0 -792
  33. replay/experimental/models/hierarchical_recommender.py +0 -331
  34. replay/experimental/models/implicit_wrap.py +0 -131
  35. replay/experimental/models/lightfm_wrap.py +0 -303
  36. replay/experimental/models/mult_vae.py +0 -332
  37. replay/experimental/models/neural_ts.py +0 -986
  38. replay/experimental/models/neuromf.py +0 -406
  39. replay/experimental/models/scala_als.py +0 -293
  40. replay/experimental/models/u_lin_ucb.py +0 -115
  41. replay/experimental/nn/data/__init__.py +0 -1
  42. replay/experimental/nn/data/schema_builder.py +0 -102
  43. replay/experimental/preprocessing/__init__.py +0 -3
  44. replay/experimental/preprocessing/data_preparator.py +0 -839
  45. replay/experimental/preprocessing/padder.py +0 -229
  46. replay/experimental/preprocessing/sequence_generator.py +0 -208
  47. replay/experimental/scenarios/__init__.py +0 -1
  48. replay/experimental/scenarios/obp_wrapper/__init__.py +0 -8
  49. replay/experimental/scenarios/obp_wrapper/obp_optuna_objective.py +0 -74
  50. replay/experimental/scenarios/obp_wrapper/replay_offline.py +0 -261
  51. replay/experimental/scenarios/obp_wrapper/utils.py +0 -85
  52. replay/experimental/scenarios/two_stages/__init__.py +0 -0
  53. replay/experimental/scenarios/two_stages/reranker.py +0 -117
  54. replay/experimental/scenarios/two_stages/two_stages_scenario.py +0 -757
  55. replay/experimental/utils/__init__.py +0 -0
  56. replay/experimental/utils/logger.py +0 -24
  57. replay/experimental/utils/model_handler.py +0 -186
  58. replay/experimental/utils/session_handler.py +0 -44
  59. {replay_rec-0.20.1rc0.dist-info → replay_rec-0.20.2.dist-info}/WHEEL +0 -0
  60. {replay_rec-0.20.1rc0.dist-info → replay_rec-0.20.2.dist-info}/licenses/LICENSE +0 -0
  61. {replay_rec-0.20.1rc0.dist-info → replay_rec-0.20.2.dist-info}/licenses/NOTICE +0 -0
replay/experimental/utils/logger.py
@@ -1,24 +0,0 @@
- import logging
-
-
- def get_logger(
-     name,
-     level=logging.INFO,
-     format_str="%(asctime)s [%(pathname)s:%(lineno)s - %(levelname)s ] %(message)s",
-     date_format="%Y-%m-%d %H:%M:%S",
-     file=False,
- ):
-     """
-     Get python logger instance
-     """
-     logger = logging.getLogger(name)
-     logger.setLevel(level)
-
-     if not logger.hasHandlers():
-         handler = logging.StreamHandler() if not file else logging.FileHandler(name)
-         handler.setLevel(level)
-         formatter = logging.Formatter(fmt=format_str, datefmt=date_format)
-         handler.setFormatter(formatter)
-         logger.addHandler(handler)
-
-     return logger
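For context, a minimal sketch of how the removed logger helper was typically used, based only on the deleted code above (the logger names and messages are illustrative):

import logging

from replay.experimental.utils.logger import get_logger  # module removed in 0.20.2

# Console logger with the default format string
logger = get_logger("replay.experiment", level=logging.DEBUG)
logger.info("training started")

# file=True attaches a FileHandler that writes to a file named after the logger
file_logger = get_logger("experiment.log", file=True)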
replay/experimental/utils/model_handler.py
@@ -1,186 +0,0 @@
- import json
- from inspect import getfullargspec
- from os.path import join
- from pathlib import Path
- from typing import Union
-
- from replay.experimental.models.base_rec import BaseRecommender
- from replay.experimental.preprocessing import Indexer
- from replay.utils import PYSPARK_AVAILABLE
- from replay.utils.session_handler import State
- from replay.utils.spark_utils import load_pickled_from_parquet, save_picklable_to_parquet
-
- if PYSPARK_AVAILABLE:
-     import pyspark.sql.types as st
-     from pyspark.ml.feature import IndexToString, StringIndexerModel
-     from pyspark.sql import SparkSession
-
-     from replay.utils.model_handler import get_fs
-
-     def get_list_of_paths(spark: SparkSession, dir_path: str):
-         """
-         Returns list of paths to files in the `dir_path`
-
-         :param spark: spark session
-         :param dir_path: path to dir in hdfs or local disk
-         :return: list of paths to files
-         """
-         fs = get_fs(spark)
-         statuses = fs.listStatus(spark._jvm.org.apache.hadoop.fs.Path(dir_path))
-         return [str(f.getPath()) for f in statuses]
-
-
- def save(model: BaseRecommender, path: Union[str, Path], overwrite: bool = False):
-     """
-     Save fitted model to disk as a folder
-
-     :param model: Trained recommender
-     :param path: destination where model files will be stored
-     :return:
-     """
-     if isinstance(path, Path):
-         path = str(path)
-
-     spark = State().session
-
-     fs = get_fs(spark)
-     if not overwrite:
-         is_exists = fs.exists(spark._jvm.org.apache.hadoop.fs.Path(path))
-         if is_exists:
-             msg = f"Path '{path}' already exists. Mode is 'overwrite = False'."
-             raise FileExistsError(msg)
-
-     fs.mkdirs(spark._jvm.org.apache.hadoop.fs.Path(path))
-     model._save_model(join(path, "model"))
-
-     init_args = model._init_args
-     init_args["_model_name"] = str(model)
-     sc = spark.sparkContext
-     df = spark.read.json(sc.parallelize([json.dumps(init_args)]))
-     df.coalesce(1).write.mode("overwrite").option("ignoreNullFields", "false").json(join(path, "init_args.json"))
-
-     dataframes = model._dataframes
-     df_path = join(path, "dataframes")
-     for name, df in dataframes.items():
-         if df is not None:
-             df.write.mode("overwrite").parquet(join(df_path, name))
-
-     if hasattr(model, "fit_users"):
-         model.fit_users.write.mode("overwrite").parquet(join(df_path, "fit_users"))
-     if hasattr(model, "fit_items"):
-         model.fit_items.write.mode("overwrite").parquet(join(df_path, "fit_items"))
-     if hasattr(model, "study"):
-         save_picklable_to_parquet(model.study, join(path, "study"))
-
-
- def load(path: str, model_type=None) -> BaseRecommender:
-     """
-     Load saved model from disk
-
-     :param path: path to model folder
-     :return: Restored trained model
-     """
-     spark = State().session
-     args = spark.read.json(join(path, "init_args.json")).first().asDict(recursive=True)
-     name = args["_model_name"]
-     del args["_model_name"]
-
-     model_class = model_type if model_type is not None else globals()[name]
-     if name == "CQL":
-         for a in args:
-             if isinstance(args[a], dict) and "type" in args[a] and args[a]["type"] == "none":
-                 args[a]["params"] = {}
-         init_args = getfullargspec(model_class.__init__).args
-         init_args.remove("self")
-         extra_args = set(args) - set(init_args)
-         if len(extra_args) > 0:
-             extra_args = {key: args[key] for key in args}
-             init_args = {key: args[key] for key in init_args}
-     else:
-         init_args = args
-         extra_args = {}
-
-     model = model_class(**init_args)
-     for arg in extra_args:
-         model.arg = extra_args[arg]
-
-     dataframes_paths = get_list_of_paths(spark, join(path, "dataframes"))
-     for dataframe_path in dataframes_paths:
-         df = spark.read.parquet(dataframe_path)
-         attr_name = dataframe_path.split("/")[-1]
-         setattr(model, attr_name, df)
-
-     model._load_model(join(path, "model"))
-     fs = get_fs(spark)
-     model.study = (
-         load_pickled_from_parquet(join(path, "study"))
-         if fs.exists(spark._jvm.org.apache.hadoop.fs.Path(join(path, "study")))
-         else None
-     )
-
-     return model
-
-
- def save_indexer(indexer: Indexer, path: Union[str, Path], overwrite: bool = False):
-     """
-     Save fitted indexer to disk as a folder
-
-     :param indexer: Trained indexer
-     :param path: destination where indexer files will be stored
-     """
-     if isinstance(path, Path):
-         path = str(path)
-
-     spark = State().session
-
-     if not overwrite:
-         fs = get_fs(spark)
-         is_exists = fs.exists(spark._jvm.org.apache.hadoop.fs.Path(path))
-         if is_exists:
-             msg = f"Path '{path}' already exists. Mode is 'overwrite = False'."
-             raise FileExistsError(msg)
-
-     init_args = indexer._init_args
-     init_args["user_type"] = str(indexer.user_type)
-     init_args["item_type"] = str(indexer.item_type)
-     sc = spark.sparkContext
-     df = spark.read.json(sc.parallelize([json.dumps(init_args)]))
-     df.coalesce(1).write.mode("overwrite").json(join(path, "init_args.json"))
-
-     indexer.user_indexer.write().overwrite().save(join(path, "user_indexer"))
-     indexer.item_indexer.write().overwrite().save(join(path, "item_indexer"))
-     indexer.inv_user_indexer.write().overwrite().save(join(path, "inv_user_indexer"))
-     indexer.inv_item_indexer.write().overwrite().save(join(path, "inv_item_indexer"))
-
-
- def load_indexer(path: str) -> Indexer:
-     """
-     Load saved indexer from disk
-
-     :param path: path to folder
-     :return: restored Indexer
-     """
-     spark = State().session
-     args = spark.read.json(join(path, "init_args.json")).first().asDict()
-
-     user_type = args["user_type"]
-     del args["user_type"]
-     item_type = args["item_type"]
-     del args["item_type"]
-
-     indexer = Indexer(**args)
-
-     if user_type.endswith("()"):
-         user_type = user_type[:-2]
-         item_type = item_type[:-2]
-     user_type = getattr(st, user_type)
-     item_type = getattr(st, item_type)
-     indexer.user_type = user_type()
-     indexer.item_type = item_type()
-
-     indexer.user_indexer = StringIndexerModel.load(join(path, "user_indexer"))
-     indexer.item_indexer = StringIndexerModel.load(join(path, "item_indexer"))
-     indexer.inv_user_indexer = IndexToString.load(join(path, "inv_user_indexer"))
-     indexer.inv_item_indexer = IndexToString.load(join(path, "inv_item_indexer"))
-
-     return indexer
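For context, a hedged sketch of how the removed save/load helpers were typically called; the `model` variable and the destination path are illustrative, and the behaviour is inferred only from the deleted code above:

from replay.experimental.utils.model_handler import load, save  # module removed in 0.20.2

# `model` is assumed to be an already fitted experimental recommender (BaseRecommender subclass)
save(model, "/tmp/replay_model", overwrite=True)  # writes model/, init_args.json and dataframes/

# Restore later, possibly in another session; the class is resolved from the stored "_model_name"
restored = load("/tmp/replay_model")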
replay/experimental/utils/session_handler.py
@@ -1,44 +0,0 @@
- from typing import Optional
-
- import torch
-
- from replay.utils.session_handler import Borg, get_spark_session, logger_with_settings
- from replay.utils.types import PYSPARK_AVAILABLE, MissingImport
-
- if PYSPARK_AVAILABLE:
-     from pyspark.sql import SparkSession
- else:
-     SparkSession = MissingImport
-
-
- class State(Borg):
-     """
-     All modules look for Spark session via this class. You can put your own session here.
-
-     Other parameters are stored here too: ``default device`` for ``pytorch`` (CPU/CUDA)
-     """
-
-     def __init__(
-         self,
-         session: Optional[SparkSession] = None,
-         device: Optional[torch.device] = None,
-     ):
-         Borg.__init__(self)
-         if not hasattr(self, "logger_set"):
-             self.logger = logger_with_settings()
-             self.logger_set = True
-
-         if session is None:
-             if not hasattr(self, "session"):
-                 self.session = get_spark_session()
-         else:
-             self.session = session
-
-         if device is None:
-             if not hasattr(self, "device"):
-                 if torch.cuda.is_available():
-                     self.device = torch.device(f"cuda:{torch.cuda.current_device()}")
-                 else:
-                     self.device = torch.device("cpu")
-         else:
-             self.device = device
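For context, a minimal sketch of how the removed experimental State singleton was typically used, based only on the deleted code above (the injected session and device are illustrative):

from replay.experimental.utils.session_handler import State  # module removed in 0.20.2

# First call creates (or reuses) a Spark session and picks CUDA when available
state = State()
spark = state.session
device = state.device

# A pre-built SparkSession can be injected; thanks to the Borg pattern,
# every later State() call shares the same session and device, e.g.:
# State(session=my_spark_session, device=torch.device("cpu"))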