PyPI - easy-cs-rec-custommodel - Versions diffs - 0.8.6__py2.py3-none-any.whl - Mend

easy-cs-rec-custommodel 0.8.6__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of easy-cs-rec-custommodel might be problematic. Click here for more details.

Files changed (336) hide show

easy_cs_rec_custommodel-0.8.6.dist-info/LICENSE +203 -0
easy_cs_rec_custommodel-0.8.6.dist-info/METADATA +48 -0
easy_cs_rec_custommodel-0.8.6.dist-info/RECORD +336 -0
easy_cs_rec_custommodel-0.8.6.dist-info/WHEEL +6 -0
easy_cs_rec_custommodel-0.8.6.dist-info/top_level.txt +2 -0
easy_rec/__init__.py +114 -0
easy_rec/python/__init__.py +0 -0
easy_rec/python/builders/__init__.py +0 -0
easy_rec/python/builders/hyperparams_builder.py +78 -0
easy_rec/python/builders/loss_builder.py +333 -0
easy_rec/python/builders/optimizer_builder.py +211 -0
easy_rec/python/builders/strategy_builder.py +44 -0
easy_rec/python/compat/__init__.py +0 -0
easy_rec/python/compat/adam_s.py +245 -0
easy_rec/python/compat/array_ops.py +229 -0
easy_rec/python/compat/dynamic_variable.py +542 -0
easy_rec/python/compat/early_stopping.py +653 -0
easy_rec/python/compat/embedding_ops.py +162 -0
easy_rec/python/compat/embedding_parallel_saver.py +316 -0
easy_rec/python/compat/estimator_train.py +116 -0
easy_rec/python/compat/exporter.py +473 -0
easy_rec/python/compat/feature_column/__init__.py +0 -0
easy_rec/python/compat/feature_column/feature_column.py +3675 -0
easy_rec/python/compat/feature_column/feature_column_v2.py +5233 -0
easy_rec/python/compat/feature_column/sequence_feature_column.py +648 -0
easy_rec/python/compat/feature_column/utils.py +154 -0
easy_rec/python/compat/layers.py +329 -0
easy_rec/python/compat/ops.py +14 -0
easy_rec/python/compat/optimizers.py +619 -0
easy_rec/python/compat/queues.py +311 -0
easy_rec/python/compat/regularizers.py +208 -0
easy_rec/python/compat/sok_optimizer.py +440 -0
easy_rec/python/compat/sync_replicas_optimizer.py +528 -0
easy_rec/python/compat/weight_decay_optimizers.py +475 -0
easy_rec/python/core/__init__.py +0 -0
easy_rec/python/core/easyrec_metrics/__init__.py +24 -0
easy_rec/python/core/easyrec_metrics/distribute_metrics_impl_pai.py +3702 -0
easy_rec/python/core/easyrec_metrics/distribute_metrics_impl_tf.py +3768 -0
easy_rec/python/core/learning_schedules.py +228 -0
easy_rec/python/core/metrics.py +402 -0
easy_rec/python/core/sampler.py +844 -0
easy_rec/python/eval.py +102 -0
easy_rec/python/export.py +150 -0
easy_rec/python/feature_column/__init__.py +0 -0
easy_rec/python/feature_column/feature_column.py +664 -0
easy_rec/python/feature_column/feature_group.py +89 -0
easy_rec/python/hpo/__init__.py +0 -0
easy_rec/python/hpo/emr_hpo.py +140 -0
easy_rec/python/hpo/generate_hpo_sql.py +71 -0
easy_rec/python/hpo/pai_hpo.py +297 -0
easy_rec/python/inference/__init__.py +0 -0
easy_rec/python/inference/csv_predictor.py +189 -0
easy_rec/python/inference/hive_parquet_predictor.py +200 -0
easy_rec/python/inference/hive_predictor.py +166 -0
easy_rec/python/inference/odps_predictor.py +70 -0
easy_rec/python/inference/parquet_predictor.py +147 -0
easy_rec/python/inference/parquet_predictor_v2.py +147 -0
easy_rec/python/inference/predictor.py +621 -0
easy_rec/python/inference/processor/__init__.py +0 -0
easy_rec/python/inference/processor/test.py +170 -0
easy_rec/python/inference/vector_retrieve.py +124 -0
easy_rec/python/input/__init__.py +0 -0
easy_rec/python/input/batch_tfrecord_input.py +117 -0
easy_rec/python/input/criteo_binary_reader.py +259 -0
easy_rec/python/input/criteo_input.py +107 -0
easy_rec/python/input/csv_input.py +175 -0
easy_rec/python/input/csv_input_ex.py +72 -0
easy_rec/python/input/csv_input_v2.py +68 -0
easy_rec/python/input/datahub_input.py +320 -0
easy_rec/python/input/dummy_input.py +58 -0
easy_rec/python/input/hive_input.py +123 -0
easy_rec/python/input/hive_parquet_input.py +140 -0
easy_rec/python/input/hive_rtp_input.py +174 -0
easy_rec/python/input/input.py +1064 -0
easy_rec/python/input/kafka_dataset.py +144 -0
easy_rec/python/input/kafka_input.py +235 -0
easy_rec/python/input/load_parquet.py +317 -0
easy_rec/python/input/odps_input.py +101 -0
easy_rec/python/input/odps_input_v2.py +110 -0
easy_rec/python/input/odps_input_v3.py +132 -0
easy_rec/python/input/odps_rtp_input.py +187 -0
easy_rec/python/input/odps_rtp_input_v2.py +104 -0
easy_rec/python/input/parquet_input.py +397 -0
easy_rec/python/input/parquet_input_v2.py +180 -0
easy_rec/python/input/parquet_input_v3.py +203 -0
easy_rec/python/input/rtp_input.py +225 -0
easy_rec/python/input/rtp_input_v2.py +145 -0
easy_rec/python/input/tfrecord_input.py +100 -0
easy_rec/python/layers/__init__.py +0 -0
easy_rec/python/layers/backbone.py +571 -0
easy_rec/python/layers/capsule_layer.py +176 -0
easy_rec/python/layers/cmbf.py +390 -0
easy_rec/python/layers/common_layers.py +192 -0
easy_rec/python/layers/dnn.py +87 -0
easy_rec/python/layers/embed_input_layer.py +25 -0
easy_rec/python/layers/fm.py +26 -0
easy_rec/python/layers/input_layer.py +396 -0
easy_rec/python/layers/keras/__init__.py +34 -0
easy_rec/python/layers/keras/activation.py +114 -0
easy_rec/python/layers/keras/attention.py +267 -0
easy_rec/python/layers/keras/auxiliary_loss.py +47 -0
easy_rec/python/layers/keras/blocks.py +262 -0
easy_rec/python/layers/keras/bst.py +119 -0
easy_rec/python/layers/keras/custom_ops.py +250 -0
easy_rec/python/layers/keras/data_augment.py +133 -0
easy_rec/python/layers/keras/din.py +67 -0
easy_rec/python/layers/keras/einsum_dense.py +598 -0
easy_rec/python/layers/keras/embedding.py +81 -0
easy_rec/python/layers/keras/fibinet.py +251 -0
easy_rec/python/layers/keras/interaction.py +416 -0
easy_rec/python/layers/keras/layer_norm.py +364 -0
easy_rec/python/layers/keras/mask_net.py +166 -0
easy_rec/python/layers/keras/multi_head_attention.py +717 -0
easy_rec/python/layers/keras/multi_task.py +125 -0
easy_rec/python/layers/keras/numerical_embedding.py +376 -0
easy_rec/python/layers/keras/ppnet.py +194 -0
easy_rec/python/layers/keras/transformer.py +192 -0
easy_rec/python/layers/layer_norm.py +51 -0
easy_rec/python/layers/mmoe.py +83 -0
easy_rec/python/layers/multihead_attention.py +162 -0
easy_rec/python/layers/multihead_cross_attention.py +749 -0
easy_rec/python/layers/senet.py +73 -0
easy_rec/python/layers/seq_input_layer.py +134 -0
easy_rec/python/layers/sequence_feature_layer.py +249 -0
easy_rec/python/layers/uniter.py +301 -0
easy_rec/python/layers/utils.py +248 -0
easy_rec/python/layers/variational_dropout_layer.py +130 -0
easy_rec/python/loss/__init__.py +0 -0
easy_rec/python/loss/circle_loss.py +82 -0
easy_rec/python/loss/contrastive_loss.py +79 -0
easy_rec/python/loss/f1_reweight_loss.py +38 -0
easy_rec/python/loss/focal_loss.py +93 -0
easy_rec/python/loss/jrc_loss.py +128 -0
easy_rec/python/loss/listwise_loss.py +161 -0
easy_rec/python/loss/multi_similarity.py +68 -0
easy_rec/python/loss/pairwise_loss.py +307 -0
easy_rec/python/loss/softmax_loss_with_negative_mining.py +110 -0
easy_rec/python/loss/zero_inflated_lognormal.py +76 -0
easy_rec/python/main.py +878 -0
easy_rec/python/model/__init__.py +0 -0
easy_rec/python/model/autoint.py +73 -0
easy_rec/python/model/cmbf.py +47 -0
easy_rec/python/model/collaborative_metric_learning.py +182 -0
easy_rec/python/model/custom_model.py +323 -0
easy_rec/python/model/dat.py +138 -0
easy_rec/python/model/dbmtl.py +116 -0
easy_rec/python/model/dcn.py +70 -0
easy_rec/python/model/deepfm.py +106 -0
easy_rec/python/model/dlrm.py +73 -0
easy_rec/python/model/dropoutnet.py +207 -0
easy_rec/python/model/dssm.py +154 -0
easy_rec/python/model/dssm_senet.py +143 -0
easy_rec/python/model/dummy_model.py +48 -0
easy_rec/python/model/easy_rec_estimator.py +739 -0
easy_rec/python/model/easy_rec_model.py +467 -0
easy_rec/python/model/esmm.py +242 -0
easy_rec/python/model/fm.py +63 -0
easy_rec/python/model/match_model.py +357 -0
easy_rec/python/model/mind.py +445 -0
easy_rec/python/model/mmoe.py +70 -0
easy_rec/python/model/multi_task_model.py +303 -0
easy_rec/python/model/multi_tower.py +62 -0
easy_rec/python/model/multi_tower_bst.py +190 -0
easy_rec/python/model/multi_tower_din.py +130 -0
easy_rec/python/model/multi_tower_recall.py +68 -0
easy_rec/python/model/pdn.py +203 -0
easy_rec/python/model/ple.py +120 -0
easy_rec/python/model/rank_model.py +485 -0
easy_rec/python/model/rocket_launching.py +203 -0
easy_rec/python/model/simple_multi_task.py +54 -0
easy_rec/python/model/uniter.py +46 -0
easy_rec/python/model/wide_and_deep.py +121 -0
easy_rec/python/ops/1.12/incr_record.so +0 -0
easy_rec/python/ops/1.12/kafka.so +0 -0
easy_rec/python/ops/1.12/libcustom_ops.so +0 -0
easy_rec/python/ops/1.12/libembed_op.so +0 -0
easy_rec/python/ops/1.12/libhiredis.so.1.0.0 +0 -0
easy_rec/python/ops/1.12/librdkafka++.so.1 +0 -0
easy_rec/python/ops/1.12/librdkafka.so.1 +0 -0
easy_rec/python/ops/1.12/libredis++.so +0 -0
easy_rec/python/ops/1.12/libredis++.so.1 +0 -0
easy_rec/python/ops/1.12/libredis++.so.1.2.3 +0 -0
easy_rec/python/ops/1.12/libstr_avx_op.so +0 -0
easy_rec/python/ops/1.12/libwrite_sparse_kv.so +0 -0
easy_rec/python/ops/1.15/incr_record.so +0 -0
easy_rec/python/ops/1.15/kafka.so +0 -0
easy_rec/python/ops/1.15/libcustom_ops.so +0 -0
easy_rec/python/ops/1.15/libembed_op.so +0 -0
easy_rec/python/ops/1.15/libhiredis.so.1.0.0 +0 -0
easy_rec/python/ops/1.15/librdkafka++.so +0 -0
easy_rec/python/ops/1.15/librdkafka++.so.1 +0 -0
easy_rec/python/ops/1.15/librdkafka.so +0 -0
easy_rec/python/ops/1.15/librdkafka.so.1 +0 -0
easy_rec/python/ops/1.15/libredis++.so.1 +0 -0
easy_rec/python/ops/1.15/libstr_avx_op.so +0 -0
easy_rec/python/ops/2.12/libcustom_ops.so +0 -0
easy_rec/python/ops/2.12/libload_embed.so +0 -0
easy_rec/python/ops/2.12/libstr_avx_op.so +0 -0
easy_rec/python/ops/__init__.py +0 -0
easy_rec/python/ops/gen_kafka_ops.py +193 -0
easy_rec/python/ops/gen_str_avx_op.py +28 -0
easy_rec/python/ops/incr_record.py +30 -0
easy_rec/python/predict.py +170 -0
easy_rec/python/protos/__init__.py +0 -0
easy_rec/python/protos/autoint_pb2.py +122 -0
easy_rec/python/protos/backbone_pb2.py +1416 -0
easy_rec/python/protos/cmbf_pb2.py +435 -0
easy_rec/python/protos/collaborative_metric_learning_pb2.py +252 -0
easy_rec/python/protos/custom_model_pb2.py +57 -0
easy_rec/python/protos/dat_pb2.py +262 -0
easy_rec/python/protos/data_source_pb2.py +422 -0
easy_rec/python/protos/dataset_pb2.py +1920 -0
easy_rec/python/protos/dbmtl_pb2.py +191 -0
easy_rec/python/protos/dcn_pb2.py +197 -0
easy_rec/python/protos/deepfm_pb2.py +163 -0
easy_rec/python/protos/dlrm_pb2.py +163 -0
easy_rec/python/protos/dnn_pb2.py +329 -0
easy_rec/python/protos/dropoutnet_pb2.py +239 -0
easy_rec/python/protos/dssm_pb2.py +262 -0
easy_rec/python/protos/dssm_senet_pb2.py +282 -0
easy_rec/python/protos/easy_rec_model_pb2.py +1672 -0
easy_rec/python/protos/esmm_pb2.py +133 -0
easy_rec/python/protos/eval_pb2.py +930 -0
easy_rec/python/protos/export_pb2.py +379 -0
easy_rec/python/protos/feature_config_pb2.py +1359 -0
easy_rec/python/protos/fm_pb2.py +90 -0
easy_rec/python/protos/hive_config_pb2.py +138 -0
easy_rec/python/protos/hyperparams_pb2.py +624 -0
easy_rec/python/protos/keras_layer_pb2.py +692 -0
easy_rec/python/protos/layer_pb2.py +1936 -0
easy_rec/python/protos/loss_pb2.py +1713 -0
easy_rec/python/protos/mind_pb2.py +497 -0
easy_rec/python/protos/mmoe_pb2.py +215 -0
easy_rec/python/protos/multi_tower_pb2.py +295 -0
easy_rec/python/protos/multi_tower_recall_pb2.py +198 -0
easy_rec/python/protos/optimizer_pb2.py +2017 -0
easy_rec/python/protos/pdn_pb2.py +293 -0
easy_rec/python/protos/pipeline_pb2.py +516 -0
easy_rec/python/protos/ple_pb2.py +231 -0
easy_rec/python/protos/predict_pb2.py +1140 -0
easy_rec/python/protos/rocket_launching_pb2.py +169 -0
easy_rec/python/protos/seq_encoder_pb2.py +1084 -0
easy_rec/python/protos/simi_pb2.py +54 -0
easy_rec/python/protos/simple_multi_task_pb2.py +97 -0
easy_rec/python/protos/tf_predict_pb2.py +630 -0
easy_rec/python/protos/tower_pb2.py +661 -0
easy_rec/python/protos/train_pb2.py +1197 -0
easy_rec/python/protos/uniter_pb2.py +307 -0
easy_rec/python/protos/variational_dropout_pb2.py +91 -0
easy_rec/python/protos/wide_and_deep_pb2.py +131 -0
easy_rec/python/test/__init__.py +0 -0
easy_rec/python/test/csv_input_test.py +340 -0
easy_rec/python/test/custom_early_stop_func.py +19 -0
easy_rec/python/test/dh_local_run.py +104 -0
easy_rec/python/test/embed_test.py +155 -0
easy_rec/python/test/emr_run.py +119 -0
easy_rec/python/test/eval_metric_test.py +107 -0
easy_rec/python/test/excel_convert_test.py +64 -0
easy_rec/python/test/export_test.py +513 -0
easy_rec/python/test/fg_test.py +70 -0
easy_rec/python/test/hive_input_test.py +311 -0
easy_rec/python/test/hpo_test.py +235 -0
easy_rec/python/test/kafka_test.py +373 -0
easy_rec/python/test/local_incr_test.py +122 -0
easy_rec/python/test/loss_test.py +110 -0
easy_rec/python/test/odps_command.py +61 -0
easy_rec/python/test/odps_local_run.py +86 -0
easy_rec/python/test/odps_run.py +254 -0
easy_rec/python/test/odps_test_cls.py +39 -0
easy_rec/python/test/odps_test_prepare.py +198 -0
easy_rec/python/test/odps_test_util.py +237 -0
easy_rec/python/test/pre_check_test.py +54 -0
easy_rec/python/test/predictor_test.py +394 -0
easy_rec/python/test/rtp_convert_test.py +133 -0
easy_rec/python/test/run.py +138 -0
easy_rec/python/test/train_eval_test.py +1299 -0
easy_rec/python/test/util_test.py +85 -0
easy_rec/python/test/zero_inflated_lognormal_test.py +53 -0
easy_rec/python/tools/__init__.py +0 -0
easy_rec/python/tools/add_boundaries_to_config.py +67 -0
easy_rec/python/tools/add_feature_info_to_config.py +145 -0
easy_rec/python/tools/convert_config_format.py +48 -0
easy_rec/python/tools/convert_rtp_data.py +79 -0
easy_rec/python/tools/convert_rtp_fg.py +106 -0
easy_rec/python/tools/create_config_from_excel.py +427 -0
easy_rec/python/tools/criteo/__init__.py +0 -0
easy_rec/python/tools/criteo/convert_data.py +157 -0
easy_rec/python/tools/edit_lookup_graph.py +134 -0
easy_rec/python/tools/faiss_index_pai.py +116 -0
easy_rec/python/tools/feature_selection.py +316 -0
easy_rec/python/tools/hit_rate_ds.py +223 -0
easy_rec/python/tools/hit_rate_pai.py +138 -0
easy_rec/python/tools/pre_check.py +120 -0
easy_rec/python/tools/predict_and_chk.py +111 -0
easy_rec/python/tools/read_kafka.py +55 -0
easy_rec/python/tools/split_model_pai.py +286 -0
easy_rec/python/tools/split_pdn_model_pai.py +272 -0
easy_rec/python/tools/test_saved_model.py +80 -0
easy_rec/python/tools/view_saved_model.py +39 -0
easy_rec/python/tools/write_kafka.py +65 -0
easy_rec/python/train_eval.py +325 -0
easy_rec/python/utils/__init__.py +15 -0
easy_rec/python/utils/activation.py +120 -0
easy_rec/python/utils/check_utils.py +87 -0
easy_rec/python/utils/compat.py +14 -0
easy_rec/python/utils/config_util.py +652 -0
easy_rec/python/utils/constant.py +43 -0
easy_rec/python/utils/convert_rtp_fg.py +616 -0
easy_rec/python/utils/dag.py +192 -0
easy_rec/python/utils/distribution_utils.py +268 -0
easy_rec/python/utils/ds_util.py +65 -0
easy_rec/python/utils/embedding_utils.py +73 -0
easy_rec/python/utils/estimator_utils.py +1036 -0
easy_rec/python/utils/export_big_model.py +630 -0
easy_rec/python/utils/expr_util.py +118 -0
easy_rec/python/utils/fg_util.py +53 -0
easy_rec/python/utils/hit_rate_utils.py +220 -0
easy_rec/python/utils/hive_utils.py +183 -0
easy_rec/python/utils/hpo_util.py +137 -0
easy_rec/python/utils/hvd_utils.py +56 -0
easy_rec/python/utils/input_utils.py +108 -0
easy_rec/python/utils/io_util.py +282 -0
easy_rec/python/utils/load_class.py +249 -0
easy_rec/python/utils/meta_graph_editor.py +941 -0
easy_rec/python/utils/multi_optimizer.py +62 -0
easy_rec/python/utils/numpy_utils.py +18 -0
easy_rec/python/utils/odps_util.py +79 -0
easy_rec/python/utils/pai_util.py +86 -0
easy_rec/python/utils/proto_util.py +90 -0
easy_rec/python/utils/restore_filter.py +89 -0
easy_rec/python/utils/shape_utils.py +432 -0
easy_rec/python/utils/static_shape.py +71 -0
easy_rec/python/utils/test_utils.py +866 -0
easy_rec/python/utils/tf_utils.py +56 -0
easy_rec/version.py +4 -0
test/__init__.py +0 -0

easy_rec/python/model/__init__.py ADDED Viewed

File without changes

easy_rec/python/model/autoint.py ADDED Viewed

@@ -0,0 +1,73 @@
+# -*- encoding:utf-8 -*-
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import logging
+import tensorflow as tf
+from easy_rec.python.layers import multihead_attention
+from easy_rec.python.model.rank_model import RankModel
+from easy_rec.python.protos.autoint_pb2 import AutoInt as AutoIntConfig  # NOQA
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+class AutoInt(RankModel):
+  def __init__(self,
+               model_config,
+               feature_configs,
+               features,
+               labels=None,
+               is_training=False):
+    super(AutoInt, self).__init__(model_config, feature_configs, features,
+                                  labels, is_training)
+    assert self._model_config.WhichOneof('model') == 'autoint', \
+        'invalid model config: %s' % self._model_config.WhichOneof('model')
+    self._features, _ = self._input_layer(self._feature_dict, 'all')
+    self._feature_num = len(self._model_config.feature_groups[0].feature_names)
+    self._seq_key_num = 0
+    if len(self._model_config.feature_groups[0].sequence_features) > 0:
+      for seq_fea in self._model_config.feature_groups[0].sequence_features:
+        for seq_att in seq_fea.seq_att_map:
+          self._feature_num += len(seq_att.hist_seq)
+          self._seq_key_num += len(seq_att.key)
+    self._model_config = self._model_config.autoint
+    assert isinstance(self._model_config, AutoIntConfig)
+    fea_emb_dim_list = []
+    for feature_config in feature_configs:
+      fea_emb_dim_list.append(feature_config.embedding_dim)
+    assert len(set(fea_emb_dim_list)) == 1 and len(fea_emb_dim_list) == self._feature_num, \
+        'AutoInt requires that all feature dimensions must be consistent.'
+    self._d_model = fea_emb_dim_list[0]
+    self._head_num = self._model_config.multi_head_num
+    self._head_size = self._model_config.multi_head_size
+  def build_predict_graph(self):
+    logging.info('feature_num: {0}'.format(self._feature_num))
+    attention_fea = tf.reshape(
+        self._features,
+        shape=[-1, self._feature_num + self._seq_key_num, self._d_model])
+    for i in range(self._model_config.interacting_layer_num):
+      attention_layer = multihead_attention.MultiHeadAttention(
+          head_num=self._head_num,
+          head_size=self._head_size,
+          l2_reg=self._l2_reg,
+          use_res=True,
+          name='multi_head_self_attention_layer_%d' % i)
+      attention_fea = attention_layer(attention_fea)
+    attention_fea = tf.reshape(
+        attention_fea,
+        shape=[-1, attention_fea.shape[1] * attention_fea.shape[2]])
+    final = tf.layers.dense(attention_fea, self._num_class, name='output')
+    self._add_to_prediction_dict(final)
+    return self._prediction_dict

easy_rec/python/model/cmbf.py ADDED Viewed

@@ -0,0 +1,47 @@
+# -*- encoding:utf-8 -*-
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import tensorflow as tf
+from easy_rec.python.layers import cmbf
+from easy_rec.python.layers import dnn
+from easy_rec.python.model.rank_model import RankModel
+from easy_rec.python.protos.cmbf_pb2 import CMBF as CMBFConfig  # NOQA
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+class CMBF(RankModel):
+  """CMBF: Cross-Modal-Based Fusion Recommendation Algorithm.
+  This is almost an exact implementation of the original CMBF model.
+  See the original paper:
+  https://www.mdpi.com/1424-8220/21/16/5275
+  """
+  def __init__(self,
+               model_config,
+               feature_configs,
+               features,
+               labels=None,
+               is_training=False):
+    super(CMBF, self).__init__(model_config, feature_configs, features, labels,
+                               is_training)
+    assert self._model_config.WhichOneof('model') == 'cmbf', (
+        'invalid model config: %s' % self._model_config.WhichOneof('model'))
+    self._cmbf_layer = cmbf.CMBF(model_config, feature_configs, features,
+                                 self._model_config.cmbf.config,
+                                 self._input_layer)
+    self._model_config = self._model_config.cmbf
+  def build_predict_graph(self):
+    hidden = self._cmbf_layer(self._is_training, l2_reg=self._l2_reg)
+    final_dnn_layer = dnn.DNN(self._model_config.final_dnn, self._l2_reg,
+                              'final_dnn', self._is_training)
+    all_fea = final_dnn_layer(hidden)
+    final = tf.layers.dense(all_fea, self._num_class, name='output')
+    self._add_to_prediction_dict(final)
+    return self._prediction_dict

easy_rec/python/model/collaborative_metric_learning.py ADDED Viewed

@@ -0,0 +1,182 @@
+import tensorflow as tf
+from easy_rec.python.core.metrics import metric_learning_average_precision_at_k
+from easy_rec.python.core.metrics import metric_learning_recall_at_k
+from easy_rec.python.layers import dnn
+from easy_rec.python.layers.common_layers import highway
+from easy_rec.python.loss.circle_loss import circle_loss
+from easy_rec.python.loss.multi_similarity import ms_loss
+from easy_rec.python.model.easy_rec_model import EasyRecModel
+from easy_rec.python.protos.loss_pb2 import LossType
+from easy_rec.python.utils.activation import gelu
+from easy_rec.python.utils.proto_util import copy_obj
+from easy_rec.python.protos.collaborative_metric_learning_pb2 import CoMetricLearningI2I as MetricLearningI2IConfig  # NOQA
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+class CoMetricLearningI2I(EasyRecModel):
+  def __init__(
+      self,
+      model_config,  # pipeline.model_config
+      feature_configs,  # pipeline.feature_configs
+      features,  # same as model_fn input
+      labels=None,
+      is_training=False):
+    super(CoMetricLearningI2I, self).__init__(model_config, feature_configs,
+                                              features, labels, is_training)
+    model = self._model_config.WhichOneof('model')
+    assert model == 'metric_learning', 'invalid model config: %s' % model
+    self._loss_type = self._model_config.loss_type
+    loss_type_name = LossType.Name(self._loss_type).lower()
+    self._model_config = self._model_config.metric_learning
+    assert isinstance(self._model_config, MetricLearningI2IConfig)
+    model_loss = self._model_config.WhichOneof('loss').lower()
+    assert model_loss == loss_type_name, 'invalid loss type: %s' % model_loss
+    if self._loss_type == LossType.CIRCLE_LOSS:
+      self.loss = self._model_config.circle_loss
+    elif self._loss_type == LossType.MULTI_SIMILARITY_LOSS:
+      self.loss = self._model_config.multi_similarity_loss
+    else:
+      raise ValueError('unsupported loss type: %s' %
+                       LossType.Name(self._loss_type))
+    if not self.has_backbone:
+      self._highway_features = {}
+      self._highway_num = len(self._model_config.highway)
+      for _id in range(self._highway_num):
+        highway_cfg = self._model_config.highway[_id]
+        highway_feature, _ = self._input_layer(self._feature_dict,
+                                               highway_cfg.input)
+        self._highway_features[highway_cfg.input] = highway_feature
+      self.input_features = []
+      if self._model_config.HasField('input'):
+        input_feature, _ = self._input_layer(self._feature_dict,
+                                             self._model_config.input)
+        self.input_features.append(input_feature)
+      self.dnn = copy_obj(self._model_config.dnn)
+    if self._labels is not None:
+      if self._model_config.HasField('session_id'):
+        self.session_ids = self._labels.pop(self._model_config.session_id)
+      else:
+        self.session_ids = None
+      assert len(self._labels) > 0
+      self.labels = list(self._labels.values())[0]
+    if self._model_config.HasField('sample_id'):
+      self.sample_id = self._model_config.sample_id
+    else:
+      self.sample_id = None
+  def build_predict_graph(self):
+    if self.has_backbone:
+      tower_emb = self.backbone
+    else:
+      for _id in range(self._highway_num):
+        highway_cfg = self._model_config.highway[_id]
+        highway_fea = tf.layers.batch_normalization(
+            self._highway_features[highway_cfg.input],
+            training=self._is_training,
+            trainable=True,
+            name='highway_%s_bn' % highway_cfg.input)
+        highway_fea = highway(
+            highway_fea,
+            highway_cfg.emb_size,
+            activation=gelu,
+            scope='highway_%s' % _id)
+        print('highway_fea: ', highway_fea)
+        self.input_features.append(highway_fea)
+      feature = tf.concat(self.input_features, axis=1)
+      num_dnn_layer = len(self.dnn.hidden_units)
+      last_hidden = self.dnn.hidden_units.pop()
+      dnn_net = dnn.DNN(self.dnn, self._l2_reg, 'dnn', self._is_training)
+      net_output = dnn_net(feature)
+      tower_emb = tf.layers.dense(
+          inputs=net_output,
+          units=last_hidden,
+          kernel_regularizer=self._l2_reg,
+          name='dnn/dnn_%d' % (num_dnn_layer - 1))
+    if self._model_config.output_l2_normalized_emb:
+      norm_emb = tf.nn.l2_normalize(tower_emb, axis=-1)
+      self._prediction_dict['norm_emb'] = norm_emb
+      self._prediction_dict['norm_embedding'] = tf.reduce_join(
+          tf.as_string(norm_emb), axis=-1, separator=',')
+    self._prediction_dict['float_emb'] = tower_emb
+    self._prediction_dict['embedding'] = tf.reduce_join(
+        tf.as_string(tower_emb), axis=-1, separator=',')
+    if self.sample_id is not None and self.sample_id in self._feature_dict:
+      self._prediction_dict['sample_id'] = tf.identity(
+          self._feature_dict[self.sample_id])
+    return self._prediction_dict
+  def build_loss_graph(self):
+    emb = self._prediction_dict['float_emb']
+    emb_normed = self._model_config.output_l2_normalized_emb
+    norm_emb = self._prediction_dict['norm_emb'] if emb_normed else emb
+    if self._loss_type == LossType.CIRCLE_LOSS:
+      self._loss_dict['circle_loss'] = circle_loss(
+          norm_emb,
+          self.labels,
+          self.session_ids,
+          self.loss.margin,
+          self.loss.gamma,
+          embed_normed=emb_normed)
+    elif self._loss_type == LossType.MULTI_SIMILARITY_LOSS:
+      self._loss_dict['ms_loss'] = ms_loss(
+          norm_emb,
+          self.labels,
+          self.session_ids,
+          self.loss.alpha,
+          self.loss.beta,
+          self.loss.lamb,
+          self.loss.eps,
+          embed_normed=emb_normed)
+    else:
+      raise ValueError('invalid loss type: %s' % LossType.Name(self._loss_type))
+    return self._loss_dict
+  def get_outputs(self):
+    outputs = ['embedding', 'float_emb']
+    if self.sample_id is not None and 'sample_id' in self._prediction_dict:
+      outputs.append('sample_id')
+    if self._model_config.output_l2_normalized_emb:
+      outputs.append('norm_embedding')
+      outputs.append('norm_emb')
+    return outputs
+  def build_metric_graph(self, eval_config):
+    metric_dict = {}
+    recall_at_k = []
+    precision_at_k = []
+    for metric in eval_config.metrics_set:
+      if metric.WhichOneof('metric') == 'recall_at_topk':
+        recall_at_k.append(metric.recall_at_topk.topk)
+      elif metric.WhichOneof('metric') == 'precision_at_topk':
+        precision_at_k.append(metric.precision_at_topk.topk)
+    emb = self._prediction_dict['float_emb']
+    if len(recall_at_k) > 0:
+      metric_dict.update(
+          metric_learning_recall_at_k(recall_at_k, emb, self.labels,
+                                      self.session_ids))
+    if len(precision_at_k) > 0:
+      metric_dict.update(
+          metric_learning_average_precision_at_k(precision_at_k, emb,
+                                                 self.labels, self.session_ids))
+    return metric_dict

easy_rec/python/model/custom_model.py ADDED Viewed

@@ -0,0 +1,323 @@
+# easy_rec/python/model/custom_model.py
+import os
+import sys
+import six
+import tensorflow as tf
+from easy_rec.python.builders import loss_builder
+from easy_rec.python.compat import regularizers
+from easy_rec.python.feature_column.feature_column import FeatureColumnParser
+from easy_rec.python.model.easy_rec_model import EasyRecModel
+from easy_rec.python.protos.deepfm_pb2 import DeepFM as DeepFMConfig
+# from easy_rec.python.protos.easy_rec_model_pb2 import LossType
+from easy_rec.python.protos.loss_pb2 import LossType
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+class MultiHeadAttention(tf.compat.v1.keras.layers.Layer):
+  def __init__(self, num_heads, d_model):
+    super(MultiHeadAttention, self).__init__()
+    self.num_heads = num_heads
+    self.d_model = d_model
+    assert d_model % num_heads == 0
+    self.depth = d_model // num_heads
+    self.wq = tf.compat.v1.keras.layers.Dense(d_model)
+    self.wk = tf.compat.v1.keras.layers.Dense(d_model)
+    self.wv = tf.compat.v1.keras.layers.Dense(d_model)
+    self.dense = tf.compat.v1.keras.layers.Dense(d_model)
+  def split_heads(self, x, batch_size):
+    x = tf.reshape(x, (batch_size, 15, self.num_heads, self.depth))
+    return tf.transpose(x, perm=[0, 2, 1, 3])
+  def __call__(self, q, k, v, mask):
+    batch_size = tf.shape(q)[0]
+    q = self.wq(q)
+    k = self.wk(k)
+    v = self.wv(v)
+    q = self.split_heads(q, batch_size)
+    k = self.split_heads(k, batch_size)
+    v = self.split_heads(v, batch_size)
+    scaled_attention, attention_weights = self.scaled_dot_product_attention(
+        q, k, v, mask)
+    scaled_attention = tf.transpose(scaled_attention, perm=[0, 2, 1, 3])
+    concat_attention = tf.reshape(scaled_attention,
+                                  (batch_size, 15, self.d_model))
+    output = self.dense(concat_attention)
+    return output, attention_weights
+  def scaled_dot_product_attention(self, q, k, v, mask):
+    matmul_qk = tf.matmul(q, k, transpose_b=True)
+    dk = tf.cast(tf.shape(k)[-1], tf.float32)
+    scaled_attention_logits = matmul_qk / tf.math.sqrt(dk)
+    if mask is not None:
+      scaled_attention_logits += (mask * -1e9)
+    attention_weights = tf.nn.softmax(scaled_attention_logits, axis=-1)
+    output = tf.matmul(attention_weights, v)
+    return output, attention_weights
+class CustomModel(EasyRecModel):
+  def __init__(self,
+               model_config,
+               feature_configs,
+               features,
+               labels=None,
+               is_training=False):
+    """Build the input tensors of the model and assemble `self.deep_input`.
+
+    Args:
+      model_config: easy_rec.python.protos.easy_rec_model_pb2.EasyRecModel
+           model_config.custom_model is instance of:
+                 easy_rec.python.protos.easy_rec_model_pb2.CustomModel
+      feature_configs: a collection of easy_rec.python.protos.feature_config.FeatureConfig
+      features: dict of feature tensors, which are described by easy_rec.python.protos.DatasetConfig.input_fields
+      labels: dict of labels tensors, which are described by easy_rec.python.protos.DatasetConfig.label_fields
+      is_training: forwarded unchanged to EasyRecModel.__init__.
+    """
+    super(CustomModel, self).__init__(model_config, feature_configs, features,
+                                      labels, is_training)
+    # Rate passed to every Dropout layer of this model; a value of 0 makes
+    # build_predict_graph / get_layer_n skip the Dropout layers entirely.
+    self.drop_out_rate = 0.05
+    # Feature group 'raw_feature': the default _input_layer call yields two
+    # values here. NOTE(review): presumably the combined tensor and the
+    # per-feature list - confirm against EasyRecModel._input_layer.
+    self._raw_features, self._raw_feature_lst = self._input_layer(
+        self._feature_dict, 'raw_feature')
+    # With is_combine=False three values come back; only the first is kept.
+    # Each entry of it is later indexed with [0] by _get_seq_features_reduce.
+    self._seq_features, _, _ = self._input_layer(
+        self._feature_dict, 'seq_feature', is_combine=False)
+    self._multi_head_1_features, _, _ = self._input_layer(
+        self._feature_dict, 'multi_head_feature_1', is_combine=False)
+    self._multi_head_2_features, _, _ = self._input_layer(
+        self._feature_dict, 'multi_head_feature_2', is_combine=False)
+    # Sequence features: mean over axis 1 of every feature (axis dropped),
+    # then all of them concatenated along the last axis.
+    self._seq_features_concat = self._get_features_concat(
+        self._get_seq_features_reduce(
+            self._seq_features, reduce_type='mean', axis=1, keepdims=False),
+        axis=-1)
+    # Attention groups: mean over axis 1 but with keepdims=True, so the
+    # reduced features can be concatenated along axis 1 into one sequence
+    # with one position per feature.
+    self._multi_head_1_features_concat = self._get_features_concat(
+        self._get_seq_features_reduce(
+            self._multi_head_1_features,
+            reduce_type='mean',
+            axis=1,
+            keepdims=True),
+        axis=1)
+    self._multi_head_2_features_concat = self._get_features_concat(
+        self._get_seq_features_reduce(
+            self._multi_head_2_features,
+            reduce_type='mean',
+            axis=1,
+            keepdims=True),
+        axis=1)
+    # One attention layer per group: 4 heads, d_model = 12.
+    self._multi_head_1_layer = MultiHeadAttention(4, 12)
+    self._multi_head_2_layer = MultiHeadAttention(4, 12)
+    # Self-attention: the same tensor serves as q, k and v, without a mask.
+    # The returned attention weights are discarded.
+    self._multi_head_1_output, _ = self._multi_head_1_layer(
+        self._multi_head_1_features_concat, self._multi_head_1_features_concat,
+        self._multi_head_1_features_concat, None)
+    self._multi_head_2_output, _ = self._multi_head_2_layer(
+        self._multi_head_2_features_concat, self._multi_head_2_features_concat,
+        self._multi_head_2_features_concat, None)
+    # Average each attention output over axis 1 (axis dropped).
+    self._multi_head_1_output_end = self._get_seq_feature_reduce(
+        self._multi_head_1_output, reduce_type='mean', axis=1, keepdims=False)
+    self._multi_head_2_output_end = self._get_seq_feature_reduce(
+        self._multi_head_2_output, reduce_type='mean', axis=1, keepdims=False)
+    # Input of the DNN built in build_predict_graph: raw features, pooled
+    # sequence features and both pooled attention outputs, joined on the
+    # last axis.
+    self.deep_input = self._get_features_concat([
+        self._raw_features, self._seq_features_concat,
+        self._multi_head_1_output_end, self._multi_head_2_output_end
+    ],
+                                                axis=-1)
+  def _get_seq_features_reduce(self, seq_features, reduce_type, axis: int,
+                               keepdims: bool):
+    assert reduce_type in ['mean', 'sum',
+                           'max'], 'reduce_type  must in mean | sum | max'
+    assert axis in [-1, 1, 2], 'axis  must in -1 | 1 | 2'
+    seq_features_reduce = []
+    for feature in seq_features:
+      if reduce_type == 'mean':
+        seq_features_reduce.append(
+            tf.reduce_mean(feature[0], axis=axis, keepdims=keepdims))
+      elif reduce_type == 'sum':
+        seq_features_reduce.append(
+            tf.reduce_sum(feature[0], axis=axis, keepdims=keepdims))
+      elif reduce_type == 'max':
+        seq_features_reduce.append(
+            tf.reduce_max(feature[0], axis=axis, keepdims=keepdims))
+      else:
+        pass
+    return seq_features_reduce
+  def _get_seq_feature_reduce(self, seq_feature, reduce_type, axis: int,
+                              keepdims: bool):
+    assert reduce_type in ['mean', 'sum',
+                           'max'], 'reduce_type  must in mean | sum | max'
+    assert axis in [-1, 1, 2], 'axis  must in -1 | 1 | 2'
+    if reduce_type == 'mean':
+      return tf.reduce_mean(seq_feature, axis=axis, keepdims=keepdims)
+    elif reduce_type == 'sum':
+      return tf.reduce_sum(seq_feature, axis=axis, keepdims=keepdims)
+    elif reduce_type == 'max':
+      return tf.reduce_max(seq_feature, axis=axis, keepdims=keepdims)
+    else:
+      pass
+  def _get_features_concat(self, features, axis):
+    assert axis in [-1, 1, 2], 'axis  must in -1 | 1 | 2'
+    return tf.concat(features, axis=axis)
+  def build_predict_graph(self):
+    # build forward graph
+    dnn_1_list = self.get_layer_1(
+        self.deep_input, '1:64', prefix='dnn_1_1', n=1)
+    dnn_1_2_list = self.get_layer_n(
+        dnn_1_list, '1:32', prefix='dnn_1_2', branch_num=2)
+    dnn_1_3_list = self.get_layer_n(
+        dnn_1_2_list, '1:16', prefix='dnn_1_3', branch_num=2)
+    dnn_1_4_list = self.get_layer_n(
+        dnn_1_3_list, '1:8', prefix='dnn_1_4', branch_num=2)
+    dnn_1_5_list = self.get_layer_n(
+        dnn_1_4_list, '1:4', prefix='dnn_1_5', branch_num=2)
+    dnn_1_concat = tf.concat(dnn_1_5_list, axis=-1, name='dnn_1_concat')
+    dnn_2_1 = tf.keras.layers.Dense(
+        units=32, activation='relu', name=f'dnn_layer_2_1')(
+            dnn_1_concat)
+    if self.drop_out_rate == 0:
+      dnn_2_1_dropout = dnn_2_1
+    else:
+      dnn_2_1_dropout = tf.keras.layers.Dropout(
+          self.drop_out_rate, noise_shape=None, seed=None)(
+              dnn_2_1)
+    dnn_2_2 = tf.keras.layers.Dense(
+        units=16, activation='relu', name=f'dnn_layer_2_2')(
+            dnn_2_1_dropout)
+    if self.drop_out_rate == 0:
+      dnn_2_2_dropout = dnn_2_2
+    else:
+      dnn_2_2_dropout = tf.keras.layers.Dropout(
+          self.drop_out_rate, noise_shape=None, seed=None)(
+              dnn_2_2)
+    dnn_2_3 = tf.keras.layers.Dense(
+        units=8, activation='relu', name=f'dnn_layer_2_3')(
+            dnn_2_2_dropout)
+    if self.drop_out_rate == 0:
+      dnn_2_3_dropout = dnn_2_3
+    else:
+      dnn_2_3_dropout = tf.keras.layers.Dropout(
+          self.drop_out_rate, noise_shape=None, seed=None)(
+              dnn_2_3)
+    dnn_1_sig = tf.keras.layers.Dense(
+        units=1, activation='sigmoid', name='dnn_1_sig')(
+            dnn_2_3_dropout)
+    self._prediction_dict['label'] = dnn_1_sig
+    return self._prediction_dict
+  def build_loss_graph(self):
+    # assert self._model_config.loss_type == LossType.CLASSIFICATION
+    loss = tf.keras.losses.BinaryFocalCrossentropy(gamma=2, from_logits=False)
+    label = list(self._labels.values())[0]
+    self._loss_dict['custom_loss'] = loss(label, self._prediction_dict['label'])
+    return self._loss_dict
+  def build_metric_graph(self, eval_config):
+    metric_dict = {}
+    num_thresholds = eval_config.metrics_set[0].auc.num_thresholds
+    metric_dict['auc'] = tf.metrics.auc(
+        list(self._labels.values())[0],
+        self._prediction_dict['label'],
+        num_thresholds=num_thresholds)
+    return metric_dict
+  def get_outputs(self):
+    return ['label']
+  def get_layer_1(self, input, dnn_layers, prefix, n=2):
+    output_list = []
+    dnn_layers_list = dnn_layers.split(',')
+    for i in range(n):
+      for j in range(len(dnn_layers_list)):
+        dnn_info_list = dnn_layers_list[j].split(':')
+        if j == 0:
+          deep_layer = tf.keras.layers.Dense(
+              units=int(dnn_info_list[1]),
+              activation='relu'
+              # , kernel_regularizer=tf.keras.regularizers.l1_l2(l1=0.01, l2=0.01)
+              ,
+              name=f'dnn_layer_{prefix}_{i}_{j}')(
+                  input)
+        else:
+          deep_layer = tf.keras.layers.Dense(
+              units=int(dnn_info_list[1]),
+              activation='relu'
+              # , kernel_regularizer=tf.keras.regularizers.l1_l2(l1=0.01, l2=0.01)
+              ,
+              name=f'dnn_layer_{prefix}_{i}_{j}')(
+                  deep_layer)
+      output_list.append(deep_layer)
+    return output_list
+  def get_layer_n(self, layer_output_list, dnn_layers, prefix, branch_num=2):
+    output_list = []
+    dnn_layers_list = dnn_layers.split(',')
+    for branch in range(branch_num):
+      for i in range(len(layer_output_list)):
+        for j in range(len(dnn_layers_list)):
+          dnn_info_list = dnn_layers_list[j].split(':')
+          if j == 0:
+            deep_layer = tf.keras.layers.Dense(
+                units=int(dnn_info_list[1]),
+                activation='relu'
+                # , kernel_regularizer=tf.keras.regularizers.l1_l2(l1=0.01, l2=0.01)
+                ,
+                name=f'dnn_layer_{prefix}_{branch}_{i}_{j}')(
+                    layer_output_list[i])
+          else:
+            deep_layer = tf.keras.layers.Dense(
+                units=int(dnn_info_list[1]),
+                activation='relu'
+                # , kernel_regularizer=tf.keras.regularizers.l1_l2(l1=0.01, l2=0.01)
+                ,
+                name=f'dnn_layer_{prefix}_{branch}_{i}_{j}')(
+                    deep_layer)
+        # deep_layer_end = tf.concat([deep_layer,bundle_info_sum],axis=-1)
+        if self.drop_out_rate == 0:
+          deep_layer_dropout = deep_layer
+        else:
+          deep_layer_dropout = tf.keras.layers.Dropout(
+              self.drop_out_rate, noise_shape=None, seed=None)(
+                  deep_layer)
+        output_list.append(deep_layer_dropout)
+    return output_list