PyPI - easy-cs-rec-custommodel - Versions diffs - 0.8.6__py2.py3-none-any.whl - Mend

easy-cs-rec-custommodel 0.8.6__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of easy-cs-rec-custommodel might be problematic. Click here for more details.

Files changed (336) hide show

easy_cs_rec_custommodel-0.8.6.dist-info/LICENSE +203 -0
easy_cs_rec_custommodel-0.8.6.dist-info/METADATA +48 -0
easy_cs_rec_custommodel-0.8.6.dist-info/RECORD +336 -0
easy_cs_rec_custommodel-0.8.6.dist-info/WHEEL +6 -0
easy_cs_rec_custommodel-0.8.6.dist-info/top_level.txt +2 -0
easy_rec/__init__.py +114 -0
easy_rec/python/__init__.py +0 -0
easy_rec/python/builders/__init__.py +0 -0
easy_rec/python/builders/hyperparams_builder.py +78 -0
easy_rec/python/builders/loss_builder.py +333 -0
easy_rec/python/builders/optimizer_builder.py +211 -0
easy_rec/python/builders/strategy_builder.py +44 -0
easy_rec/python/compat/__init__.py +0 -0
easy_rec/python/compat/adam_s.py +245 -0
easy_rec/python/compat/array_ops.py +229 -0
easy_rec/python/compat/dynamic_variable.py +542 -0
easy_rec/python/compat/early_stopping.py +653 -0
easy_rec/python/compat/embedding_ops.py +162 -0
easy_rec/python/compat/embedding_parallel_saver.py +316 -0
easy_rec/python/compat/estimator_train.py +116 -0
easy_rec/python/compat/exporter.py +473 -0
easy_rec/python/compat/feature_column/__init__.py +0 -0
easy_rec/python/compat/feature_column/feature_column.py +3675 -0
easy_rec/python/compat/feature_column/feature_column_v2.py +5233 -0
easy_rec/python/compat/feature_column/sequence_feature_column.py +648 -0
easy_rec/python/compat/feature_column/utils.py +154 -0
easy_rec/python/compat/layers.py +329 -0
easy_rec/python/compat/ops.py +14 -0
easy_rec/python/compat/optimizers.py +619 -0
easy_rec/python/compat/queues.py +311 -0
easy_rec/python/compat/regularizers.py +208 -0
easy_rec/python/compat/sok_optimizer.py +440 -0
easy_rec/python/compat/sync_replicas_optimizer.py +528 -0
easy_rec/python/compat/weight_decay_optimizers.py +475 -0
easy_rec/python/core/__init__.py +0 -0
easy_rec/python/core/easyrec_metrics/__init__.py +24 -0
easy_rec/python/core/easyrec_metrics/distribute_metrics_impl_pai.py +3702 -0
easy_rec/python/core/easyrec_metrics/distribute_metrics_impl_tf.py +3768 -0
easy_rec/python/core/learning_schedules.py +228 -0
easy_rec/python/core/metrics.py +402 -0
easy_rec/python/core/sampler.py +844 -0
easy_rec/python/eval.py +102 -0
easy_rec/python/export.py +150 -0
easy_rec/python/feature_column/__init__.py +0 -0
easy_rec/python/feature_column/feature_column.py +664 -0
easy_rec/python/feature_column/feature_group.py +89 -0
easy_rec/python/hpo/__init__.py +0 -0
easy_rec/python/hpo/emr_hpo.py +140 -0
easy_rec/python/hpo/generate_hpo_sql.py +71 -0
easy_rec/python/hpo/pai_hpo.py +297 -0
easy_rec/python/inference/__init__.py +0 -0
easy_rec/python/inference/csv_predictor.py +189 -0
easy_rec/python/inference/hive_parquet_predictor.py +200 -0
easy_rec/python/inference/hive_predictor.py +166 -0
easy_rec/python/inference/odps_predictor.py +70 -0
easy_rec/python/inference/parquet_predictor.py +147 -0
easy_rec/python/inference/parquet_predictor_v2.py +147 -0
easy_rec/python/inference/predictor.py +621 -0
easy_rec/python/inference/processor/__init__.py +0 -0
easy_rec/python/inference/processor/test.py +170 -0
easy_rec/python/inference/vector_retrieve.py +124 -0
easy_rec/python/input/__init__.py +0 -0
easy_rec/python/input/batch_tfrecord_input.py +117 -0
easy_rec/python/input/criteo_binary_reader.py +259 -0
easy_rec/python/input/criteo_input.py +107 -0
easy_rec/python/input/csv_input.py +175 -0
easy_rec/python/input/csv_input_ex.py +72 -0
easy_rec/python/input/csv_input_v2.py +68 -0
easy_rec/python/input/datahub_input.py +320 -0
easy_rec/python/input/dummy_input.py +58 -0
easy_rec/python/input/hive_input.py +123 -0
easy_rec/python/input/hive_parquet_input.py +140 -0
easy_rec/python/input/hive_rtp_input.py +174 -0
easy_rec/python/input/input.py +1064 -0
easy_rec/python/input/kafka_dataset.py +144 -0
easy_rec/python/input/kafka_input.py +235 -0
easy_rec/python/input/load_parquet.py +317 -0
easy_rec/python/input/odps_input.py +101 -0
easy_rec/python/input/odps_input_v2.py +110 -0
easy_rec/python/input/odps_input_v3.py +132 -0
easy_rec/python/input/odps_rtp_input.py +187 -0
easy_rec/python/input/odps_rtp_input_v2.py +104 -0
easy_rec/python/input/parquet_input.py +397 -0
easy_rec/python/input/parquet_input_v2.py +180 -0
easy_rec/python/input/parquet_input_v3.py +203 -0
easy_rec/python/input/rtp_input.py +225 -0
easy_rec/python/input/rtp_input_v2.py +145 -0
easy_rec/python/input/tfrecord_input.py +100 -0
easy_rec/python/layers/__init__.py +0 -0
easy_rec/python/layers/backbone.py +571 -0
easy_rec/python/layers/capsule_layer.py +176 -0
easy_rec/python/layers/cmbf.py +390 -0
easy_rec/python/layers/common_layers.py +192 -0
easy_rec/python/layers/dnn.py +87 -0
easy_rec/python/layers/embed_input_layer.py +25 -0
easy_rec/python/layers/fm.py +26 -0
easy_rec/python/layers/input_layer.py +396 -0
easy_rec/python/layers/keras/__init__.py +34 -0
easy_rec/python/layers/keras/activation.py +114 -0
easy_rec/python/layers/keras/attention.py +267 -0
easy_rec/python/layers/keras/auxiliary_loss.py +47 -0
easy_rec/python/layers/keras/blocks.py +262 -0
easy_rec/python/layers/keras/bst.py +119 -0
easy_rec/python/layers/keras/custom_ops.py +250 -0
easy_rec/python/layers/keras/data_augment.py +133 -0
easy_rec/python/layers/keras/din.py +67 -0
easy_rec/python/layers/keras/einsum_dense.py +598 -0
easy_rec/python/layers/keras/embedding.py +81 -0
easy_rec/python/layers/keras/fibinet.py +251 -0
easy_rec/python/layers/keras/interaction.py +416 -0
easy_rec/python/layers/keras/layer_norm.py +364 -0
easy_rec/python/layers/keras/mask_net.py +166 -0
easy_rec/python/layers/keras/multi_head_attention.py +717 -0
easy_rec/python/layers/keras/multi_task.py +125 -0
easy_rec/python/layers/keras/numerical_embedding.py +376 -0
easy_rec/python/layers/keras/ppnet.py +194 -0
easy_rec/python/layers/keras/transformer.py +192 -0
easy_rec/python/layers/layer_norm.py +51 -0
easy_rec/python/layers/mmoe.py +83 -0
easy_rec/python/layers/multihead_attention.py +162 -0
easy_rec/python/layers/multihead_cross_attention.py +749 -0
easy_rec/python/layers/senet.py +73 -0
easy_rec/python/layers/seq_input_layer.py +134 -0
easy_rec/python/layers/sequence_feature_layer.py +249 -0
easy_rec/python/layers/uniter.py +301 -0
easy_rec/python/layers/utils.py +248 -0
easy_rec/python/layers/variational_dropout_layer.py +130 -0
easy_rec/python/loss/__init__.py +0 -0
easy_rec/python/loss/circle_loss.py +82 -0
easy_rec/python/loss/contrastive_loss.py +79 -0
easy_rec/python/loss/f1_reweight_loss.py +38 -0
easy_rec/python/loss/focal_loss.py +93 -0
easy_rec/python/loss/jrc_loss.py +128 -0
easy_rec/python/loss/listwise_loss.py +161 -0
easy_rec/python/loss/multi_similarity.py +68 -0
easy_rec/python/loss/pairwise_loss.py +307 -0
easy_rec/python/loss/softmax_loss_with_negative_mining.py +110 -0
easy_rec/python/loss/zero_inflated_lognormal.py +76 -0
easy_rec/python/main.py +878 -0
easy_rec/python/model/__init__.py +0 -0
easy_rec/python/model/autoint.py +73 -0
easy_rec/python/model/cmbf.py +47 -0
easy_rec/python/model/collaborative_metric_learning.py +182 -0
easy_rec/python/model/custom_model.py +323 -0
easy_rec/python/model/dat.py +138 -0
easy_rec/python/model/dbmtl.py +116 -0
easy_rec/python/model/dcn.py +70 -0
easy_rec/python/model/deepfm.py +106 -0
easy_rec/python/model/dlrm.py +73 -0
easy_rec/python/model/dropoutnet.py +207 -0
easy_rec/python/model/dssm.py +154 -0
easy_rec/python/model/dssm_senet.py +143 -0
easy_rec/python/model/dummy_model.py +48 -0
easy_rec/python/model/easy_rec_estimator.py +739 -0
easy_rec/python/model/easy_rec_model.py +467 -0
easy_rec/python/model/esmm.py +242 -0
easy_rec/python/model/fm.py +63 -0
easy_rec/python/model/match_model.py +357 -0
easy_rec/python/model/mind.py +445 -0
easy_rec/python/model/mmoe.py +70 -0
easy_rec/python/model/multi_task_model.py +303 -0
easy_rec/python/model/multi_tower.py +62 -0
easy_rec/python/model/multi_tower_bst.py +190 -0
easy_rec/python/model/multi_tower_din.py +130 -0
easy_rec/python/model/multi_tower_recall.py +68 -0
easy_rec/python/model/pdn.py +203 -0
easy_rec/python/model/ple.py +120 -0
easy_rec/python/model/rank_model.py +485 -0
easy_rec/python/model/rocket_launching.py +203 -0
easy_rec/python/model/simple_multi_task.py +54 -0
easy_rec/python/model/uniter.py +46 -0
easy_rec/python/model/wide_and_deep.py +121 -0
easy_rec/python/ops/1.12/incr_record.so +0 -0
easy_rec/python/ops/1.12/kafka.so +0 -0
easy_rec/python/ops/1.12/libcustom_ops.so +0 -0
easy_rec/python/ops/1.12/libembed_op.so +0 -0
easy_rec/python/ops/1.12/libhiredis.so.1.0.0 +0 -0
easy_rec/python/ops/1.12/librdkafka++.so.1 +0 -0
easy_rec/python/ops/1.12/librdkafka.so.1 +0 -0
easy_rec/python/ops/1.12/libredis++.so +0 -0
easy_rec/python/ops/1.12/libredis++.so.1 +0 -0
easy_rec/python/ops/1.12/libredis++.so.1.2.3 +0 -0
easy_rec/python/ops/1.12/libstr_avx_op.so +0 -0
easy_rec/python/ops/1.12/libwrite_sparse_kv.so +0 -0
easy_rec/python/ops/1.15/incr_record.so +0 -0
easy_rec/python/ops/1.15/kafka.so +0 -0
easy_rec/python/ops/1.15/libcustom_ops.so +0 -0
easy_rec/python/ops/1.15/libembed_op.so +0 -0
easy_rec/python/ops/1.15/libhiredis.so.1.0.0 +0 -0
easy_rec/python/ops/1.15/librdkafka++.so +0 -0
easy_rec/python/ops/1.15/librdkafka++.so.1 +0 -0
easy_rec/python/ops/1.15/librdkafka.so +0 -0
easy_rec/python/ops/1.15/librdkafka.so.1 +0 -0
easy_rec/python/ops/1.15/libredis++.so.1 +0 -0
easy_rec/python/ops/1.15/libstr_avx_op.so +0 -0
easy_rec/python/ops/2.12/libcustom_ops.so +0 -0
easy_rec/python/ops/2.12/libload_embed.so +0 -0
easy_rec/python/ops/2.12/libstr_avx_op.so +0 -0
easy_rec/python/ops/__init__.py +0 -0
easy_rec/python/ops/gen_kafka_ops.py +193 -0
easy_rec/python/ops/gen_str_avx_op.py +28 -0
easy_rec/python/ops/incr_record.py +30 -0
easy_rec/python/predict.py +170 -0
easy_rec/python/protos/__init__.py +0 -0
easy_rec/python/protos/autoint_pb2.py +122 -0
easy_rec/python/protos/backbone_pb2.py +1416 -0
easy_rec/python/protos/cmbf_pb2.py +435 -0
easy_rec/python/protos/collaborative_metric_learning_pb2.py +252 -0
easy_rec/python/protos/custom_model_pb2.py +57 -0
easy_rec/python/protos/dat_pb2.py +262 -0
easy_rec/python/protos/data_source_pb2.py +422 -0
easy_rec/python/protos/dataset_pb2.py +1920 -0
easy_rec/python/protos/dbmtl_pb2.py +191 -0
easy_rec/python/protos/dcn_pb2.py +197 -0
easy_rec/python/protos/deepfm_pb2.py +163 -0
easy_rec/python/protos/dlrm_pb2.py +163 -0
easy_rec/python/protos/dnn_pb2.py +329 -0
easy_rec/python/protos/dropoutnet_pb2.py +239 -0
easy_rec/python/protos/dssm_pb2.py +262 -0
easy_rec/python/protos/dssm_senet_pb2.py +282 -0
easy_rec/python/protos/easy_rec_model_pb2.py +1672 -0
easy_rec/python/protos/esmm_pb2.py +133 -0
easy_rec/python/protos/eval_pb2.py +930 -0
easy_rec/python/protos/export_pb2.py +379 -0
easy_rec/python/protos/feature_config_pb2.py +1359 -0
easy_rec/python/protos/fm_pb2.py +90 -0
easy_rec/python/protos/hive_config_pb2.py +138 -0
easy_rec/python/protos/hyperparams_pb2.py +624 -0
easy_rec/python/protos/keras_layer_pb2.py +692 -0
easy_rec/python/protos/layer_pb2.py +1936 -0
easy_rec/python/protos/loss_pb2.py +1713 -0
easy_rec/python/protos/mind_pb2.py +497 -0
easy_rec/python/protos/mmoe_pb2.py +215 -0
easy_rec/python/protos/multi_tower_pb2.py +295 -0
easy_rec/python/protos/multi_tower_recall_pb2.py +198 -0
easy_rec/python/protos/optimizer_pb2.py +2017 -0
easy_rec/python/protos/pdn_pb2.py +293 -0
easy_rec/python/protos/pipeline_pb2.py +516 -0
easy_rec/python/protos/ple_pb2.py +231 -0
easy_rec/python/protos/predict_pb2.py +1140 -0
easy_rec/python/protos/rocket_launching_pb2.py +169 -0
easy_rec/python/protos/seq_encoder_pb2.py +1084 -0
easy_rec/python/protos/simi_pb2.py +54 -0
easy_rec/python/protos/simple_multi_task_pb2.py +97 -0
easy_rec/python/protos/tf_predict_pb2.py +630 -0
easy_rec/python/protos/tower_pb2.py +661 -0
easy_rec/python/protos/train_pb2.py +1197 -0
easy_rec/python/protos/uniter_pb2.py +307 -0
easy_rec/python/protos/variational_dropout_pb2.py +91 -0
easy_rec/python/protos/wide_and_deep_pb2.py +131 -0
easy_rec/python/test/__init__.py +0 -0
easy_rec/python/test/csv_input_test.py +340 -0
easy_rec/python/test/custom_early_stop_func.py +19 -0
easy_rec/python/test/dh_local_run.py +104 -0
easy_rec/python/test/embed_test.py +155 -0
easy_rec/python/test/emr_run.py +119 -0
easy_rec/python/test/eval_metric_test.py +107 -0
easy_rec/python/test/excel_convert_test.py +64 -0
easy_rec/python/test/export_test.py +513 -0
easy_rec/python/test/fg_test.py +70 -0
easy_rec/python/test/hive_input_test.py +311 -0
easy_rec/python/test/hpo_test.py +235 -0
easy_rec/python/test/kafka_test.py +373 -0
easy_rec/python/test/local_incr_test.py +122 -0
easy_rec/python/test/loss_test.py +110 -0
easy_rec/python/test/odps_command.py +61 -0
easy_rec/python/test/odps_local_run.py +86 -0
easy_rec/python/test/odps_run.py +254 -0
easy_rec/python/test/odps_test_cls.py +39 -0
easy_rec/python/test/odps_test_prepare.py +198 -0
easy_rec/python/test/odps_test_util.py +237 -0
easy_rec/python/test/pre_check_test.py +54 -0
easy_rec/python/test/predictor_test.py +394 -0
easy_rec/python/test/rtp_convert_test.py +133 -0
easy_rec/python/test/run.py +138 -0
easy_rec/python/test/train_eval_test.py +1299 -0
easy_rec/python/test/util_test.py +85 -0
easy_rec/python/test/zero_inflated_lognormal_test.py +53 -0
easy_rec/python/tools/__init__.py +0 -0
easy_rec/python/tools/add_boundaries_to_config.py +67 -0
easy_rec/python/tools/add_feature_info_to_config.py +145 -0
easy_rec/python/tools/convert_config_format.py +48 -0
easy_rec/python/tools/convert_rtp_data.py +79 -0
easy_rec/python/tools/convert_rtp_fg.py +106 -0
easy_rec/python/tools/create_config_from_excel.py +427 -0
easy_rec/python/tools/criteo/__init__.py +0 -0
easy_rec/python/tools/criteo/convert_data.py +157 -0
easy_rec/python/tools/edit_lookup_graph.py +134 -0
easy_rec/python/tools/faiss_index_pai.py +116 -0
easy_rec/python/tools/feature_selection.py +316 -0
easy_rec/python/tools/hit_rate_ds.py +223 -0
easy_rec/python/tools/hit_rate_pai.py +138 -0
easy_rec/python/tools/pre_check.py +120 -0
easy_rec/python/tools/predict_and_chk.py +111 -0
easy_rec/python/tools/read_kafka.py +55 -0
easy_rec/python/tools/split_model_pai.py +286 -0
easy_rec/python/tools/split_pdn_model_pai.py +272 -0
easy_rec/python/tools/test_saved_model.py +80 -0
easy_rec/python/tools/view_saved_model.py +39 -0
easy_rec/python/tools/write_kafka.py +65 -0
easy_rec/python/train_eval.py +325 -0
easy_rec/python/utils/__init__.py +15 -0
easy_rec/python/utils/activation.py +120 -0
easy_rec/python/utils/check_utils.py +87 -0
easy_rec/python/utils/compat.py +14 -0
easy_rec/python/utils/config_util.py +652 -0
easy_rec/python/utils/constant.py +43 -0
easy_rec/python/utils/convert_rtp_fg.py +616 -0
easy_rec/python/utils/dag.py +192 -0
easy_rec/python/utils/distribution_utils.py +268 -0
easy_rec/python/utils/ds_util.py +65 -0
easy_rec/python/utils/embedding_utils.py +73 -0
easy_rec/python/utils/estimator_utils.py +1036 -0
easy_rec/python/utils/export_big_model.py +630 -0
easy_rec/python/utils/expr_util.py +118 -0
easy_rec/python/utils/fg_util.py +53 -0
easy_rec/python/utils/hit_rate_utils.py +220 -0
easy_rec/python/utils/hive_utils.py +183 -0
easy_rec/python/utils/hpo_util.py +137 -0
easy_rec/python/utils/hvd_utils.py +56 -0
easy_rec/python/utils/input_utils.py +108 -0
easy_rec/python/utils/io_util.py +282 -0
easy_rec/python/utils/load_class.py +249 -0
easy_rec/python/utils/meta_graph_editor.py +941 -0
easy_rec/python/utils/multi_optimizer.py +62 -0
easy_rec/python/utils/numpy_utils.py +18 -0
easy_rec/python/utils/odps_util.py +79 -0
easy_rec/python/utils/pai_util.py +86 -0
easy_rec/python/utils/proto_util.py +90 -0
easy_rec/python/utils/restore_filter.py +89 -0
easy_rec/python/utils/shape_utils.py +432 -0
easy_rec/python/utils/static_shape.py +71 -0
easy_rec/python/utils/test_utils.py +866 -0
easy_rec/python/utils/tf_utils.py +56 -0
easy_rec/version.py +4 -0
test/__init__.py +0 -0

easy_rec/python/utils/hpo_util.py ADDED Viewed

@@ -0,0 +1,137 @@
+# -*- encoding:utf-8 -*-
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import json
+import logging
+import os
+import psutil
+import tensorflow as tf
+from tensorflow.python.summary import summary_iterator
+if tf.__version__ >= '2.0':
+  gfile = tf.compat.v1.gfile
+else:
+  gfile = tf.gfile
+def get_all_eval_result(event_file_pattern):
+  """Get the best eval result from event files.
+  Args:
+    event_files: Absolute pattern of event files.
+  Returns:
+    The best eval result.
+  """
+  all_eval_result = []
+  for event_file in gfile.Glob(os.path.join(event_file_pattern)):
+    for event in summary_iterator.summary_iterator(event_file):
+      if event.HasField('summary'):
+        event_eval_result = {}
+        event_eval_result['global_step'] = event.step
+        for value in event.summary.value:
+          if value.HasField('simple_value'):
+            event_eval_result[value.tag] = value.simple_value
+        if len(event_eval_result) >= 2:
+          all_eval_result.append(event_eval_result)
+  return all_eval_result
+def save_eval_metrics(model_dir, metric_save_path, has_evaluator=True):
+  """Save evaluation metrics.
+  Args:
+    model_dir: train model directory
+    metric_save_path: metric saving path
+    has_evaluator: evaluation is done on a separate evaluator, not on master.
+  """
+  def _get_eval_event_file_pattern():
+    eval_dir = os.path.join(model_dir, 'eval_val/')
+    if not gfile.Exists(eval_dir):
+      eval_dir = os.path.join(model_dir, 'eval/')
+      assert gfile.Exists(eval_dir), 'eval_val or eval does exists'
+    event_file_pattern = os.path.join(eval_dir, '*.tfevents.*')
+    logging.info('event_file_pattern: %s' % event_file_pattern)
+    return event_file_pattern
+  all_eval_res = []
+  if 'TF_CONFIG' in os.environ:
+    # check whether evaluator exists
+    tf_config = json.loads(os.environ['TF_CONFIG'])
+    logging.info('tf_config = %s' % json.dumps(tf_config))
+    logging.info('model_dir = %s' % model_dir)
+    if has_evaluator:
+      if tf_config['task']['type'] == 'evaluator':
+        event_file_pattern = _get_eval_event_file_pattern()
+        all_eval_res = get_all_eval_result(event_file_pattern)
+    elif 'master' in tf_config['cluster'] or 'chief' in tf_config['cluster']:
+      if tf_config['task']['type'] in ['master', 'chief']:
+        event_file_pattern = _get_eval_event_file_pattern()
+        all_eval_res = get_all_eval_result(event_file_pattern)
+    else:
+      assert False, 'invalid cluster config, could not find master or chief or evaluator'
+  else:
+    # standalone mode
+    event_file_pattern = _get_eval_event_file_pattern()
+    all_eval_res = get_all_eval_result(event_file_pattern)
+  logging.info('all_eval_res num = %d' % len(all_eval_res))
+  if len(all_eval_res) > 0:
+    with gfile.GFile(metric_save_path, 'w') as fout:
+      for eval_res in all_eval_res:
+        fout.write(json.dumps(eval_res) + '\n')
+    logging.info('save all evaluation result to %s' % metric_save_path)
+def kill_old_proc(tmp_dir, platform='pai'):
+  curr_pid = os.getpid()
+  if platform == 'pai':
+    for p in psutil.process_iter():
+      try:
+        cmd = ' '.join(p.cmdline())
+        if 'easy_rec.python.hpo.pai_hpo' in cmd and 'python' in cmd:
+          if p.pid != curr_pid:
+            logging.info('will kill: [%d] %s' % (p.pid, cmd))
+            p.terminate()
+        if 'client/experiment_main.py' in cmd and 'python' in cmd:
+          if p.pid != curr_pid:
+            logging.info('will kill: [%d] %s' % (p.pid, cmd))
+            p.terminate()
+      except Exception:
+        pass
+  else:
+    for p in psutil.process_iter():
+      try:
+        cmd = ' '.join(p.cmdline())
+        if 'easy_rec.python.hpo.emr_hpo' in cmd and 'python' in cmd:
+          if p.pid != curr_pid:
+            logging.info('will kill: [%d] %s' % (p.pid, cmd))
+            p.terminate()
+        if 'client/experiment_main.py' in cmd and 'python' in cmd:
+          if p.pid != curr_pid:
+            logging.info('will kill: [%d] %s' % (p.pid, cmd))
+            p.terminate()
+        if 'el_submit' in cmd and 'easy_rec_hpo' in cmd:
+          if p.pid != curr_pid:
+            logging.info('will kill: [%d] %s' % (p.pid, cmd))
+            p.terminate()
+      except Exception:
+        pass
+  if platform == 'emr':
+    # clear easy_rec_hpo yarn jobs
+    yarn_job_file = os.path.join(tmp_dir, 'yarn_job.txt')
+    os.system(
+        "yarn application -list | awk '{ if ($2 == \"easy_rec_hpo\") print $1 }' > %s"
+        % yarn_job_file)
+    yarn_job_arr = []
+    with open(yarn_job_file, 'r') as fin:
+      for line_str in fin:
+        line_str = line_str.strip()
+        yarn_job_arr.append(line_str)
+    yarn_job_arr = list(set(yarn_job_arr))
+    if len(yarn_job_arr) > 0:
+      logging.info('will kill the easy_rec_hpo yarn jobs: %s' %
+                   ','.join(yarn_job_arr))
+      os.system('yarn application -kill %s' % ' '.join(yarn_job_arr))

easy_rec/python/utils/hvd_utils.py ADDED Viewed

@@ -0,0 +1,56 @@
+# -*- encoding: utf-8 -*-
+import logging
+import tensorflow as tf
+from tensorflow.python.framework import ops
+from tensorflow.python.training import session_run_hook
+from easy_rec.python.utils import constant
+# from horovod.tensorflow.compression import Compression
+try:
+  from horovod.tensorflow.functions import broadcast_variables
+except Exception:
+  pass
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+class BroadcastGlobalVariablesHook(session_run_hook.SessionRunHook):
+  """SessionRunHook that will broadcast all global variables from root rank to all other processes during initialization.
+  This is necessary to ensure consistent initialization of all workers when
+  training is started with random weights or restored from a checkpoint.
+  """  # noqa: E501
+  def __init__(self, root_rank, device=''):
+    """Construct a new BroadcastGlobalVariablesHook that will broadcast all global variables from root rank to all other processes during initialization.
+    Args:
+      root_rank:
+        Rank that will send data, other ranks will receive data.
+      device:
+        Device to be used for broadcasting. Uses GPU by default
+        if Horovod was built with HOROVOD_GPU_OPERATIONS.
+    """  # noqa: E501
+    super(BroadcastGlobalVariablesHook, self).__init__()
+    self.root_rank = root_rank
+    self.bcast_op = None
+    self.device = device
+  def begin(self):
+    bcast_vars = []
+    embed_para_vars = ops.get_collection(constant.EmbeddingParallel)
+    for x in tf.global_variables():
+      # if '/embedding' not in x.name and 'DynamicVariable' not in str(type(x)):
+      if x.name not in embed_para_vars:
+        bcast_vars.append(x)
+        logging.info('will broadcast variable: name=%s shape=%s' %
+                     (x.name, x.get_shape()))
+    if not self.bcast_op or self.bcast_op.graph != tf.get_default_graph():
+      with tf.device(self.device):
+        self.bcast_op = broadcast_variables(bcast_vars, self.root_rank)
+  def after_create_session(self, session, coord):
+    session.run(self.bcast_op)

easy_rec/python/utils/input_utils.py ADDED Viewed

@@ -0,0 +1,108 @@
+# -*- encoding:utf-8 -*-
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import numpy as np
+import pandas as pd
+import tensorflow as tf
+from easy_rec.python.protos.dataset_pb2 import DatasetConfig
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+def get_type_defaults(field_type, default_val=''):
+  type_defaults = {
+      DatasetConfig.INT32: 0,
+      DatasetConfig.INT64: 0,
+      DatasetConfig.STRING: '',
+      DatasetConfig.BOOL: False,
+      DatasetConfig.FLOAT: 0.0,
+      DatasetConfig.DOUBLE: 0.0
+  }
+  assert field_type in type_defaults, 'invalid type: %s' % field_type
+  if default_val == '':
+    default_val = type_defaults[field_type]
+  if field_type == DatasetConfig.INT32:
+    return int(default_val)
+  elif field_type == DatasetConfig.INT64:
+    return np.int64(default_val)
+  elif field_type == DatasetConfig.STRING:
+    return default_val
+  elif field_type == DatasetConfig.BOOL:
+    return default_val.lower() == 'true'
+  elif field_type in [DatasetConfig.FLOAT]:
+    return float(default_val)
+  elif field_type in [DatasetConfig.DOUBLE]:
+    return np.float64(default_val)
+  return type_defaults[field_type]
+def string_to_number(field, ftype, default_value, name=''):
+  """Type conversion for parsing rtp fg input format.
+  Args:
+    field: field to be converted.
+    ftype: field dtype set in DatasetConfig.
+    default_value: default value for this field
+    name: field name for
+  Returns: A name for the operation (optional).
+  """
+  default_vals = tf.tile(tf.constant([str(default_value)]), tf.shape(field))
+  field = tf.where(tf.greater(tf.strings.length(field), 0), field, default_vals)
+  if ftype in [DatasetConfig.INT32, DatasetConfig.INT64]:
+    # Int type is not supported in fg.
+    # If you specify INT32, INT64 in DatasetConfig, you need to perform a cast at here.
+    tmp_field = tf.string_to_number(
+        field, tf.double, name='field_as_flt_%s' % name)
+    if ftype in [DatasetConfig.INT64]:
+      tmp_field = tf.cast(tmp_field, tf.int64)
+    else:
+      tmp_field = tf.cast(tmp_field, tf.int32)
+  elif ftype in [DatasetConfig.FLOAT]:
+    tmp_field = tf.string_to_number(
+        field, tf.float32, name='field_as_flt_%s' % name)
+  elif ftype in [DatasetConfig.DOUBLE]:
+    tmp_field = tf.string_to_number(
+        field, tf.float64, name='field_as_flt_%s' % name)
+  elif ftype in [DatasetConfig.BOOL]:
+    tmp_field = tf.logical_or(tf.equal(field, 'True'), tf.equal(field, 'true'))
+  elif ftype in [DatasetConfig.STRING]:
+    tmp_field = field
+  else:
+    assert False, 'invalid types: %s' % str(ftype)
+  return tmp_field
+def np_to_tf_type(np_type):
+  _types_map = {
+      int: tf.int32,
+      np.int32: tf.int32,
+      np.int64: tf.int64,
+      str: tf.string,
+      np.float: tf.float32,
+      np.float32: tf.float32,
+      float: tf.float32,
+      np.double: tf.float64
+  }
+  if np_type in _types_map:
+    return _types_map[np_type]
+  else:
+    return tf.string
+def get_tf_type_from_parquet_file(cols, parquet_file):
+  # gfile not supported, read_parquet requires random access
+  input_data = pd.read_parquet(parquet_file, columns=cols)
+  tf_types = []
+  for col in cols:
+    obj = input_data[col][0]
+    if isinstance(obj, list):
+      data_type = type(obj[0])
+    elif isinstance(obj, np.ndarray):
+      data_type = type(obj[0])
+    else:
+      data_type = type(obj)
+    tf_types.append(np_to_tf_type(data_type))
+  return tf_types

easy_rec/python/utils/io_util.py ADDED Viewed

@@ -0,0 +1,282 @@
+# -*- encoding:utf-8 -*-
+# Copyright (c) Alibaba, Inc. and its affiliates.
+"""IO utils.
+isort:skip_file
+"""
+import logging
+from future import standard_library
+standard_library.install_aliases()
+import os
+import traceback
+from subprocess import getstatusoutput
+import six
+import tensorflow as tf
+from six.moves import http_client
+from six.moves import urllib
+import json
+if six.PY2:
+  from urllib import quote
+else:
+  from urllib.parse import quote
+if tf.__version__ >= '2.0':
+  tf = tf.compat.v1
+EASY_REC_RES_DIR = 'easy_rec_user_resources'
+HTTP_MAX_NUM_RETRY = 5
+HTTP_MAX_TIMEOUT = 600
+def http_read(url, timeout=HTTP_MAX_TIMEOUT, max_retry=HTTP_MAX_NUM_RETRY):
+  """Read data from url with maximum retry.
+  Args:
+    url: http url to be read
+    timeout: specifies a timeout in seconds for blocking operations.
+    max_retry: http max retry times.
+  """
+  num_read_try = 0
+  data = None
+  while num_read_try < max_retry:
+    try:
+      if six.PY2:
+        url = url.encode('utf-8')
+      url = quote(url, safe='%/:?=&')
+      data = urllib.request.urlopen(url, timeout=timeout).read()
+      break
+    except http_client.IncompleteRead:
+      tf.logging.warning('incomplete read exception, will retry: %s' % url)
+      num_read_try += 1
+    except Exception:
+      tf.logging.error(traceback.format_exc())
+      break
+  if data is None:
+    tf.logging.error('http read %s failed' % url)
+  return data
+def download(oss_or_url, dst_dir=''):
+  """Download file.
+  Args:
+    oss_or_url: http or oss path
+    dst_dir: destination directory
+  Return:
+    dst_file: local path for the downloaded file
+  """
+  _, basename = os.path.split(oss_or_url)
+  if oss_or_url[:3] == 'oss':
+    with tf.gfile.GFile(oss_or_url, 'rb') as infile:
+      file_content = infile.read()
+  elif oss_or_url[:4] == 'http':
+    try:
+      response = urllib.request.urlopen(oss_or_url, timeout=HTTP_MAX_TIMEOUT)
+      file_content = response.read()
+    except Exception as e:
+      raise RuntimeError('Download %s failed: %s\n %s' %
+                         (oss_or_url, str(e), traceback.format_exc()))
+  else:
+    tf.logging.warning('skip downloading %s, seems to be a local file' %
+                       oss_or_url)
+    return oss_or_url
+  if dst_dir != '' and not os.path.exists(dst_dir):
+    os.makedirs(dst_dir)
+  dst_file = os.path.join(dst_dir, basename)
+  with tf.gfile.GFile(dst_file, 'wb') as ofile:
+    ofile.write(file_content)
+  return dst_file
+def create_module_dir(dst_dir):
+  if not os.path.exists(dst_dir):
+    os.makedirs(dst_dir)
+    with open(os.path.join(dst_dir, '__init__.py'), 'w') as ofile:
+      ofile.write('\n')
+def download_resource(resource_path, dst_dir=EASY_REC_RES_DIR):
+  """Download user resource.
+  Args:
+    resource_path: http or oss path
+    dst_dir: destination directory
+  """
+  create_module_dir(dst_dir)
+  _, basename = os.path.split(resource_path)
+  if not basename.endswith('.py'):
+    raise ValueError('resource %s should be python file' % resource_path)
+  target = download(resource_path, dst_dir)
+  return target
+def download_and_uncompress_resource(resource_path, dst_dir=EASY_REC_RES_DIR):
+  """Download user resource and uncompress it if necessary.
+  Args:
+    resource_path: http or oss path
+    dst_dir: download destination directory
+  """
+  create_module_dir(dst_dir)
+  _, basename = os.path.split(resource_path)
+  if not basename.endswith('.tar.gz') and not basename.endswith('.zip') and \
+     not basename.endswith('.py'):
+    raise ValueError('resource %s should be tar.gz or zip or py' %
+                     resource_path)
+  download(resource_path, dst_dir)
+  stat = 0
+  if basename.endswith('tar.gz'):
+    stat, output = getstatusoutput('cd %s && tar -zxf %s' % (dst_dir, basename))
+  elif basename.endswith('zip'):
+    stat, output = getstatusoutput('cd %s && unzip %s' % (dst_dir, basename))
+  if stat != 0:
+    raise ValueError('uncompress resoruce %s failed: %s' % resource_path,
+                     output)
+  return dst_dir
+def oss_has_t_mode(target_file):
+  """Test if current enviroment support t-mode written to oss."""
+  if 'PAI' not in tf.__version__:
+    return False
+  # test if running on cluster
+  test_file = target_file + '.tmp'
+  try:
+    with tf.gfile.GFile(test_file, 't') as ofile:
+      ofile.write('a')
+      pass
+    tf.gfile.Remove(test_file)
+    return True
+  except:  # noqa: E722
+    return False
+def fix_oss_dir(path):
+  """Make sure that oss dir endswith /."""
+  if path.startswith('oss://') and not path.endswith('/'):
+    return path + '/'
+  return path
+def save_data_to_json_path(json_path, data):
+  with tf.gfile.GFile(json_path, 'w') as fout:
+    fout.write(json.dumps(data))
+  assert tf.gfile.Exists(json_path), 'in_save_data_to_json_path, save_failed'
+def read_data_from_json_path(json_path):
+  if json_path and tf.gfile.Exists(json_path):
+    with tf.gfile.GFile(json_path, 'r') as fin:
+      data = json.loads(fin.read())
+    return data
+  else:
+    logging.info('json_path not exists, return None')
+    return None
+def convert_tf_flags_to_argparse(flags):
+  """Convert tf.app.flags.FLAGS to argparse.ArgumentParser.
+  Args:
+      flags: tf.app.flags.FLAGS
+  Returns:
+      argparse.ArgumentParser: configurate ArgumentParser object
+  """
+  import argparse
+  import ast
+  parser = argparse.ArgumentParser()
+  args = {}
+  for flag in flags._flags().values():
+    flag_name = flag.name
+    if flag_name in args:
+      args[flag_name][0] = True
+      continue
+    default = flag.value
+    flag_type = type(default)
+    help_str = flag.help or ''
+    args[flag_name] = [
+        False, flag_type, default, help_str,
+        flag.choices if hasattr(flag, 'choices') else None
+    ]
+  def str2bool(v):
+    if isinstance(v, bool):
+      return v
+    if v.lower() in ('yes', 'true', 't', 'y', '1'):
+      return True
+    elif v.lower() in ('no', 'false', 'f', 'n', '0'):
+      return False
+    else:
+      raise argparse.ArgumentTypeError('Boolean value expected.')
+  for flag_name, (multi, flag_type, default, help_str, choices) in args.items():
+    if flag_type == bool:
+      parser.add_argument(
+          '--' + flag_name,
+          type=str2bool,
+          nargs='?',
+          const=True,
+          default=False,
+          help=help_str)
+    elif flag_type == str:
+      if choices:
+        parser.add_argument(
+            '--' + flag_name,
+            type=str,
+            choices=choices,
+            default=default,
+            help=help_str)
+      elif multi:
+        parser.add_argument(
+            '--' + flag_name,
+            type=str,
+            action='append',
+            default=default,
+            help=help_str)
+      else:
+        parser.add_argument(
+            '--' + flag_name, type=str, default=default, help=help_str)
+    elif flag_type in (list, dict):
+      parser.add_argument(
+          '--' + flag_name,
+          type=lambda s: ast.literal_eval(s),
+          default=default,
+          help=help_str)
+    elif flag_type in (int, float):
+      parser.add_argument(
+          '--' + flag_name, type=flag_type, default=default, help=help_str)
+    else:
+      parser.add_argument(
+          '--' + flag_name, type=str, default=default, help=help_str)
+  return parser
+def filter_unknown_args(flags, args):
+  """Filter unknown args."""
+  known_args = [args[0]]
+  parser = convert_tf_flags_to_argparse(flags)
+  args, unknown = parser.parse_known_args(args)
+  if len(unknown) > 1:
+    logging.info('undefined arguments: %s', ', '.join(unknown[1:]))
+  for key, value in vars(args).items():
+    if value is None:
+      continue
+    if type(value) in (list, dict) and not value:
+      continue
+    known_args.append('--' + key + '=' + str(value))
+  logging.info('defined arguments: %s', ', '.join(known_args[1:]))
+  return known_args