upgini 1.2.96a2__tar.gz → 1.2.96a3906.dev1__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (79)
  1. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/PKG-INFO +1 -1
  2. upgini-1.2.96a3906.dev1/src/upgini/__about__.py +1 -0
  3. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/unary.py +8 -0
  4. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/features_enricher.py +2 -12
  5. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/resource_bundle/strings.properties +2 -2
  6. upgini-1.2.96a2/src/upgini/__about__.py +0 -1
  7. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/.gitignore +0 -0
  8. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/LICENSE +0 -0
  9. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/README.md +0 -0
  10. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/pyproject.toml +0 -0
  11. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/__init__.py +0 -0
  12. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/ads.py +0 -0
  13. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/ads_management/__init__.py +0 -0
  14. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/ads_management/ads_manager.py +0 -0
  15. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/__init__.py +0 -0
  16. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/all_operators.py +0 -0
  17. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/binary.py +0 -0
  18. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/date.py +0 -0
  19. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/feature.py +0 -0
  20. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/groupby.py +0 -0
  21. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/operator.py +0 -0
  22. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/__init__.py +0 -0
  23. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/base.py +0 -0
  24. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/cross.py +0 -0
  25. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/delta.py +0 -0
  26. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/lag.py +0 -0
  27. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/roll.py +0 -0
  28. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/trend.py +0 -0
  29. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/timeseries/volatility.py +0 -0
  30. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/utils.py +0 -0
  31. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/autofe/vector.py +0 -0
  32. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/data_source/__init__.py +0 -0
  33. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/data_source/data_source_publisher.py +0 -0
  34. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/dataset.py +0 -0
  35. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/errors.py +0 -0
  36. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/http.py +0 -0
  37. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/mdc/__init__.py +0 -0
  38. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/mdc/context.py +0 -0
  39. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/metadata.py +0 -0
  40. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/metrics.py +0 -0
  41. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/normalizer/__init__.py +0 -0
  42. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/normalizer/normalize_utils.py +0 -0
  43. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/resource_bundle/__init__.py +0 -0
  44. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/resource_bundle/exceptions.py +0 -0
  45. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  46. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/sampler/__init__.py +0 -0
  47. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/sampler/base.py +0 -0
  48. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/sampler/random_under_sampler.py +0 -0
  49. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/sampler/utils.py +0 -0
  50. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/search_task.py +0 -0
  51. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/spinner.py +0 -0
  52. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/Roboto-Regular.ttf +0 -0
  53. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/__init__.py +0 -0
  54. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/base_search_key_detector.py +0 -0
  55. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/blocked_time_series.py +0 -0
  56. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/country_utils.py +0 -0
  57. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/custom_loss_utils.py +0 -0
  58. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/cv_utils.py +0 -0
  59. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/datetime_utils.py +0 -0
  60. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/deduplicate_utils.py +0 -0
  61. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/display_utils.py +0 -0
  62. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/email_utils.py +0 -0
  63. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/fallback_progress_bar.py +0 -0
  64. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/feature_info.py +0 -0
  65. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/features_validator.py +0 -0
  66. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/format.py +0 -0
  67. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/ip_utils.py +0 -0
  68. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/mstats.py +0 -0
  69. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/phone_utils.py +0 -0
  70. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/postal_code_utils.py +0 -0
  71. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/progress_bar.py +0 -0
  72. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/sample_utils.py +0 -0
  73. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/sklearn_ext.py +0 -0
  74. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/sort.py +0 -0
  75. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/target_utils.py +0 -0
  76. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/track_info.py +0 -0
  77. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/ts_utils.py +0 -0
  78. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/utils/warning_counter.py +0 -0
  79. {upgini-1.2.96a2 → upgini-1.2.96a3906.dev1}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.96a2
3
+ Version: 1.2.96a3906.dev1
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.2.96a3906.dev1"
@@ -190,3 +190,11 @@ class Bin(PandasOperator):
190
190
  if isinstance(value, str):
191
191
  return json.loads(value)
192
192
  return value
193
+
194
+
195
+ class Cluster(PandasOperator):
196
+ name: str = "cluster"
197
+ is_unary: bool = True
198
+ input_type: Optional[str] = "vector"
199
+ output_type: Optional[str] = "category"
200
+ is_categorical: bool = True
@@ -1122,7 +1122,6 @@ class FeaturesEnricher(TransformerMixin):
1122
1122
  # and calculate final metric (and uplift)
1123
1123
  enriched_metric = None
1124
1124
  uplift = None
1125
- uplift_perc = None
1126
1125
  enriched_estimator = None
1127
1126
  if set(fitting_X.columns) != set(fitting_enriched_X.columns):
1128
1127
  self.logger.info(
@@ -1154,7 +1153,6 @@ class FeaturesEnricher(TransformerMixin):
1154
1153
  self.logger.info(f"Enriched {metric} on train combined features: {enriched_metric}")
1155
1154
  if baseline_metric is not None and enriched_metric is not None:
1156
1155
  uplift = (enriched_cv_result.metric - baseline_cv_result.metric) * multiplier
1157
- uplift_perc = uplift / abs(baseline_cv_result.metric) * 100
1158
1156
 
1159
1157
  train_metrics = {
1160
1158
  self.bundle.get("quality_metrics_segment_header"): self.bundle.get(
@@ -1181,10 +1179,7 @@ class FeaturesEnricher(TransformerMixin):
1181
1179
  enriched_metric
1182
1180
  )
1183
1181
  if uplift is not None:
1184
- train_metrics[self.bundle.get("quality_metrics_uplift_header")] = round(uplift, 3)
1185
- train_metrics[self.bundle.get("quality_metrics_uplift_perc_header")] = (
1186
- f"{round(uplift_perc, 1)}%"
1187
- )
1182
+ train_metrics[self.bundle.get("quality_metrics_uplift_header")] = uplift
1188
1183
  metrics = [train_metrics]
1189
1184
 
1190
1185
  # 3 If eval_set is presented - fit final model on train enriched data and score each
@@ -1233,10 +1228,8 @@ class FeaturesEnricher(TransformerMixin):
1233
1228
 
1234
1229
  if etalon_eval_metric is not None and enriched_eval_metric is not None:
1235
1230
  eval_uplift = (enriched_eval_results.metric - etalon_eval_results.metric) * multiplier
1236
- eval_uplift_perc = eval_uplift / abs(etalon_eval_results.metric) * 100
1237
1231
  else:
1238
1232
  eval_uplift = None
1239
- eval_uplift_perc = None
1240
1233
 
1241
1234
  eval_metrics = {
1242
1235
  self.bundle.get("quality_metrics_segment_header"): self.bundle.get(
@@ -1267,10 +1260,7 @@ class FeaturesEnricher(TransformerMixin):
1267
1260
  enriched_eval_metric
1268
1261
  )
1269
1262
  if eval_uplift is not None:
1270
- eval_metrics[self.bundle.get("quality_metrics_uplift_header")] = round(eval_uplift, 3)
1271
- eval_metrics[self.bundle.get("quality_metrics_uplift_perc_header")] = (
1272
- f"{round(eval_uplift_perc, 1)}%"
1273
- )
1263
+ eval_metrics[self.bundle.get("quality_metrics_uplift_header")] = eval_uplift
1274
1264
 
1275
1265
  metrics.append(eval_metrics)
1276
1266
 
@@ -284,8 +284,8 @@ quality_metrics_segment_header=Dataset type
284
284
  quality_metrics_match_rate_header=Match rate
285
285
  quality_metrics_baseline_header=Baseline {}
286
286
  quality_metrics_enriched_header=Enriched {}
287
- quality_metrics_uplift_header=Uplift, abs
288
- quality_metrics_uplift_perc_header=Uplift, %
287
+ quality_metrics_uplift_header=Uplift
288
+ quality_metrics_uplift_prc_header=Uplift, %
289
289
 
290
290
  # Legacy native api messages
291
291
  dataset_dataframe_or_path_empty=Either `df` or `path` must be provided
@@ -1 +0,0 @@
1
- __version__ = "1.2.96a2"
File without changes
File without changes
File without changes