upgini 1.2.46__tar.gz → 1.2.47__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

Files changed (67)
  1. {upgini-1.2.46 → upgini-1.2.47}/PKG-INFO +1 -1
  2. upgini-1.2.47/src/upgini/__about__.py +1 -0
  3. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/http.py +19 -7
  4. upgini-1.2.46/src/upgini/__about__.py +0 -1
  5. {upgini-1.2.46 → upgini-1.2.47}/.gitignore +0 -0
  6. {upgini-1.2.46 → upgini-1.2.47}/LICENSE +0 -0
  7. {upgini-1.2.46 → upgini-1.2.47}/README.md +0 -0
  8. {upgini-1.2.46 → upgini-1.2.47}/pyproject.toml +0 -0
  9. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/__init__.py +0 -0
  10. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/ads.py +0 -0
  11. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/ads_management/__init__.py +0 -0
  12. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/ads_management/ads_manager.py +0 -0
  13. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/__init__.py +0 -0
  14. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/all_operands.py +0 -0
  15. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/binary.py +0 -0
  16. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/date.py +0 -0
  17. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/feature.py +0 -0
  18. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/groupby.py +0 -0
  19. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/operand.py +0 -0
  20. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/unary.py +0 -0
  21. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/autofe/vector.py +0 -0
  22. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/data_source/__init__.py +0 -0
  23. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/data_source/data_source_publisher.py +0 -0
  24. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/dataset.py +0 -0
  25. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/errors.py +0 -0
  26. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/features_enricher.py +0 -0
  27. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/lazy_import.py +0 -0
  28. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/mdc/__init__.py +0 -0
  29. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/mdc/context.py +0 -0
  30. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/metadata.py +0 -0
  31. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/metrics.py +0 -0
  32. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/normalizer/__init__.py +0 -0
  33. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/normalizer/normalize_utils.py +0 -0
  34. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/resource_bundle/__init__.py +0 -0
  35. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/resource_bundle/exceptions.py +0 -0
  36. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/resource_bundle/strings.properties +0 -0
  37. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  38. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/sampler/__init__.py +0 -0
  39. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/sampler/base.py +0 -0
  40. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/sampler/random_under_sampler.py +0 -0
  41. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/sampler/utils.py +0 -0
  42. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/search_task.py +0 -0
  43. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/spinner.py +0 -0
  44. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/Roboto-Regular.ttf +0 -0
  45. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/__init__.py +0 -0
  46. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/base_search_key_detector.py +0 -0
  47. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/blocked_time_series.py +0 -0
  48. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/country_utils.py +0 -0
  49. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/custom_loss_utils.py +0 -0
  50. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/cv_utils.py +0 -0
  51. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/datetime_utils.py +0 -0
  52. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/deduplicate_utils.py +0 -0
  53. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/display_utils.py +0 -0
  54. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/email_utils.py +0 -0
  55. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/fallback_progress_bar.py +0 -0
  56. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/feature_info.py +0 -0
  57. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/features_validator.py +0 -0
  58. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/format.py +0 -0
  59. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/ip_utils.py +0 -0
  60. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/phone_utils.py +0 -0
  61. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/postal_code_utils.py +0 -0
  62. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/progress_bar.py +0 -0
  63. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/sklearn_ext.py +0 -0
  64. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/target_utils.py +0 -0
  65. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/track_info.py +0 -0
  66. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/utils/warning_counter.py +0 -0
  67. {upgini-1.2.46 → upgini-1.2.47}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.46
3
+ Version: 1.2.47
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.2.47"
@@ -16,7 +16,7 @@ from typing import Any, Dict, List, Optional, Tuple
16
16
  from urllib.parse import urljoin
17
17
 
18
18
  import jwt
19
- import pandas as pd
19
+ # import pandas as pd
20
20
  import requests
21
21
  from pydantic import BaseModel
22
22
  from pythonjsonlogger import jsonlogger
@@ -422,6 +422,16 @@ class _RestClient:
422
422
  lambda: self._send_post_file_req_v2(api_path, files, trace_id=trace_id, need_json_response=False)
423
423
  )
424
424
 
425
+ @staticmethod
426
+ def compute_file_digest(filepath: str, algorithm="sha256", chunk_size=4096) -> str:
427
+ hash_func = getattr(hashlib, algorithm)()
428
+
429
+ with open(filepath, "rb") as f:
430
+ for chunk in iter(lambda: f.read(chunk_size), b""):
431
+ hash_func.update(chunk)
432
+
433
+ return hash_func.hexdigest()
434
+
425
435
  def initial_search_v2(
426
436
  self,
427
437
  trace_id: str,
@@ -442,9 +452,10 @@ class _RestClient:
442
452
  digest = md5_hash.hexdigest()
443
453
  metadata_with_md5 = metadata.copy(update={"checksumMD5": digest})
444
454
 
445
- digest_sha256 = hashlib.sha256(
446
- pd.util.hash_pandas_object(pd.read_parquet(file_path, engine="fastparquet")).values
447
- ).hexdigest()
455
+ # digest_sha256 = hashlib.sha256(
456
+ # pd.util.hash_pandas_object(pd.read_parquet(file_path, engine="fastparquet")).values
457
+ # ).hexdigest()
458
+ digest_sha256 = self.compute_file_digest(file_path)
448
459
  metadata_with_md5 = metadata_with_md5.copy(update={"digest": digest_sha256})
449
460
 
450
461
  with open(file_path, "rb") as file:
@@ -530,9 +541,10 @@ class _RestClient:
530
541
  digest = md5_hash.hexdigest()
531
542
  metadata_with_md5 = metadata.copy(update={"checksumMD5": digest})
532
543
 
533
- digest_sha256 = hashlib.sha256(
534
- pd.util.hash_pandas_object(pd.read_parquet(file_path, engine="fastparquet")).values
535
- ).hexdigest()
544
+ # digest_sha256 = hashlib.sha256(
545
+ # pd.util.hash_pandas_object(pd.read_parquet(file_path, engine="fastparquet")).values
546
+ # ).hexdigest()
547
+ digest_sha256 = self.compute_file_digest(file_path)
536
548
  metadata_with_md5 = metadata_with_md5.copy(update={"digest": digest_sha256})
537
549
 
538
550
  with open(file_path, "rb") as file:
@@ -1 +0,0 @@
1
- __version__ = "1.2.46"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes