sws-spark-dissemination-helper 0.0.90__tar.gz → 0.0.92__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (16)
  1. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/PKG-INFO +1 -1
  2. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/pyproject.toml +1 -1
  3. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/SWSBronzeIcebergSparkHelper.py +12 -7
  4. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/.gitignore +0 -0
  5. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/LICENSE +0 -0
  6. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/README.md +0 -0
  7. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/old_requirements.txt +0 -0
  8. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/requirements.txt +0 -0
  9. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/SWSGoldIcebergSparkHelper.py +0 -0
  10. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/SWSPostgresSparkReader.py +0 -0
  11. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/SWSSilverIcebergSparkHelper.py +0 -0
  12. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/__init__.py +0 -0
  13. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/constants.py +0 -0
  14. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/src/sws_spark_dissemination_helper/utils.py +0 -0
  15. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/tests/__init__.py +0 -0
  16. {sws_spark_dissemination_helper-0.0.90 → sws_spark_dissemination_helper-0.0.92}/tests/test.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: sws-spark-dissemination-helper
3
- Version: 0.0.90
3
+ Version: 0.0.92
4
4
  Summary: A Python helper package providing streamlined Spark functions for efficient data dissemination processes
5
5
  Project-URL: Repository, https://bitbucket.org/cioapps/sws-it-python-spark-dissemination-helper
6
6
  Author-email: Daniele Mansillo <danielemansillo@gmail.com>
@@ -4,7 +4,7 @@ build-backend = "hatchling.build"
4
4
 
5
5
  [project]
6
6
  name = "sws-spark-dissemination-helper"
7
- version = "0.0.90"
7
+ version = "0.0.92"
8
8
  dependencies = [
9
9
  "annotated-types==0.7.0",
10
10
  "boto3==1.36.18",
@@ -447,18 +447,23 @@ class SWSBronzeIcebergSparkHelper:
447
447
  def write_bronze_disseminated_tag_data_to_iceberg_and_csv(
448
448
  self, dimensions: Dict[str, List[str]]
449
449
  ) -> DataFrame:
450
- self.spark.sql(
451
- f"ALTER TABLE {self.iceberg_tables.BRONZE.iceberg_id}.`tag_{self.tag_name}` CREATE OR REPLACE BRANCH `diss_tag_{self.tag_name}`" # AS OF VERSION `{tag_name}`
452
- )
450
+
451
+ create_branch_query = f"ALTER TABLE {self.iceberg_tables.BRONZE.iceberg_id}.`tag_{self.tag_name}` CREATE OR REPLACE BRANCH `diss_tag_{self.tag_name}`" # AS OF VERSION `{tag_name}`
452
+ logging.info(f"create_branch_query: {create_branch_query}")
453
+ self.spark.sql(create_branch_query)
454
+ logging.info(f"dimensions: {dimensions}")
453
455
 
454
456
  for dimension_name, codes in dimensions.items():
457
+ logging.info(f"dimension_name: {dimension_name}")
458
+ logging.info(f"codes: {codes}")
455
459
  if len(codes) != 0:
456
460
  not_in_codes = ",".join([f"'{code}'" for code in codes])
457
- self.spark.sql(
458
- f"DELETE FROM {self.iceberg_tables.BRONZE.iceberg_id}.`branch_diss_tag_{self.tag_name}` WHERE {dimension_name} NOT IN ({not_in_codes})"
459
- )
461
+ delete_from_branch_query = f"DELETE FROM {self.iceberg_tables.BRONZE.iceberg_id}.`branch_diss_tag_{self.tag_name}` WHERE {dimension_name} NOT IN ({not_in_codes})"
462
+ logging.info(f"delete_from_branch_query: {delete_from_branch_query}")
463
+ self.spark.sql(delete_from_branch_query)
464
+
460
465
  self.disseminated_tag_df = self.spark.read.option(
461
- "branch", self.tag_name
466
+ "branch", f"`diss_tag_{self.tag_name}`"
462
467
  ).table(self.iceberg_tables.BRONZE.iceberg_id)
463
468
 
464
469
  disseminated_tag_df = self.disseminated_tag_df.withColumn(