PyPI - pywombat - Versions diffs - 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

pywombat 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

pywombat/cli.py CHANGED Viewed

@@ -1,5 +1,6 @@
 """CLI for wombat tool."""
+import gzip
 import re
 import warnings
 from pathlib import Path
@@ -22,9 +23,9 @@ import yaml
     "-f",
     "--format",
     "output_format",
-    type=click.Choice(["tsv", "parquet"], case_sensitive=False),
+    type=click.Choice(["tsv", "tsv.gz", "parquet"], case_sensitive=False),
     default="tsv",
-    help="Output format: tsv (default) or parquet.",
+    help="Output format: tsv (default), tsv.gz (compressed), or parquet.",
 )
 @click.option("-v", "--verbose", is_flag=True, help="Enable verbose output.")
 @click.option(
@@ -73,7 +74,13 @@ def cli(
         if verbose:
             click.echo(f"Reading input file: {input_file}", err=True)
-        # Read the TSV file
+        # Detect if file is gzipped based on extension
+        is_gzipped = str(input_file).endswith(".gz")
+        if verbose and is_gzipped:
+            click.echo("Detected gzipped file", err=True)
+        # Read the TSV file (handles both plain and gzipped)
         df = pl.read_csv(input_file, separator="\t")
         if verbose:
@@ -104,6 +111,23 @@ def cli(
                 click.echo(f"Reading filter config: {filter_config}", err=True)
             filter_config_data = load_filter_config(filter_config)
+        # Determine output prefix
+        if output is None:
+            # Generate default output prefix from input filename
+            input_stem = input_file.name
+            # Remove .tsv.gz or .tsv extension
+            if input_stem.endswith(".tsv.gz"):
+                input_stem = input_stem[:-7]  # Remove .tsv.gz
+            elif input_stem.endswith(".tsv"):
+                input_stem = input_stem[:-4]  # Remove .tsv
+            # Add config name if filter is provided
+            if filter_config:
+                config_name = filter_config.stem  # Get basename without extension
+                output = f"{input_stem}.{config_name}"
+            else:
+                output = input_stem
         # Apply filters and write output
         if filter_config_data:
             apply_filters_and_write(
@@ -115,25 +139,19 @@ def cli(
             )
         else:
             # No filters - write single output file
-            if output:
-                # Construct output filename with prefix and format
-                output_path = Path(f"{output}.{output_format}")
+            # Construct output filename with prefix and format
+            output_path = Path(f"{output}.{output_format}")
-                if output_format == "tsv":
-                    formatted_df.write_csv(output_path, separator="\t")
-                elif output_format == "parquet":
-                    formatted_df.write_parquet(output_path)
+            if output_format == "tsv":
+                formatted_df.write_csv(output_path, separator="\t")
+            elif output_format == "tsv.gz":
+                csv_content = formatted_df.write_csv(separator="\t")
+                with gzip.open(output_path, "wt") as f:
+                    f.write(csv_content)
+            elif output_format == "parquet":
+                formatted_df.write_parquet(output_path)
-                click.echo(f"Formatted data written to {output_path}", err=True)
-            else:
-                # Write to stdout (only for TSV format)
-                if output_format != "tsv":
-                    click.echo(
-                        "Error: stdout output only supported for TSV format. Use -o to specify an output prefix for parquet.",
-                        err=True,
-                    )
-                    raise click.Abort()
-                click.echo(formatted_df.write_csv(separator="\t"), nl=False)
+            click.echo(f"Formatted data written to {output_path}", err=True)
     except Exception as e:
         click.echo(f"Error: {e}", err=True)
@@ -555,11 +573,15 @@ def apply_impact_filters(
             )
         # Write to file
-        output_filename = f"{output_prefix}_{name}.{output_format}"
+        output_filename = f"{output_prefix}.{name}.{output_format}"
         output_path = Path(output_filename)
         if output_format == "tsv":
             filtered_df.write_csv(output_path, separator="\t")
+        elif output_format == "tsv.gz":
+            csv_content = filtered_df.write_csv(separator="\t")
+            with gzip.open(output_path, "wt") as f:
+                f.write(csv_content)
         elif output_format == "parquet":
             filtered_df.write_parquet(output_path)
@@ -599,6 +621,10 @@ def apply_filters_and_write(
             if output_format == "tsv":
                 filtered_df.write_csv(output_path, separator="\t")
+            elif output_format == "tsv.gz":
+                csv_content = filtered_df.write_csv(separator="\t")
+                with gzip.open(output_path, "wt") as f:
+                    f.write(csv_content)
             elif output_format == "parquet":
                 filtered_df.write_parquet(output_path)

{pywombat-0.1.0.dist-info → pywombat-0.2.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: pywombat
-Version: 0.1.0
+Version: 0.2.0
 Summary: A CLI tool for processing and filtering bcftools tabulated TSV files with pedigree support
 Project-URL: Homepage, https://github.com/bourgeron-lab/pywombat
 Project-URL: Repository, https://github.com/bourgeron-lab/pywombat

pywombat-0.2.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,6 @@
+pywombat/__init__.py,sha256=iIPN9vJtsIUhl_DiKNnknxCamLinfayodLLFK8y-aJg,54
+pywombat/cli.py,sha256=PZKV6FoqZyGgG7_mMIO2FzyeONdBaCqnhDATYsQJqMo,33899
+pywombat-0.2.0.dist-info/METADATA,sha256=7Qg2XnaTM92pmIewu5fw_vrcQW5JCVkkj2q6mNC9v88,4982
+pywombat-0.2.0.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
+pywombat-0.2.0.dist-info/entry_points.txt,sha256=Vt7U2ypbiEgCBlEV71ZPk287H5_HKmPBT4iBu6duEcE,44
+pywombat-0.2.0.dist-info/RECORD,,

{pywombat-0.1.0.dist-info → pywombat-0.2.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: hatchling 1.27.0
+Generator: hatchling 1.28.0
 Root-Is-Purelib: true
 Tag: py3-none-any

pywombat-0.1.0.dist-info/RECORD DELETED Viewed

@@ -1,6 +0,0 @@
-pywombat/__init__.py,sha256=iIPN9vJtsIUhl_DiKNnknxCamLinfayodLLFK8y-aJg,54
-pywombat/cli.py,sha256=kUokXfnaSCKLXiCu7jXbYOPlGTtL5wSzocM9gFtPy30,32801
-pywombat-0.1.0.dist-info/METADATA,sha256=3RlA_lLC7hKUxIrhQvvbBKEolYGOl_EVJgyDfDLI0sU,4982
-pywombat-0.1.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-pywombat-0.1.0.dist-info/entry_points.txt,sha256=Vt7U2ypbiEgCBlEV71ZPk287H5_HKmPBT4iBu6duEcE,44
-pywombat-0.1.0.dist-info/RECORD,,

{pywombat-0.1.0.dist-info → pywombat-0.2.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

pywombat 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl

pywombat 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl