PyPI - TSUMUGI - Versions diffs - 1.0.1__py3-none-any.whl - Mend

TSUMUGI 1.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (64) hide show

TSUMUGI/annotator.py +103 -0
TSUMUGI/argparser.py +599 -0
TSUMUGI/core.py +185 -0
TSUMUGI/data/impc_phenodigm.csv +3406 -0
TSUMUGI/data/mp.obo +143993 -0
TSUMUGI/filterer.py +36 -0
TSUMUGI/formatter.py +122 -0
TSUMUGI/genewise_annotation_builder.py +94 -0
TSUMUGI/io_handler.py +189 -0
TSUMUGI/main.py +300 -0
TSUMUGI/network_constructor.py +603 -0
TSUMUGI/ontology_handler.py +62 -0
TSUMUGI/pairwise_similarity_builder.py +66 -0
TSUMUGI/report_generator.py +122 -0
TSUMUGI/similarity_calculator.py +498 -0
TSUMUGI/subcommands/count_filterer.py +47 -0
TSUMUGI/subcommands/genes_filterer.py +89 -0
TSUMUGI/subcommands/graphml_builder.py +158 -0
TSUMUGI/subcommands/life_stage_filterer.py +48 -0
TSUMUGI/subcommands/mp_filterer.py +142 -0
TSUMUGI/subcommands/score_filterer.py +22 -0
TSUMUGI/subcommands/sex_filterer.py +48 -0
TSUMUGI/subcommands/webapp_builder.py +358 -0
TSUMUGI/subcommands/zygosity_filterer.py +48 -0
TSUMUGI/validator.py +65 -0
TSUMUGI/web/app/css/app.css +1129 -0
TSUMUGI/web/app/genelist/network_genelist.html +339 -0
TSUMUGI/web/app/genelist/network_genelist.js +421 -0
TSUMUGI/web/app/js/data/dataLoader.js +41 -0
TSUMUGI/web/app/js/export/graphExporter.js +214 -0
TSUMUGI/web/app/js/graph/centrality.js +495 -0
TSUMUGI/web/app/js/graph/components.js +30 -0
TSUMUGI/web/app/js/graph/filters.js +158 -0
TSUMUGI/web/app/js/graph/highlighter.js +52 -0
TSUMUGI/web/app/js/graph/layoutController.js +454 -0
TSUMUGI/web/app/js/graph/valueScaler.js +43 -0
TSUMUGI/web/app/js/search/geneSearcher.js +93 -0
TSUMUGI/web/app/js/search/phenotypeSearcher.js +292 -0
TSUMUGI/web/app/js/ui/dynamicFontSize.js +30 -0
TSUMUGI/web/app/js/ui/mobilePanel.js +77 -0
TSUMUGI/web/app/js/ui/slider.js +22 -0
TSUMUGI/web/app/js/ui/tooltips.js +514 -0
TSUMUGI/web/app/js/viewer/pageSetup.js +217 -0
TSUMUGI/web/app/viewer.html +515 -0
TSUMUGI/web/app/viewer.js +1593 -0
TSUMUGI/web/css/sanitize.css +363 -0
TSUMUGI/web/css/top.css +391 -0
TSUMUGI/web/image/tsumugi-favicon.ico +0 -0
TSUMUGI/web/image/tsumugi-icon.png +0 -0
TSUMUGI/web/image/tsumugi-logo.png +0 -0
TSUMUGI/web/image/tsumugi-logo.svg +69 -0
TSUMUGI/web/js/genelist_formatter.js +123 -0
TSUMUGI/web/js/top.js +338 -0
TSUMUGI/web/open_webapp_linux.sh +25 -0
TSUMUGI/web/open_webapp_mac.command +25 -0
TSUMUGI/web/open_webapp_windows.bat +37 -0
TSUMUGI/web/serve_index.py +110 -0
TSUMUGI/web/template/template_index.html +197 -0
TSUMUGI/web_deployer.py +150 -0
tsumugi-1.0.1.dist-info/METADATA +504 -0
tsumugi-1.0.1.dist-info/RECORD +64 -0
tsumugi-1.0.1.dist-info/WHEEL +4 -0
tsumugi-1.0.1.dist-info/entry_points.txt +3 -0
tsumugi-1.0.1.dist-info/licenses/LICENSE +21 -0

TSUMUGI/annotator.py ADDED Viewed

@@ -0,0 +1,103 @@
+from __future__ import annotations
+import re
+from collections.abc import Generator, Iterable, Iterator
+###########################################################
+# annotate_life_stage
+###########################################################
+def _annotate_life_stage(procedure_name: str, pipeline_name: str, embryo_pattern: re.Pattern) -> str:
+    """
+    Classify one record as "Embryo", "Interval", "Late" or "Early".
+    A match of ``embryo_pattern`` anywhere in ``procedure_name`` takes precedence.
+    Otherwise ``pipeline_name`` is checked for "Interval"/"interval", then for
+    "Late"/"late"; anything left over is reported as "Early".
+    """
+    if embryo_pattern.search(procedure_name) is not None:
+        return "Embryo"
+    # Only the capitalised and the all-lowercase spellings are recognised.
+    for stage in ("Interval", "Late"):
+        if stage in pipeline_name or stage.lower() in pipeline_name:
+            return stage
+    return "Early"
+def annotate_life_stage(records_annotated, embryo_assays: set[str]) -> Iterator[dict]:
+    """
+    Add a "life_stage" key to every record and yield the records lazily.
+    Each record must provide "procedure_name" and "pipeline_name"; it is
+    mutated in place and the same dict object is yielded.
+    A procedure counts as an embryo assay when its name contains any of the
+    literal strings in ``embryo_assays`` (they are regex-escaped before use).
+    """
+    if embryo_assays:
+        embryo_pattern = re.compile("|".join(map(re.escape, embryo_assays)))
+    else:
+        # Joining nothing gives the empty pattern, which matches every string and
+        # would label all records "Embryo"; use a pattern that can never match.
+        embryo_pattern = re.compile(r"(?!)")
+    for record in records_annotated:
+        record["life_stage"] = _annotate_life_stage(record["procedure_name"], record["pipeline_name"], embryo_pattern)
+        yield record
+###########################################################
+# annotate_sexual_dimorphism
+###########################################################
+def _annotate_sexual_dimorphism(
+    female_ko_effect_p_value: float, male_ko_effect_p_value: float, threshold: float = 1e-4
+) -> str:
+    """
+    Name the single sex whose knockout-effect p-value passes the threshold.
+    Returns "Female" or "Male" when exactly that sex's p-value is at or below
+    ``threshold`` while the other one is strictly above it, and the string
+    "None" in every other case.
+    """
+    female_only = female_ko_effect_p_value <= threshold and male_ko_effect_p_value > threshold
+    if female_only:
+        return "Female"
+    male_only = male_ko_effect_p_value <= threshold and female_ko_effect_p_value > threshold
+    return "Male" if male_only else "None"
+def annotate_sexual_dimorphism(records_annotated, threshold: float = 1e-4) -> Generator[dict]:
+    """
+    Add a "sexual_dimorphism" key to every record and yield the records lazily.
+    The label is derived from the record's "female_ko_effect_p_value" and
+    "male_ko_effect_p_value" using ``threshold``. For a "Female" or "Male" label
+    the record's "effect_size" is replaced by the matching sex-specific
+    parameter estimate; otherwise "effect_size" is not touched.
+    Records are mutated in place and the same dict object is yielded.
+    """
+    estimate_key_by_sex = {
+        "Female": "female_ko_parameter_estimate",
+        "Male": "male_ko_parameter_estimate",
+    }
+    for record in records_annotated:
+        dimorphism = _annotate_sexual_dimorphism(
+            record["female_ko_effect_p_value"], record["male_ko_effect_p_value"], threshold
+        )
+        record["sexual_dimorphism"] = dimorphism
+        # "None" has no entry in the table, so effect_size stays as it arrived.
+        estimate_key = estimate_key_by_sex.get(dimorphism)
+        if estimate_key is not None:
+            record["effect_size"] = record[estimate_key]
+        yield record
+###########################################################
+# annotate_diseases
+###########################################################
+def annotate_diseases(records_annotated, disease_annotations_by_gene: dict) -> Generator[dict]:
+    """
+    Add a "disease_annotation" list to every record and yield each record once.
+    Non-significant records (falsy "significant") receive an empty list.
+    Significant records receive the sorted, de-duplicated "disorder_name" values
+    of the entries stored under their "marker_symbol" in
+    ``disease_annotations_by_gene`` whose "zygosity" and "life_stage" both equal
+    the record's. Records are mutated in place.
+    """
+    for record in records_annotated:
+        if not record["significant"]:
+            # Non-significant records carry no disease annotation but must still
+            # be passed downstream instead of being silently dropped.
+            record["disease_annotation"] = []
+            yield record
+            continue
+        record_zygosity = record["zygosity"]
+        record_life_stage = record["life_stage"]
+        disorder_names = {
+            disease_annotation["disorder_name"]
+            for disease_annotation in disease_annotations_by_gene.get(record["marker_symbol"], ())
+            if record_zygosity == disease_annotation["zygosity"]
+            and record_life_stage == disease_annotation["life_stage"]
+        }
+        record["disease_annotation"] = sorted(disorder_names)
+        yield record
+def annotate_significant(records_annotated: Iterable[dict]) -> Generator[dict]:
+    """
+    Flag each record as significant or not and yield it exactly once.
+    A record with a truthy "mp_term_id" is marked significant and otherwise left
+    as it is. Any other record is marked non-significant, gets the neutral
+    statistics effect_size 0.0 and p_value 1.0, and takes the last
+    comma-separated entry of "intermediate_mp_term_id" and
+    "intermediate_mp_term_name" as its MP term. Records are mutated in place.
+    """
+    for record in records_annotated:
+        if record["mp_term_id"]:
+            record["significant"] = True
+            yield record
+            # Without this the significant record would fall through, be
+            # overwritten with the non-significant defaults and be yielded twice.
+            continue
+        record["effect_size"] = 0.0
+        record["p_value"] = 1.0
+        record["significant"] = False
+        record["mp_term_id"] = record["intermediate_mp_term_id"].split(",")[-1]
+        record["mp_term_name"] = record["intermediate_mp_term_name"].split(",")[-1]
+        yield record

TSUMUGI/argparser.py ADDED Viewed

@@ -0,0 +1,599 @@
+from __future__ import annotations
+import argparse
+from importlib.metadata import PackageNotFoundError, version as pkg_version
+from importlib.resources import files
+from pathlib import Path
+def _get_version() -> str:
+    """
+    Return the version of the installed "tsumugi" distribution.
+    The lookup key must match [project.name] in pyproject.toml (the distribution name).
+    The placeholder "not-available" is returned when no such distribution is installed.
+    """
+    try:
+        installed_version = pkg_version("tsumugi")
+    except PackageNotFoundError:
+        installed_version = "not-available"
+    return installed_version
+def _add_pairwise_input(subparser: argparse.ArgumentParser) -> None:
+    """Register the optional ``--in`` option (dest ``path_pairwise``) on ``subparser``."""
+    subparser.add_argument(
+        "--in",
+        dest="path_pairwise",
+        type=str,
+        required=False,
+        help=(
+            "Path to 'pairwise_similarity_annotations' file (JSONL or JSONL.gz).\n"
+            "If omitted, data are read from STDIN.\n"
+        ),
+    )
+def _add_mp_obo(subparser: argparse.ArgumentParser) -> None:
+    """Register the optional ``-m/--mp_obo`` ontology path on ``subparser``."""
+    subparser.add_argument(
+        "-m",
+        "--mp_obo",
+        type=str,
+        required=False,
+        help=(
+            "Path to Mammalian Phenotype ontology file (mp.obo).\n"
+            "Used to map and infer hierarchical relationships among MP terms.\n"
+            "If not available, download 'mp.obo' manually from:\n"
+            "https://obofoundry.org/ontology/mp.html"
+        ),
+    )
+def _add_genewise_annotations(
+    subparser: argparse.ArgumentParser, *, required: bool, extra_help: str = ""
+) -> None:
+    """Register ``-a/--genewise_annotations`` (dest ``path_genewise``); ``extra_help`` is appended to the help."""
+    subparser.add_argument(
+        "-a",
+        "--genewise_annotations",
+        dest="path_genewise",
+        type=str,
+        required=required,
+        help="Path to the 'genewise_phenotype_annotations' file (JSONL or JSONL.gz).\n" + extra_help,
+    )
+def _add_granularity_flags(group, genewise_help: str, pairwise_help: str) -> None:
+    """Register the ``-g/--genewise`` and ``-p/--pairwise`` switches on ``group``."""
+    group.add_argument("-g", "--genewise", action="store_true", help=genewise_help)
+    group.add_argument("-p", "--pairwise", action="store_true", help=pairwise_help)
+def _add_keep_drop_subcommand(subparsers, name: str, trait: str, choices: tuple, metavar: str) -> None:
+    """Register a subcommand offering exactly one of ``-k/--keep`` or ``-d/--drop`` over ``choices``, plus ``--in``."""
+    subparser = subparsers.add_parser(
+        name,
+        help=f"Filter gene pairs by {trait} of phenotype annotations",
+        formatter_class=argparse.RawTextHelpFormatter,
+    )
+    group = subparser.add_mutually_exclusive_group(required=True)
+    group.add_argument(
+        "-k",
+        "--keep",
+        choices=choices,
+        metavar=metavar,
+        help=f"Keep ONLY annotations with the specified {trait}",
+    )
+    group.add_argument(
+        "-d",
+        "--drop",
+        choices=choices,
+        metavar=metavar,
+        help=f"Drop annotations with the specified {trait}",
+    )
+    _add_pairwise_input(subparser)
+def build_parser() -> argparse.ArgumentParser:
+    """
+    Build the TSUMUGI command-line parser.
+    The parser exposes ``-v/--version`` plus one required subcommand, stored in
+    ``args.cmd``: run, mp, count, score, genes, life-stage, sex, zygosity,
+    build-graphml or build-webapp. Only argparse's own checks (required options,
+    choices, mutually exclusive groups) are configured here.
+    """
+    raw_text = argparse.RawTextHelpFormatter
+    genewise_count_help = "Filter by number of phenotypes per KO mouse"
+    pairwise_count_help = "Filter by number of shared phenotypes between KO pairs"
+    parser = argparse.ArgumentParser(
+        description="Run TSUMUGI pipeline and subcommands",
+        formatter_class=raw_text,
+    )
+    # tsumugi -v / --version
+    parser.add_argument(
+        "-v",
+        "--version",
+        action="version",
+        version=f"%(prog)s {_get_version()}",
+        help="Show TSUMUGI version and exit.",
+    )
+    subparsers = parser.add_subparsers(dest="cmd", required=True)
+    # =========================================================
+    # run: Run TSUMUGI pipeline
+    # =========================================================
+    run = subparsers.add_parser("run", help="Run TSUMUGI pipeline", formatter_class=raw_text)
+    run.add_argument(
+        "-o",
+        "--output_dir",
+        type=str,
+        required=True,
+        help=(
+            "Output directory for TSUMUGI results.\n"
+            "All generated files (intermediate and final results) will be saved here.\n"
+        ),
+    )
+    run.add_argument(
+        "-s",
+        "--statistical_results",
+        type=str,
+        required=True,
+        help=(
+            "Path to IMPC statistical_results_ALL.csv file.\n"
+            "This file contains statistical test results (effect sizes, p-values, etc.) "
+            "for all IMPC phenotyping experiments.\n"
+            "If not available, download 'statistical-results-ALL.csv.gz' manually from:\n"
+            "https://ftp.ebi.ac.uk/pub/databases/impc/all-data-releases/latest/TSUMUGI-results/"
+        ),
+    )
+    _add_mp_obo(run)
+    run.add_argument(
+        "-i",
+        "--impc_phenodigm",
+        type=str,
+        required=False,
+        help=(
+            "Path to IMPC Phenodigm annotation file (impc_phenodigm.csv).\n"
+            "This file links mouse phenotypes to human diseases based on Phenodigm similarity.\n"
+            "If not available, download manually from:\n"
+            "https://diseasemodels.research.its.qmul.ac.uk/\n"
+        ),
+    )
+    run.add_argument(
+        "-t",
+        "--threads",
+        type=int,
+        default=1,
+        help=("Number of threads to use for TSUMUGI pipeline.\nIf not specified, defaults to 1.\n"),
+    )
+    # Debug options (hidden) to retain temporary files
+    run.add_argument("--debug", action="store_true", help=argparse.SUPPRESS)
+    # Web specific debug options (hidden) to
+    # skip preprocessing and retain temporary files
+    run.add_argument("--debug_web", action="store_true", help=argparse.SUPPRESS)
+    # =========================================================
+    # mp: Filter gene pairs by a specific MP term and its descendants
+    # =========================================================
+    mp_parser = subparsers.add_parser(
+        "mp",
+        help="Filter gene pairs by a specific MP term and its descendants",
+        formatter_class=raw_text,
+    )
+    # --- Group A: MP include/exclude ---
+    group_mp_filter = mp_parser.add_mutually_exclusive_group(required=True)
+    group_mp_filter.add_argument(
+        "-i",
+        "--include",
+        dest="include",
+        metavar="MP_ID",
+        help=("Include gene pairs that share the specified MP term (descendants included).\nExample: -i MP:0001146"),
+    )
+    group_mp_filter.add_argument(
+        "-e",
+        "--exclude",
+        dest="exclude",
+        metavar="MP_ID",
+        help=(
+            "Exclude gene pairs that (when measured) lack the specified MP term "
+            "(descendants included).\n"
+            "Example: -e MP:0001146"
+        ),
+    )
+    # --- Group B: granularity (genewise / pairwise) ---
+    _add_granularity_flags(
+        mp_parser.add_mutually_exclusive_group(required=False), genewise_count_help, pairwise_count_help
+    )
+    _add_mp_obo(mp_parser)
+    _add_genewise_annotations(
+        mp_parser,
+        required=False,
+        extra_help=(
+            "Required when using '-e/--exclude' to determine genes that were measured\n"
+            "and showed no phenotype for the target MP term.\n"
+        ),
+    )
+    _add_pairwise_input(mp_parser)
+    # Annotations
+    mp_parser.add_argument(
+        "--life_stage",
+        type=str,
+        required=False,
+        help=("Filter by life stage. 'Embryo', 'Early', 'Interval', and 'Late'."),
+    )
+    mp_parser.add_argument(
+        "--sex",
+        type=str,
+        required=False,
+        help=("Filter by sexual dimorphism. 'Male' or 'Female'."),
+    )
+    mp_parser.add_argument(
+        "--zygosity", type=str, required=False, help=("Filter by zygosity.  'Homo', 'Hetero' or 'Hemi'.")
+    )
+    # =========================================================
+    # count (Filter by the number of phenotypes)
+    # =========================================================
+    count_parser = subparsers.add_parser(
+        "count",
+        help="Filter genes or gene pairs by the number of phenotypes",
+        description="Filter genes based on the number of detected phenotypes per KO or shared between KO pairs.",
+    )
+    _add_granularity_flags(
+        count_parser.add_mutually_exclusive_group(required=True), genewise_count_help, pairwise_count_help
+    )
+    count_parser.add_argument("--min", type=int, help="Minimum number threshold")
+    count_parser.add_argument("--max", type=int, help="Maximum number threshold")
+    _add_pairwise_input(count_parser)
+    _add_genewise_annotations(
+        count_parser,
+        required=False,
+        extra_help="Required when using '-g/--genewise' to determine genes that were measured.\n",
+    )
+    # =========================================================
+    # score (Filter by the similarity score of gene pairs)
+    # =========================================================
+    score_parser = subparsers.add_parser(
+        "score",
+        help="Filter genes or gene pairs by the similarity score",
+        description="Filter genes based on the similarity score per KO or shared between KO pairs.",
+    )
+    score_parser.add_argument("--min", type=int, help="Minimum number threshold")
+    score_parser.add_argument("--max", type=int, help="Maximum number threshold")
+    _add_pairwise_input(score_parser)
+    # =========================================================
+    # genes (Filter by gene symbols or gene pairs)
+    # =========================================================
+    genes_parser = subparsers.add_parser(
+        "genes",
+        help="Filter gene pairs by gene symbols or gene pairs of phenotype annotations",
+        formatter_class=raw_text,
+    )
+    group_genes = genes_parser.add_mutually_exclusive_group(required=True)
+    group_genes.add_argument(
+        "-k",
+        "--keep",
+        metavar="GENE_SYMBOL",
+        help="Keep ONLY annotations with the specified gene symbols (comma-separated or path of text file)",
+    )
+    group_genes.add_argument(
+        "-d",
+        "--drop",
+        metavar="GENE_SYMBOL",
+        help="Drop annotations with the specified gene symbols (comma-separated or path of text file)",
+    )
+    _add_granularity_flags(
+        genes_parser.add_mutually_exclusive_group(required=False),
+        "Filter by user-provided gene symbols",
+        "Filter by user-provided  gene pairs",
+    )
+    _add_pairwise_input(genes_parser)
+    # =========================================================
+    # life-stage / sex / zygosity (keep or drop by one categorical annotation)
+    # =========================================================
+    _add_keep_drop_subcommand(
+        subparsers, "life-stage", "life stage", ("Embryo", "Early", "Interval", "Late"), "LIFE_STAGE"
+    )
+    _add_keep_drop_subcommand(subparsers, "sex", "sexual dimorphism", ("Male", "Female", "None"), "SEX")
+    _add_keep_drop_subcommand(subparsers, "zygosity", "zygosity", ("Homo", "Hetero", "Hemi"), "ZYGOSITY")
+    # =========================================================
+    # build-graphml
+    # =========================================================
+    build_graphml_parser = subparsers.add_parser(
+        "build-graphml",
+        help="Build a GraphML file from gene pair similarity annotations",
+        formatter_class=raw_text,
+    )
+    _add_pairwise_input(build_graphml_parser)
+    _add_genewise_annotations(build_graphml_parser, required=True)
+    # =========================================================
+    # build-webapp
+    # =========================================================
+    build_webapp_parser = subparsers.add_parser(
+        "build-webapp",
+        help="Build a webapp from gene pair similarity annotations",
+        formatter_class=raw_text,
+    )
+    _add_pairwise_input(build_webapp_parser)
+    _add_genewise_annotations(build_webapp_parser, required=True)
+    build_webapp_parser.add_argument(
+        "-o",
+        "--out",
+        dest="output_dir",
+        type=str,
+        required=True,
+        help="Output directory for the generated web application.\n",
+    )
+    #######################################################
+    # Return parser
+    #######################################################
+    return parser
+###############################################################################
+# main
+###############################################################################
+def parse_args(argv=None):
+    """
+    Parse command-line arguments and apply per-subcommand defaults and checks.
+    ``argv`` is handed unchanged to ``ArgumentParser.parse_args``.
+    Returns the populated namespace with an extra ``version`` attribute.
+    Invalid option combinations are reported through ``parser.error``.
+    """
+    parser = build_parser()
+    args = parser.parse_args(argv)
+    ########################################################################
+    # run
+    ########################################################################
+    if args.cmd == "run":
+        # If args.mp_obo or args.impc_phenodigm are not provided,
+        # use the built-in files inside the TSUMUGI/data directory.
+        if not args.mp_obo:
+            args.mp_obo = str(files("TSUMUGI") / "data" / "mp.obo")
+        if not args.impc_phenodigm:
+            args.impc_phenodigm = str(files("TSUMUGI") / "data" / "impc_phenodigm.csv")
+    ########################################################################
+    # mp
+    ########################################################################
+    if args.cmd == "mp":
+        # If args.mp_obo is not provided,
+        # use the built-in files inside the TSUMUGI/data directory.
+        if not args.mp_obo:
+            args.mp_obo = str(files("TSUMUGI") / "data" / "mp.obo")
+        if args.exclude and not args.path_genewise:
+            parser.error(
+                "mp: '-a/--genewise_annotations' is required when using '-e/--exclude'.\n"
+                "Path to the 'genewise_phenotype_annotations' file (JSONL or JSONL.gz).\n"
+            )
+        # -g and -p are mutually exclusive, so pairwise is simply "not genewise".
+        # This keeps an explicit -p set and makes pairwise the default when
+        # neither flag is given.
+        args.pairwise = not args.genewise
+    ########################################################################
+    # count / score
+    ########################################################################
+    # When using the count/score subcommand, at least one of --min or --max must be specified.
+    if args.cmd == "count" and args.min is None and args.max is None:
+        parser.error("count: At least one of '--min' or '--max' must be specified.")
+    if args.cmd == "score" and args.min is None and args.max is None:
+        parser.error("score: At least one of '--min' or '--max' must be specified.")
+    # When using -g / --genewise with the count subcommand,
+    # the --genewise_annotations option is required.
+    if args.cmd == "count" and args.genewise and not args.path_genewise:
+        parser.error(
+            "count: '-a/--genewise_annotations' is required when using '-g/--genewise'.\n"
+            "Provide the gene phenotype annotations JSONL(.gz) file to identify genes that were measured."
+        )
+    ########################################################################
+    # genes
+    ########################################################################
+    if args.cmd == "genes":
+        # Exactly one of -k / -d is set (required mutually exclusive group).
+        path_arg = args.keep or args.drop
+        # Default to pairwise if neither -g / --genewise nor -p / --pairwise is specified.
+        args.pairwise = not args.genewise
+        # In pairwise mode, the gene list must be provided as a text file.
+        if args.pairwise and not Path(path_arg).is_file():
+            parser.error(
+                "genes --pairwise: Please provide a valid path to a text file containing gene symbols or gene pairs."
+            )
+    ########################################################################
+    # build-webapp
+    ########################################################################
+    # For build-webapp, check that output_dir is a directory (not a file)
+    if args.cmd == "build-webapp" and Path(args.output_dir).suffix:
+        parser.error(
+            f"build-webapp: {args.output_dir} looks like a file name (has extension). Please specify a directory."
+        )
+    args.version = _get_version()
+    return args