PyPI - pheval - Versions diffs - 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

pheval 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of pheval might be problematic. Click here for more details.

Files changed (26)

pheval/analyse/analysis.py +61 -150
pheval/analyse/assess_prioritisation_base.py +108 -0
pheval/analyse/benchmark_db_manager.py +140 -0
pheval/analyse/benchmark_generator.py +47 -50
pheval/analyse/benchmarking_data.py +3 -2
pheval/analyse/disease_prioritisation_analysis.py +70 -219
pheval/analyse/gene_prioritisation_analysis.py +66 -242
pheval/analyse/generate_plots.py +81 -79
pheval/analyse/generate_summary_outputs.py +64 -134
pheval/analyse/parse_benchmark_summary.py +50 -37
pheval/analyse/parse_corpus.py +219 -0
pheval/analyse/rank_stats.py +177 -144
pheval/analyse/run_data_parser.py +108 -27
pheval/analyse/variant_prioritisation_analysis.py +78 -212
pheval/cli.py +2 -4
pheval/cli_pheval_utils.py +34 -245
pheval/prepare/create_noisy_phenopackets.py +78 -67
pheval-0.4.0.dist-info/METADATA +112 -0
{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/RECORD +22 -22
pheval/analyse/parse_pheval_result.py +0 -43
pheval/analyse/prioritisation_rank_recorder.py +0 -83
pheval/constants.py +0 -8
pheval-0.3.9.dist-info/METADATA +0 -35
{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/LICENSE +0 -0
{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/WHEEL +0 -0
{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/entry_points.txt +0 -0

{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/RECORD RENAMED Viewed

@@ -1,32 +1,32 @@
 pheval/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pheval/analyse/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-pheval/analyse/analysis.py,sha256=ponm3P8nvzJNmcrNZ2_KudEhWSaWshd_Gd30D-aau8s,7743
-pheval/analyse/benchmark_generator.py,sha256=AeuwbaPb4j_dyBGPRgEBxQk2NahDb5u4xHyFiqp5Fes,5943
-pheval/analyse/benchmarking_data.py,sha256=aNZkWdmWemlnC1Tg35MtR60S9YC71QWS2rMuzkUc3w0,768
+pheval/analyse/analysis.py,sha256=Yt2xH0WS_2NO13-wYvywzmCRCj8RinQ1MeozJQuGe3o,4009
+pheval/analyse/assess_prioritisation_base.py,sha256=znBscRTqIKxxZMHR-H6KrjFJ6Uv5P5HzwTQUWS6Eoos,3434
+pheval/analyse/benchmark_db_manager.py,sha256=RaAnvq5Tfvsw8161iQUe_P146X98BckMRhMq6BibwNI,5111
+pheval/analyse/benchmark_generator.py,sha256=-LljszuKAT3oJfGQn7JHAILCGg5QXYny4nPPf273g_E,5896
+pheval/analyse/benchmarking_data.py,sha256=aRvDmwqjFGKvWDRGjMwaQxfDZscptRBwI-rcSqY-X5s,913
 pheval/analyse/binary_classification_stats.py,sha256=E35YjvGM-zFnuEt8M3pgN03vBab4MH6ih726QKvuogg,12519
-pheval/analyse/disease_prioritisation_analysis.py,sha256=mGfGYF5Eu7LxyBkAy6xMG1nDURaPiJY4rRQyKDcQe-4,12451
-pheval/analyse/gene_prioritisation_analysis.py,sha256=4GhXTG3hgKicf8UQ1O3YCo0CVgIPIqdVB4IOt2-g5II,13454
-pheval/analyse/generate_plots.py,sha256=MFORnFTgoelYAahFlu3Dc3Rul4cwCg8Bloxe62vONSc,21350
-pheval/analyse/generate_summary_outputs.py,sha256=s9pXMSW6xm4ZBe1aCd0UJSaFiKBvpUfPwJ2BI4qfTas,6591
-pheval/analyse/parse_benchmark_summary.py,sha256=Y8uPTlHTEiaeVBOqxMcdOqjY3ZBtOS3DoRycL78Dzxg,2384
-pheval/analyse/parse_pheval_result.py,sha256=2-J_c90KSs49EDjMukl8dgQyWJ0lZMlF-9ZYzD9hWzg,1438
-pheval/analyse/prioritisation_rank_recorder.py,sha256=EVe8DoEvvp0_WMAcjfVxmDGGRFPEELi7hEVjH3sIpLY,3223
+pheval/analyse/disease_prioritisation_analysis.py,sha256=1Ut4u6p9mDGbGBoXrVxTuUgv_nrqxzBhq5N9jbGWRWs,5725
+pheval/analyse/gene_prioritisation_analysis.py,sha256=_7r16BC0S2H9rOY016mLLUg6PcxaCQOh5FQcNKFTy-4,5582
+pheval/analyse/generate_plots.py,sha256=rMSdgawGYYc7BAAolqz73TAnanKtrxCC48bI6WQq6xc,21455
+pheval/analyse/generate_summary_outputs.py,sha256=9v9w7le_wLxyjgUgxl6f0RXb2Qt-B3XrKdlmfT6DSjo,4160
+pheval/analyse/parse_benchmark_summary.py,sha256=vyAOIdIWF4rZjGTPFE69ajhEC9AkkN3QBVqSe_uYZsg,2946
+pheval/analyse/parse_corpus.py,sha256=N88enptR4qG6cmqXU_TKg8DMmCeFog37eeK5nFEMQOQ,8678
 pheval/analyse/prioritisation_result_types.py,sha256=qJoB6O-lFYmzAMcTQeDJZQNLJ6hleoKDYATTkhvFF98,1228
-pheval/analyse/rank_stats.py,sha256=knj1tsKrly17QgtOUVpqA14UjbO99N3ydkWN4xU6c2k,15785
-pheval/analyse/run_data_parser.py,sha256=HzBKsJL2skjmrRZdrF3VYzswtKNgbX6U5qhY_kqq9mA,1552
-pheval/analyse/variant_prioritisation_analysis.py,sha256=XSlAV2G7psXewPIoiUD_4jgFivcG1aOcy1jSPlSil5M,12196
-pheval/cli.py,sha256=X4tDi7e3VB3v2RawkqIbfv4SFPCBuQwMXMnYCPTGtIo,1570
+pheval/analyse/rank_stats.py,sha256=53ZickUtQlctYsorAIUwlCX7M6UC-wCxoV1MbL6F9gc,17987
+pheval/analyse/run_data_parser.py,sha256=VQBUoOIRYRWc5uqURUvaWdaW3E3C7Su0JvLavQLHQaY,4105
+pheval/analyse/variant_prioritisation_analysis.py,sha256=LPEZDhFfzx-sQl9g8pM700l4Zzpy6qdOS68vOV2mZA0,6020
+pheval/cli.py,sha256=EBGh6TIxAiWs0eDdQiefq6YuD0mb93siGsNmsVO1j7c,1527
 pheval/cli_pheval.py,sha256=fWbKUcPTZZSa1EJEtH_lNn1XE6qRApRHihqUZS5owrA,2424
-pheval/cli_pheval_utils.py,sha256=4jLSJm4AEXu0SBtXbg4eNYLbCNQqQgjroDpRxQX34-M,22333
+pheval/cli_pheval_utils.py,sha256=O6tWnE85QQHGNcP08OwJGANMfXJPsZtFEu-D6ATld00,16700
 pheval/config_parser.py,sha256=lh-Dy_FflXJUnRC3HYaEdSvPAsNZWQZlEr1hHQigrTM,1227
-pheval/constants.py,sha256=TWBgWOc05FGXFu63fs-hEHS2IJkLLAPHtMppiWBfBOg,349
 pheval/implementations/__init__.py,sha256=BMUTotjTdgy5j5xubWCIQgRXrSQ1ZIcjooer7r299Zo,1228
 pheval/infra/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pheval/infra/exomiserdb.py,sha256=pM9-TfjrgurtH4OtM1Enk5oVhIxGQN3rKRlrxHuObTM,5080
 pheval/post_processing/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pheval/post_processing/post_processing.py,sha256=tqeVRWF6PMHpOe681ONeGaqxdviLgVJgze3o6qSpXEg,13438
 pheval/prepare/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-pheval/prepare/create_noisy_phenopackets.py,sha256=UbBRWDD95BFHPv03VYx04v35AGwJ9ynLltYKqQJHbZ0,11236
+pheval/prepare/create_noisy_phenopackets.py,sha256=ydhA4mpqKTDc4hBu8YfvNW2nMubHK3dbO-cv0lA4JFQ,11504
 pheval/prepare/create_spiked_vcf.py,sha256=90A-Mi8QKhvN036vtFEVWAHgzHO37itiLYrqYlG4LiA,23953
 pheval/prepare/custom_exceptions.py,sha256=_G3_95dPtHIs1SviYBV1j7cYc-hxlhuw8hhnYdzByYY,1719
 pheval/prepare/prepare_corpus.py,sha256=eRvozzezIgAqHAumtqul0WfXfBO1iOBaSlN8fPSn0Nw,4223
@@ -50,8 +50,8 @@ pheval/utils/file_utils.py,sha256=m21cz-qjDYqnI8ClUv3J9fKizex98a-9bSEerQ75i_c,35
 pheval/utils/phenopacket_utils.py,sha256=W9T_X48EJ-xn5GghzbZlt-lI-DxWoSm7_SHr8DCJg2Q,26856
 pheval/utils/semsim_utils.py,sha256=s7ZCR2VfPYnOh7ApX6rv66eGoVSm9QJaVYOWBEhlXpo,6151
 pheval/utils/utils.py,sha256=9V6vCT8l1g4O2-ZATYqsVyd7AYZdWGd-Ksy7_oIC3eE,2343
-pheval-0.3.9.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-pheval-0.3.9.dist-info/METADATA,sha256=IdYBy71zIR4Jtcu9B_6ovotDUJQ6w6EMWVQF0zx2Alc,1810
-pheval-0.3.9.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-pheval-0.3.9.dist-info/entry_points.txt,sha256=o9gSwDkvT4-lqKy4mlsftd1nzP9WUOXQCfnbqycURd0,81
-pheval-0.3.9.dist-info/RECORD,,
+pheval-0.4.0.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+pheval-0.4.0.dist-info/METADATA,sha256=JXpNQPIx-5qBaP3ZDR96_hiasIdBHhaESiHUOJvT1s0,6418
+pheval-0.4.0.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+pheval-0.4.0.dist-info/entry_points.txt,sha256=o9gSwDkvT4-lqKy4mlsftd1nzP9WUOXQCfnbqycURd0,81
+pheval-0.4.0.dist-info/RECORD,,

pheval/analyse/parse_pheval_result.py DELETED Viewed

@@ -1,43 +0,0 @@
-import logging
-from pathlib import Path
-from typing import List
-import pandas as pd
-from pheval.post_processing.post_processing import PhEvalResult
-info_log = logging.getLogger("info")
-def read_standardised_result(standardised_result_path: Path) -> List[dict]:
-    """
-    Read the standardised result output and return a list of dictionaries.
-    Args:
-        standardised_result_path (Path): The path to the file containing the standardised result output.
-    Returns:
-        List[dict]: A list of dictionaries representing the content of the standardised result file.
-    """
-    if standardised_result_path.is_file():
-        return pd.read_csv(standardised_result_path, delimiter="\t").to_dict("records")
-    else:
-        info_log.info(f"Could not find {standardised_result_path}")
-        return pd.DataFrame().to_dict("records")
-def parse_pheval_result(
-    data_class_type: PhEvalResult, pheval_result: List[dict]
-) -> List[PhEvalResult]:
-    """
-    Parse PhEval result into specified dataclass type.
-    Args:
-        data_class_type (PhEvalResult): The data class type to parse the result into.
-        pheval_result (List[dict]): A list of dictionaries representing the PhEval result.
-    Returns:
-        List[PhEvalResult]: A list of instances of the specified data class type,
-        each instance representing a row in the PhEval result.
-    """
-    return [data_class_type(**row) for row in pheval_result]

pheval/analyse/prioritisation_rank_recorder.py DELETED Viewed

@@ -1,83 +0,0 @@
-from collections import defaultdict
-from dataclasses import dataclass
-from pathlib import Path
-from typing import Union
-from pheval.analyse.prioritisation_result_types import (
-    DiseasePrioritisationResult,
-    GenePrioritisationResult,
-    VariantPrioritisationResult,
-)
-@dataclass
-class PrioritisationRankRecorder:
-    """
-    Record ranks for different types of prioritisation results.
-    Attributes:
-        index (int): The index representing the run.
-        directory (Path): The result directory path.
-        prioritisation_result (Union[GenePrioritisationResult, VariantPrioritisationResult,
-            DiseasePrioritisationResult]): The prioritisation result object.
-        run_comparison (defaultdict): The comparison dictionary to record ranks.
-    """
-    index: int
-    directory: Path
-    prioritisation_result: Union[
-        GenePrioritisationResult, VariantPrioritisationResult, DiseasePrioritisationResult
-    ]
-    run_comparison: defaultdict
-    def _record_gene_rank(self) -> None:
-        """
-        Record gene prioritisation rank.
-        This method updates the 'Gene' key in the run comparison dictionary with the gene
-        information extracted from the correct prioritisation result.
-        """
-        self.run_comparison[self.index]["Gene"] = self.prioritisation_result.gene
-    def _record_variant_rank(self) -> None:
-        """
-        Record variant prioritisation rank.
-        This method updates the 'Variant' key in the run comparison dictionary with the variant
-        information extracted from the correct prioritisation result.
-        """
-        variant = self.prioritisation_result.variant
-        self.run_comparison[self.index]["Variant"] = "-".join(
-            [variant.chrom, str(variant.pos), variant.ref, variant.alt]
-        )
-    def _record_disease_rank(self) -> None:
-        """
-        Record disease prioritisation rank.
-        This method updates the 'Disease' key in the run comparison dictionary with the disease
-        information extracted from the correct prioritisation result.
-        """
-        self.run_comparison[self.index][
-            "Disease"
-        ] = self.prioritisation_result.disease.disease_identifier
-    def record_rank(self) -> None:
-        """
-        Record the prioritisation ranks for different runs.
-        It assigns the prioritisation rank and associated details such as phenopacket name
-        and prioritisation result type ('Gene', 'Variant', or 'Disease') to the run comparison
-        dictionary for each respective run, allowing comparison and analysis of the ranks of correct results
-        across different runs.
-        """
-        self.run_comparison[self.index][
-            "Phenopacket"
-        ] = self.prioritisation_result.phenopacket_path.name
-        if type(self.prioritisation_result) is GenePrioritisationResult:
-            self._record_gene_rank()
-        elif type(self.prioritisation_result) is VariantPrioritisationResult:
-            self._record_variant_rank()
-        elif type(self.prioritisation_result) is DiseasePrioritisationResult:
-            self._record_disease_rank()
-        self.run_comparison[self.index][self.directory] = self.prioritisation_result.rank

pheval/constants.py DELETED Viewed

@@ -1,8 +0,0 @@
-PHEVAL_RESULTS_DIRECTORY_SUFFIX = "_results"
-GENE_PLOT_FILE_PREFIX = "gene"
-GENE_PLOT_Y_LABEL = "Disease-causing genes (%)"
-VARIANT_PLOT_FILE_PREFIX = "variant"
-VARIANT_PLOT_Y_LABEL = "Disease-causing variants (%)"
-DISEASE_PLOT_FILE_PREFIX = "disease"
-DISEASE_PLOT_Y_LABEL = "Known diseases (%)"
-RANK_COMPARISON_FILE_SUFFIX = "_rank_comparison.tsv"

pheval-0.3.9.dist-info/METADATA DELETED Viewed

@@ -1,35 +0,0 @@
-Metadata-Version: 2.1
-Name: pheval
-Version: 0.3.9
-Summary:
-Author: Yasemin Bridges
-Author-email: y.bridges@qmul.ac.uk
-Requires-Python: >=3.9,<4.0.0
-Classifier: Programming Language :: Python :: 3
-Classifier: Programming Language :: Python :: 3.9
-Classifier: Programming Language :: Python :: 3.10
-Classifier: Programming Language :: Python :: 3.11
-Classifier: Programming Language :: Python :: 3.12
-Requires-Dist: class-resolver (>=0.4.2)
-Requires-Dist: click (>=8.1.3)
-Requires-Dist: deprecation (>=2.1.0)
-Requires-Dist: google (>=3.0.0,<4.0.0)
-Requires-Dist: jaydebeapi (>=1.2.3)
-Requires-Dist: matplotlib (>=3.7.0,<4.0.0)
-Requires-Dist: oaklib (>=0.5.6)
-Requires-Dist: pandas (>=1.5.1)
-Requires-Dist: phenopackets (>=2.0.2,<3.0.0)
-Requires-Dist: plotly (>=5.13.0,<6.0.0)
-Requires-Dist: polars (>=0.19.15,<0.20.0)
-Requires-Dist: pyaml (>=21.10.1,<22.0.0)
-Requires-Dist: pyserde (>=0.9.8,<0.10.0)
-Requires-Dist: scikit-learn (>=1.4.0,<2.0.0)
-Requires-Dist: seaborn (>=0.12.2,<0.13.0)
-Requires-Dist: tqdm (>=4.64.1)
-Description-Content-Type: text/markdown
-# PhEval - Phenotypic Inference Evaluation Framework
-There is currently no empirical framework to evaluate the performance of phenotype matching and prioritization tools, much needed to guide tuning for cross species inference. Many algorithms are evaluated using simulations, which may fail to capture real-world scenarios. This gap presents a number of problems: it is difficult to optimize algorithms if we do not know which choices lead to better results; performance may be sensitive to factors that are subject to change, such as ontology structure or annotation completeness. We will develop a modular Phenotypic Inference Evaluation Framework, PhEval and use it to optimize our own algorithms, as well as deliver it as a community resource.

{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/LICENSE RENAMED Viewed

File without changes

{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{pheval-0.3.9.dist-info → pheval-0.4.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

pheval 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl

Potentially problematic release.

pheval 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl