PyPI - rectanglepy - Versions diffs - 0.5.1__tar.gz → 0.5.3__tar.gz - Mend

rectanglepy 0.5.1tar.gz → 0.5.3tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54) hide show

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/.bumpversion.cfg RENAMED Viewed

@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.5.1
+current_version = 0.5.3
 tag = True
 commit = True

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/.github/workflows/build.yaml RENAMED Viewed

@@ -23,6 +23,10 @@ jobs:
                 include:
                     - os: ubuntu-latest
                       python: "3.10"
+                    - os: ubuntu-latest
+                      python: "3.11"
+                    - os: ubuntu-latest
+                      python: "3.12"
         env:
             OS: ${{ matrix.os }}
             PYTHON: ${{ matrix.python }}
@@ -55,10 +59,10 @@ jobs:
         needs: test
         steps:
             - uses: actions/checkout@v2
-            - name: Set up Python 3.10
+            - name: Set up Python 3.12
               uses: actions/setup-python@v2
               with:
-                  python-version: "3.10"
+                  python-version: "3.12"
             - name: Install twine
               run: pip install twine
             - name: Install build dependencies

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/.github/workflows/release.yaml RENAMED Viewed

@@ -18,6 +18,10 @@ jobs:
                 include:
                     - os: ubuntu-latest
                       python: "3.10"
+                    - os: ubuntu-latest
+                      python: "3.11"
+                    - os: ubuntu-latest
+                      python: "3.12"
         env:
             OS: ${{ matrix.os }}
             PYTHON: ${{ matrix.python }}
@@ -49,10 +53,10 @@ jobs:
         needs: test
         steps:
             - uses: actions/checkout@v2
-            - name: Set up Python 3.10
+            - name: Set up Python 3.12
               uses: actions/setup-python@v2
               with:
-                  python-version: "3.10"
+                  python-version: "3.12"
             - name: Install build dependencies
               run: python -m pip install --upgrade pip wheel twine build
             - name: Build package
@@ -68,10 +72,10 @@ jobs:
             - name: Checkout code
               uses: actions/checkout@v3
-            - name: Set up Python 3.10
+            - name: Set up Python 3.12
               uses: actions/setup-python@v4
               with:
-                  python-version: "3.10"
+                  python-version: "3.12"
             - name: Install hatch
               run: pip install hatch

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/.github/workflows/test.yaml RENAMED Viewed

@@ -22,6 +22,10 @@ jobs:
                 include:
                     - os: ubuntu-latest
                       python: "3.10"
+                    - os: ubuntu-latest
+                      python: "3.11"
+                    - os: ubuntu-latest
+                      python: "3.12"
         env:
             OS: ${{ matrix.os }}
             PYTHON: ${{ matrix.python }}

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: rectanglepy
-Version: 0.5.1
+Version: 0.5.3
 Summary: Hierarchical deconvolution of bulk  transcriptomics
 Project-URL: Documentation, https://rectanglepy.readthedocs.io/
 Project-URL: Source, https://github.com/ComputationalBiomedicineGroup/Rectangle
@@ -36,6 +36,7 @@ Requires-Dist: numpy<2.0.0,>=1.0.0
 Requires-Dist: pydeseq2==0.4.11
 Requires-Dist: quadprog==0.1.12
 Requires-Dist: scipy==1.13.0
+Requires-Dist: setuptools<70.0.0,>=69.0.0
 Requires-Dist: statsmodels>=0.14.1
 Provides-Extra: dev
 Requires-Dist: bump2version; extra == 'dev'

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ requires = ["hatchling"]
 [project]
 name = "rectanglepy"
-version = "0.5.1"
+version = "0.5.3"
 description = "Hierarchical deconvolution of bulk  transcriptomics"
 readme = "README.md"
 requires-python = ">=3.10"
@@ -25,7 +25,8 @@ dependencies = [
     "loguru",
     "numpy>=1.0.0,<2.0.0",
     "anndata>=0.8.0,<0.10.9",
-    "statsmodels>=0.14.1"
+    "statsmodels>=0.14.1",
+    "setuptools>=69.0.0,<70.0.0",
 ]

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/src/rectanglepy/pp/rectangle_signature.py RENAMED Viewed

@@ -24,6 +24,8 @@ class RectangleSignatureResult:
         The result of the p lfc cut off optimization, as a pd.DataFrame. Contains the following columns: p, lfc, pearson_r, rsme
     unkn_gene_corr
         The correlation between the unknown cell type and the genes linked to the unknown cell type.
+    unkn_bulk_err
+        The result of 'bulk - bulk_est' for the reconstructed bulk used to calculate the unknown cell type content.
     """
     def __init__(
@@ -39,6 +41,7 @@ class RectangleSignatureResult:
         clustered_signature_genes: pd.Series = None,
         cluster_assignments: list[int or str] = None,
         unkn_gene_corr: pd.Series = None,
+        unkn_bulk_err: pd.DataFrame = None,
     ):
         self.signature_genes = signature_genes
         self.bias_factors = bias_factors
@@ -51,6 +54,7 @@ class RectangleSignatureResult:
         self.clustered_signature_genes = clustered_signature_genes
         self.assignments = cluster_assignments
         self.unkn_gene_corr = unkn_gene_corr
+        self.unkn_bulk_err = unkn_bulk_err
     def get_signature_matrix(self, include_mrna_bias=True) -> pd.DataFrame:
         """Calculates the signature matrix by multiplying the pseudobulk_sig_cpm DataFrame subset by signature_genes and the bias_factors Series.

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/src/rectanglepy/rectangle.py RENAMED Viewed

@@ -70,7 +70,7 @@ def rectangle(
         gene_expression_threshold=gene_expression_threshold,
     )
-    estimations = deconvolution(signatures, bulks, correct_mrna_bias, n_cpus)
+    estimations, bulk_err = deconvolution(signatures, bulks, correct_mrna_bias, n_cpus)
     if "Unknown" in estimations.columns:
         try:
@@ -81,6 +81,7 @@ def rectangle(
     else:
         unkn_gene_corr = None
     signatures.unkn_gene_corr = unkn_gene_corr
+    signatures.unkn_bulk_err = bulk_err
     return estimations, signatures

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/src/rectanglepy/tl/deconvolution.py RENAMED Viewed

@@ -177,7 +177,13 @@ def deconvolution(
     Returns
     -------
-        A DataFrame containing the estimated cell fractions resulting from deconvolution. Each row represents a sample and each column represents a cell type.
+    estimation_df : pd.DataFrame
+        A DataFrame containing the estimated cell fractions. Each row represents
+        a sample, each column represents a cell type (including 'Unknown' if applicable).
+    bulk_err_df : pd.DataFrame
+        A DataFrame containing the gene-level difference between the true bulk
+        expression and the reconstructed bulk expression (i.e., `bulk - bulk_est`)
+        for each sample.
     """
     bulks = bulks.div(bulks.sum(axis=1), axis=0) * 1e6
@@ -194,28 +200,31 @@ def deconvolution(
             delayed(_process_bulk)(signatures, i, bulk, bulks.columns, correct_mrna_bias)
             for i, bulk in enumerate(bulks.values)
         )
+    estimations = [result[0] for result in results]
+    bulk_err = [result[1] for result in results]
+    estimation_df = pd.DataFrame(estimations, index=bulks.index)
+    bulk_err_df = pd.DataFrame(bulk_err, index=bulks.index)
-    result_df = pd.DataFrame(results, index=bulks.index)
-    # Return the result DataFrame
-    return result_df
+    return estimation_df, bulk_err_df
 def _process_bulk(
     signatures: RectangleSignatureResult, i: int, bulk: pd.Series, var_names: pd.Index, correct_mrna_bias: bool
-) -> pd.Series:
+) -> tuple[pd.Series, pd.Series]:
     try:
         logger.info(f"Deconvolute fractions for bulk: {i}")
         bulk = pd.Series(bulk, index=var_names)
-        result = _deconvolute(signatures, bulk, correct_mrna_bias=correct_mrna_bias)
+        estimations, bulk_err = _deconvolute(signatures, bulk, correct_mrna_bias=correct_mrna_bias)
         logger.info(f"Finished deconvolution for bulk: {i}")
-        return result
+        return estimations, bulk_err
     except Exception as e:
         logger.warning(f"Deconvolution failed for bulk: {i} with error: {e}")
-        return pd.Series(index=signatures.pseudobulk_sig_cpm.columns)
+        return pd.Series(index=signatures.pseudobulk_sig_cpm.columns), pd.Series(index=bulk.index)
-def _deconvolute(signatures: RectangleSignatureResult, bulk: pd.Series, correct_mrna_bias: bool = True) -> pd.Series:
+def _deconvolute(
+    signatures: RectangleSignatureResult, bulk: pd.Series, correct_mrna_bias: bool = True
+) -> tuple[pd.Series, pd.Series]:
     bulk_direct_reduced = bulk[bulk.index.isin(signatures.signature_genes)]
     signature_genes_direct_reduced = signatures.signature_genes[
         signatures.signature_genes.isin(bulk_direct_reduced.index)
@@ -231,8 +240,10 @@ def _deconvolute(signatures: RectangleSignatureResult, bulk: pd.Series, correct_
     start_fractions = _calculate_dwls(signature, bulk)
     if clustered_pseudobulk_sig_cpm is None:
-        start_fractions = correct_for_unknown_cell_content(bulk, pseudobulk_sig_cpm, start_fractions, bias_factors)
-        return start_fractions
+        start_fractions, bulk_err = correct_for_unknown_cell_content(
+            bulk, pseudobulk_sig_cpm, start_fractions, bias_factors
+        )
+        return start_fractions, bulk_err
     cluster_bias_factors = signatures.clustered_bias_factors
     if not correct_mrna_bias:
@@ -249,8 +260,10 @@ def _deconvolute(signatures: RectangleSignatureResult, bulk: pd.Series, correct_
         recursive_fractions = _calculate_dwls(signature, bulk, signatures.assignments, clustered_fractions)
     except Exception as e:
         logger.warning(f"Recursive deconvolution failed with error: {e}")
-        start_fractions = correct_for_unknown_cell_content(bulk, pseudobulk_sig_cpm, start_fractions, bias_factors)
-        return start_fractions
+        start_fractions, bulk_err = correct_for_unknown_cell_content(
+            bulk, pseudobulk_sig_cpm, start_fractions, bias_factors
+        )
+        return start_fractions, bulk_err
     final_fractions = []
@@ -269,13 +282,15 @@ def _deconvolute(signatures: RectangleSignatureResult, bulk: pd.Series, correct_
     final_fractions = pd.Series(final_fractions, index=start_fractions.index)
-    final_fractions = correct_for_unknown_cell_content(bulk, pseudobulk_sig_cpm, final_fractions, bias_factors)
-    return final_fractions
+    final_fractions, bulk_err = correct_for_unknown_cell_content(
+        bulk, pseudobulk_sig_cpm, final_fractions, bias_factors
+    )
+    return final_fractions, bulk_err
 def correct_for_unknown_cell_content(
     bulk: pd.Series, pseudo_signature_cpm: pd.DataFrame, estimates: pd.Series, bias_factors: pd.Series
-) -> pd.Series:
+) -> tuple[pd.Series, pd.Series]:
     r"""Performs correction for unknown cell content using the pseudo signature and bulk data.
     Reconstructs the bulk expression profiles through the estimated cell fractions (weighted by the mRNA bias factors) and cell-type-specific expression profiles (i.e. signature).
@@ -306,13 +321,17 @@ def correct_for_unknown_cell_content(
     Returns
     -------
-    pd.Series: The corrected cell fractions, indexed by cell type. Adds an "Unknown" cell type.
+    estimates_fix
+         The corrected cell fractions, indexed by cell type. Includes an "Unknown" cell type for the unknown cellular content.
+    bulk_err
+         The difference (per gene) between the actual bulk expression and the reconstructed bulk expression (i.e., `bulk - bulk_est`).
     """
     if estimates.sum() == 0:
         estimates_fix = estimates
         # analysis fails if all cell fractions are zero, so we set the unknown cell content to 0
         estimates_fix["Unknown"] = 0
-        return estimates_fix
+        return estimates_fix, pd.Series(index=bulk.index)
     signature_genes = pseudo_signature_cpm.index
     bulk = bulk.loc[signature_genes]
@@ -325,6 +344,8 @@ def correct_for_unknown_cell_content(
     bulk_est = pd.Series(np.dot(signature, (estimates.T * bias_factors).T))
     bulk_est.index = signature.index
+    bulk_err = bulk - bulk_est
     # Calculate the unknown cellular content as the difference of
     # per-sample overall expression levels in the true vs. reconstructed
     # bulk RNA-seq data, divided by the overall expression in the true bulk
@@ -335,4 +356,4 @@ def correct_for_unknown_cell_content(
     estimates_fix = estimates / estimates.sum() * (1 - ukn_cc)
     estimates_fix["Unknown"] = abs(ukn_cc)
-    return estimates_fix
+    return estimates_fix, bulk_err

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/tests/test_rectangle.py RENAMED Viewed

@@ -23,3 +23,4 @@ def test_rectangle():
     assert isinstance(estimations, pd.DataFrame)
     assert isinstance(signatures, RectangleSignatureResult)
     assert isinstance(signatures.unkn_gene_corr, pd.Series)
+    assert isinstance(signatures.unkn_bulk_err, pd.DataFrame)

{rectanglepy-0.5.1 → rectanglepy-0.5.3}/tests/test_tl.py RENAMED Viewed

@@ -77,8 +77,9 @@ def test_correct_for_unknown_cell_content(small_data, quantiseq_data):
     fractions = _calculate_dwls(sig, bulk)
     biasfact = (pseudo_signature > 0).sum(axis=0)
     biasfact = biasfact / biasfact.min()
-    result = correct_for_unknown_cell_content(bulk, pseudo_signature, fractions, biasfact)
+    result, bulk_err = correct_for_unknown_cell_content(bulk, pseudo_signature, fractions, biasfact)
     assert len(fractions) + 1 == len(result)
+    assert len(bulk_err) > 0
 def test_solve_dampened_wsl(quantiseq_data):
@@ -106,9 +107,10 @@ def test_deconvolute_no_hierarchy(small_data, quantiseq_data):
     signature = build_rectangle_signatures(adata, "cell_type", p=0.9, lfc=0.1, optimize_cutoffs=False)
     bulk, _, _ = quantiseq_data
-    estimations = deconvolution(signature, bulk.T)
+    estimations, bulk_err = deconvolution(signature, bulk.T)
     assert np.allclose(estimations.sum(axis=1), 1)
     assert estimations.shape == (8, 4)
+    assert len(bulk_err) == 8
 def test_deconvolute_sparse_no_hierarchy(small_data, quantiseq_data):
@@ -118,7 +120,7 @@ def test_deconvolute_sparse_no_hierarchy(small_data, quantiseq_data):
     signature = build_rectangle_signatures(adata, "cell_type", p=0.9, lfc=0.1, optimize_cutoffs=False)
     bulk, _, _ = quantiseq_data
-    expected = deconvolution(signature, bulk.T)
+    expected, bulk_err_exp = deconvolution(signature, bulk.T)
     sc_counts = sc_counts.astype(pd.SparseDtype("int"))
     csr_sparse_matrix = sc_counts.sparse.to_coo().tocsr()
@@ -127,5 +129,6 @@ def test_deconvolute_sparse_no_hierarchy(small_data, quantiseq_data):
     )
     signature_sparse = build_rectangle_signatures(adata_sparse, "cell_type", p=0.9, lfc=0.1, optimize_cutoffs=False)
-    estimations = deconvolution(signature_sparse, bulk.T)
+    estimations, bulk_err = deconvolution(signature_sparse, bulk.T)
     assert expected.equals(estimations)
+    assert bulk_err_exp.equals(bulk_err)