pytme 0.1.8__cp311-cp311-macosx_14_0_arm64.whl → 0.2.0__cp311-cp311-macosx_14_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42)
  1. pytme-0.2.0.data/scripts/match_template.py +1019 -0
  2. pytme-0.2.0.data/scripts/postprocess.py +570 -0
  3. {pytme-0.1.8.data → pytme-0.2.0.data}/scripts/preprocessor_gui.py +244 -60
  4. {pytme-0.1.8.dist-info → pytme-0.2.0.dist-info}/METADATA +3 -1
  5. pytme-0.2.0.dist-info/RECORD +72 -0
  6. {pytme-0.1.8.dist-info → pytme-0.2.0.dist-info}/WHEEL +1 -1
  7. scripts/extract_candidates.py +218 -0
  8. scripts/match_template.py +459 -218
  9. pytme-0.1.8.data/scripts/match_template.py → scripts/match_template_filters.py +459 -218
  10. scripts/postprocess.py +380 -435
  11. scripts/preprocessor_gui.py +244 -60
  12. scripts/refine_matches.py +218 -0
  13. tme/__init__.py +2 -1
  14. tme/__version__.py +1 -1
  15. tme/analyzer.py +533 -78
  16. tme/backends/cupy_backend.py +80 -15
  17. tme/backends/npfftw_backend.py +35 -6
  18. tme/backends/pytorch_backend.py +15 -7
  19. tme/density.py +173 -78
  20. tme/extensions.cpython-311-darwin.so +0 -0
  21. tme/matching_constrained.py +195 -0
  22. tme/matching_data.py +78 -32
  23. tme/matching_exhaustive.py +369 -221
  24. tme/matching_memory.py +1 -0
  25. tme/matching_optimization.py +753 -649
  26. tme/matching_utils.py +152 -8
  27. tme/orientations.py +561 -0
  28. tme/preprocessing/__init__.py +2 -0
  29. tme/preprocessing/_utils.py +176 -0
  30. tme/preprocessing/composable_filter.py +30 -0
  31. tme/preprocessing/compose.py +52 -0
  32. tme/preprocessing/frequency_filters.py +322 -0
  33. tme/preprocessing/tilt_series.py +967 -0
  34. tme/preprocessor.py +35 -25
  35. tme/structure.py +2 -37
  36. pytme-0.1.8.data/scripts/postprocess.py +0 -625
  37. pytme-0.1.8.dist-info/RECORD +0 -61
  38. {pytme-0.1.8.data → pytme-0.2.0.data}/scripts/estimate_ram_usage.py +0 -0
  39. {pytme-0.1.8.data → pytme-0.2.0.data}/scripts/preprocess.py +0 -0
  40. {pytme-0.1.8.dist-info → pytme-0.2.0.dist-info}/LICENSE +0 -0
  41. {pytme-0.1.8.dist-info → pytme-0.2.0.dist-info}/entry_points.txt +0 -0
  42. {pytme-0.1.8.dist-info → pytme-0.2.0.dist-info}/top_level.txt +0 -0
tme/orientations.py ADDED
@@ -0,0 +1,561 @@
+ #!python3
+ """ Handle template matching peaks and convert between formats.
+
+     Copyright (c) 2024 European Molecular Biology Laboratory
+
+     Author: Valentin Maurer <valentin.maurer@embl-hamburg.de>
+ """
+ import re
+ from collections import deque
+ from dataclasses import dataclass
+ from typing import List, Tuple, Dict
+
+ import numpy as np
+ from scipy.spatial.transform import Rotation
+
+
+ @dataclass
+ class Orientations:
+     """
+     Handle template matching peaks and convert between formats.
+     """
+
+     #: Return a numpy array with translations of each orientation (n x d).
+     translations: np.ndarray
+
+     #: Return a numpy array with euler angles of each orientation in zyx format (n x d).
+     rotations: np.ndarray
+
+     #: Return a numpy array with the score of each orientation (n, ).
+     scores: np.ndarray
+
+     #: Return a numpy array with additional orientation details (n, ).
+     details: np.ndarray
+
+     def __iter__(self) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]:
+         """
+         Iterate over the current class instance. Each iteration returns an orientation
+         defined by its translation, rotation, score and additional detail.
+
+         Yields
+         ------
+         Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]
+             A tuple of arrays defining the given orientation.
+         """
+         yield from zip(self.translations, self.rotations, self.scores, self.details)
+
+     def __getitem__(self, indices: List[int]) -> "Orientations":
+         """
+         Retrieve a subset of orientations based on the provided indices.
+
+         Parameters
+         ----------
+         indices : List[int]
+             A list of indices specifying the orientations to be retrieved.
+
+         Returns
+         -------
+         :py:class:`Orientations`
+             A new :py:class:`Orientations` instance containing only the selected orientations.
+         """
+         indices = np.asarray(indices)
+         attributes = (
+             "translations",
+             "rotations",
+             "scores",
+             "details",
+         )
+         kwargs = {attr: getattr(self, attr)[indices] for attr in attributes}
+         return self.__class__(**kwargs)
+
+     def to_file(self, filename: str, file_format: str = None, **kwargs) -> None:
+         """
+         Save the current class instance to a file in the specified format.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file where the orientations will be saved.
+         file_format : str, optional
+             The format in which to save the orientations. Supported formats are 'text', 'relion' and 'dynamo'.
+         **kwargs : dict
+             Additional keyword arguments specific to the file format.
+
+         Raises
+         ------
+         ValueError
+             If an unsupported file format is specified.
+         """
+         mapping = {
+             "text": self._to_text,
+             "relion": self._to_relion_star,
+             "dynamo": self._to_dynamo_tbl,
+         }
+         if file_format is None:
+             file_format = "text"
+             if filename.lower().endswith(".star"):
+                 file_format = "relion"
+             elif filename.lower().endswith(".tbl"):
+                 file_format = "dynamo"
+
+         func = mapping.get(file_format, None)
+         if func is None:
+             raise ValueError(
+                 f"{file_format} not implemented. Supported are {','.join(mapping.keys())}."
+             )
+
+         return func(filename=filename, **kwargs)
+
+     def _to_text(self, filename: str) -> None:
+         """
+         Save orientations in a text file format.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file to save the orientations.
+
+         Notes
+         -----
+         The file is saved with a header specifying each column: z, y, x, euler_z,
+         euler_y, euler_x, score, detail. Each row in the file corresponds to an orientation.
+         """
+         header = "\t".join(
+             ["z", "y", "x", "euler_z", "euler_y", "euler_x", "score", "detail"]
+         )
+         with open(filename, mode="w", encoding="utf-8") as ofile:
+             _ = ofile.write(f"{header}\n")
+             for translation, angles, score, detail in self:
+                 translation_string = "\t".join([str(x) for x in translation])
+                 angle_string = "\t".join([str(x) for x in angles])
+                 _ = ofile.write(
+                     f"{translation_string}\t{angle_string}\t{score}\t{detail}\n"
+                 )
+         return None
+
+     def _to_dynamo_tbl(
+         self,
+         filename: str,
+         name_prefix: str = None,
+         sampling_rate: float = 1.0,
+         subtomogram_size: int = 0,
+     ) -> None:
+         """
+         Save orientations in Dynamo's tbl file format.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file to save the orientations.
+         sampling_rate : float, optional
+             Subtomogram sampling rate in angstrom per voxel.
+
+         Notes
+         -----
+         The file is saved with the standard column layout of Dynamo tbl files
+         outlined in [1]_. Each row in the file corresponds to a particular particle.
+
+         References
+         ----------
+         .. [1] https://wiki.dynamo.biozentrum.unibas.ch/w/index.php/Table
+
+         Columns not derived from the orientation data are populated with
+         fixed default values.
+         """
+         with open(filename, mode="w", encoding="utf-8") as ofile:
+             for index, (translation, rotation, score, detail) in enumerate(self):
+                 rotation = Rotation.from_euler("zyx", rotation, degrees=True)
+                 rotation = rotation.as_euler(seq="xyx", degrees=True)
+                 out = [
+                     index,
+                     1,
+                     0,
+                     0,
+                     0,
+                     0,
+                     *rotation,
+                     self.scores[index],
+                     self.scores[index],
+                     0,
+                     0,
+                     # Wedge parameters
+                     -90,
+                     90,
+                     -60,
+                     60,
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     # Coordinate in original volume
+                     *translation[::-1],
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     0,
+                     sampling_rate,
+                     3,
+                     0,
+                     0,
+                 ]
+                 _ = ofile.write(" ".join([str(x) for x in out]) + "\n")
+
+         return None
+
+     def _to_relion_star(
+         self,
+         filename: str,
+         name_prefix: str = None,
+         ctf_image: str = None,
+         sampling_rate: float = 1.0,
+         subtomogram_size: int = 0,
+     ) -> None:
+         """
+         Save orientations in RELION's STAR file format.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file to save the orientations.
+         name_prefix : str, optional
+             A prefix to add to the image names in the STAR file.
+         ctf_image : str, optional
+             Path to a CTF or wedge mask for RELION.
+         sampling_rate : float, optional
+             Subtomogram sampling rate in angstrom per voxel.
+         subtomogram_size : int, optional
+             Size of the square shaped subtomogram.
+
+         Notes
+         -----
+         The file is saved with a standard header used in RELION STAR files.
+         Each row in the file corresponds to an orientation.
+         """
+         optics_header = [
+             "# version 30001",
+             "data_optics",
+             "",
+             "loop_",
+             "_rlnOpticsGroup",
+             "_rlnOpticsGroupName",
+             "_rlnSphericalAberration",
+             "_rlnVoltage",
+             "_rlnImageSize",
+             "_rlnImageDimensionality",
+             "_rlnImagePixelSize",
+         ]
+         optics_data = [
+             "1",
+             "opticsGroup1",
+             "2.700000",
+             "300.000000",
+             str(int(subtomogram_size)),
+             "3",
+             str(float(sampling_rate)),
+         ]
+         optics_header = "\n".join(optics_header)
+         optics_data = "\t".join(optics_data)
+
+         header = [
+             "data_particles",
+             "",
+             "loop_",
+             "_rlnCoordinateX",
+             "_rlnCoordinateY",
+             "_rlnCoordinateZ",
+             "_rlnImageName",
+             "_rlnAngleRot",
+             "_rlnAngleTilt",
+             "_rlnAnglePsi",
+             "_rlnOpticsGroup",
+         ]
+         if ctf_image is not None:
+             header.append("_rlnCtfImage")
+
+         ctf_image = "" if ctf_image is None else f"\t{ctf_image}"
+
+         header = "\n".join(header)
+         name_prefix = "" if name_prefix is None else name_prefix
+
+         with open(filename, mode="w", encoding="utf-8") as ofile:
+             _ = ofile.write(f"{optics_header}\n")
+             _ = ofile.write(f"{optics_data}\n")
+
+             _ = ofile.write("\n# version 30001\n")
+             _ = ofile.write(f"{header}\n")
+
+             # pyTME uses a zyx data layout
+             for index, (translation, rotation, score, detail) in enumerate(self):
+                 rotation = Rotation.from_euler("zyx", rotation, degrees=True)
+                 rotation = rotation.as_euler(seq="xyx", degrees=True)
+
+                 translation_string = "\t".join([str(x) for x in translation][::-1])
+                 angle_string = "\t".join([str(x) for x in rotation])
+                 name = f"{name_prefix}_{index}.mrc"
+                 _ = ofile.write(
+                     f"{translation_string}\t{name}\t{angle_string}\t1{ctf_image}\n"
+                 )
+
+         return None
+
+     @classmethod
+     def from_file(
+         cls, filename: str, file_format: str = None, **kwargs
+     ) -> "Orientations":
+         """
+         Create an instance of :py:class:`Orientations` from a file.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file from which to read the orientations.
+         file_format : str, optional
+             The format of the file. Supported formats are 'text' and 'relion'.
+         **kwargs : dict
+             Additional keyword arguments specific to the file format.
+
+         Returns
+         -------
+         :py:class:`Orientations`
+             An instance of :py:class:`Orientations` populated with data from the file.
+
+         Raises
+         ------
+         ValueError
+             If an unsupported file format is specified.
+         """
+         mapping = {"text": cls._from_text, "relion": cls._from_relion_star}
+         if file_format is None:
+             file_format = "text"
+             if filename.lower().endswith(".star"):
+                 file_format = "relion"
+
+         func = mapping.get(file_format, None)
+         if func is None:
+             raise ValueError(
+                 f"{file_format} not implemented. Supported are {','.join(mapping.keys())}."
+             )
+
+         translations, rotations, scores, details, *_ = func(filename=filename, **kwargs)
+         return cls(
+             translations=translations,
+             rotations=rotations,
+             scores=scores,
+             details=details,
+         )
+
+     @staticmethod
+     def _from_text(
+         filename: str,
+     ) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]:
+         """
+         Read orientations from a text file.
+
+         Parameters
+         ----------
+         filename : str
+             The name of the file from which to read the orientations.
+
+         Returns
+         -------
+         Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]
+             A tuple containing numpy arrays for translations, rotations, scores,
+             and details.
+
+         Notes
+         -----
+         The text file is expected to have a header and data in columns corresponding to
+         z, y, x, euler_z, euler_y, euler_x, score, detail.
+         """
+         with open(filename, mode="r", encoding="utf-8") as infile:
+             data = [x.strip().split("\t") for x in infile.read().split("\n")]
+             _ = data.pop(0)
+
+         translation, rotation, score, detail = [], [], [], []
+         for candidate in data:
+             if len(candidate) <= 1:
+                 continue
+             if len(candidate) != 8:
+                 candidate.append(-1)
+
+             candidate = [float(x) for x in candidate]
+             translation.append((candidate[0], candidate[1], candidate[2]))
+             rotation.append((candidate[3], candidate[4], candidate[5]))
+             score.append(candidate[6])
+             detail.append(candidate[7])
+
+         translation = np.vstack(translation).astype(int)
+         rotation = np.vstack(rotation).astype(float)
+         score = np.array(score).astype(float)
+         detail = np.array(detail).astype(float)
+
+         return translation, rotation, score, detail
+
+     @staticmethod
+     def _parse_star(filename: str, delimiter: str = None) -> Dict:
+         pattern = re.compile(r"\s*#.*")
+         with open(filename, mode="r", encoding="utf-8") as infile:
+             data = infile.read()
+
+         data = deque(filter(lambda line: line and line[0] != "#", data.split("\n")))
+
+         ret, category, block = {}, None, []
+         while data:
+             line = data.popleft()
+
+             if line.startswith("data") and not line.startswith("_"):
+                 if category != line and category is not None:
+                     headers = list(ret[category].keys())
+                     headers = [pattern.sub("", x) for x in headers]
+                     ret[category] = {
+                         header: list(column)
+                         for header, column in zip(headers, zip(*block))
+                     }
+                     block.clear()
+                 category = line
+                 if category not in ret:
+                     ret[category] = {}
+                 continue
+
+             if line.startswith("_"):
+                 ret[category][line] = []
+                 continue
+
+             if line.startswith("loop"):
+                 continue
+
+             line_split = line.split(delimiter)
+             if len(line_split):
+                 block.append(line_split)
+
+         headers = list(ret[category].keys())
+         headers = [pattern.sub("", x) for x in headers]
+         ret[category] = {
+             header: list(column) for header, column in zip(headers, zip(*block))
+         }
+         return ret
+
+     @classmethod
+     def _from_relion_star(
+         cls, filename: str, delimiter: str = None
+     ) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]:
+         ret = cls._parse_star(filename=filename, delimiter=delimiter)
+         ret = ret["data_particles"]
+
+         translation = (
+             np.vstack(
+                 (ret["_rlnCoordinateZ"], ret["_rlnCoordinateY"], ret["_rlnCoordinateX"])
+             )
+             .astype(np.float32)
+             .astype(int)
+             .T
+         )
+
+         rotation = (
+             np.vstack((ret["_rlnAngleRot"], ret["_rlnAngleTilt"], ret["_rlnAnglePsi"]))
+             .astype(np.float32)
+             .T
+         )
+
+         rotation = Rotation.from_euler("xyx", rotation, degrees=True)
+         rotation = rotation.as_euler(seq="zyx", degrees=True)
+         score = np.ones(translation.shape[0])
+         detail = np.ones(translation.shape[0]) * 1
+
+         return translation, rotation, score, detail
+
+     def get_extraction_slices(
+         self,
+         target_shape: Tuple[int],
+         extraction_shape: Tuple[int],
+         drop_out_of_box: bool = False,
+         return_orientations: bool = False,
+     ) -> Tuple:
+         """
+         Calculate slices for extracting regions of interest within a larger array.
+
+         Parameters
+         ----------
+         target_shape : Tuple[int]
+             The shape of the target array within which regions are to be extracted.
+         extraction_shape : Tuple[int]
+             The shape of the regions to be extracted.
+         drop_out_of_box : bool, optional
+             If True, drop regions that extend beyond the target array boundary, by default False.
+         return_orientations : bool, optional
+             If True, return orientations along with slices, by default False.
+
+         Returns
+         -------
+         Union[Tuple[List[slice]], Tuple["Orientations", List[slice], List[slice]]]
+             If return_orientations is False, returns a tuple containing slices for candidate
+             regions and observation regions.
+             If return_orientations is True, returns a tuple containing orientations along
+             with slices for candidate regions and observation regions.
+
+         Raises
+         ------
+         SystemExit
+             If drop_out_of_box is True and no peak remains after filtering.
+         """
+         left_pad = np.divide(extraction_shape, 2).astype(int)
+         right_pad = np.add(left_pad, np.mod(extraction_shape, 2)).astype(int)
+
+         obs_start = np.subtract(self.translations, left_pad)
+         obs_stop = np.add(self.translations, right_pad)
+
+         cand_start = np.subtract(np.maximum(obs_start, 0), obs_start)
+         cand_stop = np.subtract(obs_stop, np.minimum(obs_stop, target_shape))
+         cand_stop = np.subtract(extraction_shape, cand_stop)
+         obs_start = np.maximum(obs_start, 0)
+         obs_stop = np.minimum(obs_stop, target_shape)
+
+         subset = self
+         if drop_out_of_box:
+             stops = np.subtract(cand_stop, extraction_shape)
+             keep_peaks = (
+                 np.sum(
+                     np.multiply(cand_start == 0, stops == 0),
+                     axis=1,
+                 )
+                 == self.translations.shape[1]
+             )
+             n_remaining = keep_peaks.sum()
+             if n_remaining == 0:
+                 print(
+                     "No peak remaining after filtering. Started with"
+                     f" {self.translations.shape[0]} filtered to {n_remaining}."
+                     " Consider reducing min_distance, increasing num_peaks or using"
+                     " a different peak caller."
+                 )
+                 exit(-1)
+
+             cand_start = cand_start[keep_peaks,]
+             cand_stop = cand_stop[keep_peaks,]
+             obs_start = obs_start[keep_peaks,]
+             obs_stop = obs_stop[keep_peaks,]
+             subset = self[keep_peaks]
+
+         cand_start, cand_stop = cand_start.astype(int), cand_stop.astype(int)
+         obs_start, obs_stop = obs_start.astype(int), obs_stop.astype(int)
+
+         candidate_slices = [
+             tuple(slice(s, e) for s, e in zip(start_row, stop_row))
+             for start_row, stop_row in zip(cand_start, cand_stop)
+         ]
+
+         observation_slices = [
+             tuple(slice(s, e) for s, e in zip(start_row, stop_row))
+             for start_row, stop_row in zip(obs_start, obs_stop)
+         ]
+
+         if return_orientations:
+             return subset, candidate_slices, observation_slices
+
+         return candidate_slices, observation_slices
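
For reviewers unfamiliar with the new module, the following is a minimal usage sketch of the Orientations class added above. It is not part of the diff; the file names and peak values are made up for illustration, and it simply exercises the suffix-based format dispatch visible in to_file and from_file.

    import numpy as np
    from tme.orientations import Orientations

    # Made-up peaks: translations in zyx order, zyx euler angles, scores, details.
    orientations = Orientations(
        translations=np.array([[40, 80, 96], [50, 100, 120], [64, 128, 128]]),
        rotations=np.zeros((3, 3)),
        scores=np.array([0.7, 0.6, 0.5]),
        details=np.full(3, -1.0),
    )

    orientations.to_file("peaks.tsv")    # no recognized suffix, defaults to the 'text' writer
    orientations.to_file("peaks.star")   # '.star' suffix dispatches to the RELION writer
    orientations.to_file("peaks.tbl")    # '.tbl' suffix dispatches to the Dynamo writer

    reread = Orientations.from_file("peaks.star")  # RELION reader; scores default to 1
    best_two = reread[[0, 1]]                      # __getitem__ returns a new Orientations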
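
Similarly, the candidate and observation slices returned by get_extraction_slices are paired so that regions clipped at the volume boundary still line up with a fixed-size output box. A sketch under the same caveats (the tomogram array, file name and box size are placeholders):

    import numpy as np
    from tme.orientations import Orientations

    tomogram = np.random.rand(128, 256, 256)             # placeholder target volume
    orientations = Orientations.from_file("peaks.tsv")   # text file from the sketch above

    subset, cand_slices, obs_slices = orientations.get_extraction_slices(
        target_shape=tomogram.shape,
        extraction_shape=(32, 32, 32),
        drop_out_of_box=True,          # discard peaks whose box would leave the volume
        return_orientations=True,      # also return the surviving Orientations subset
    )

    boxes = np.zeros((len(obs_slices), 32, 32, 32))
    for i, (cand, obs) in enumerate(zip(cand_slices, obs_slices)):
        # obs indexes the tomogram, cand the corresponding region of the output box
        boxes[i][cand] = tomogram[obs]
    # subset contains the orientations that survived filtering, aligned row-for-row with boxes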
tme/preprocessing/__init__.py ADDED
@@ -0,0 +1,2 @@
+ from .compose import Compose
+ from .frequency_filters import BandPassFilter, LinearWhiteningFilter