PyPI - sdss-almanac - Versions diffs - 0.2.1__py3-none-any.whl - Mend

sdss-almanac 0.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

almanac/__init__.py +4 -0
almanac/apogee.py +300 -0
almanac/cli.py +556 -0
almanac/config.py +110 -0
almanac/data_models/__init__.py +3 -0
almanac/data_models/exposure.py +350 -0
almanac/data_models/fps.py +109 -0
almanac/data_models/plate.py +142 -0
almanac/data_models/types.py +87 -0
almanac/data_models/utils.py +185 -0
almanac/database.py +22 -0
almanac/display.py +422 -0
almanac/etc/__init__.py +0 -0
almanac/etc/bad_exposures.csv +432 -0
almanac/io.py +320 -0
almanac/logger.py +27 -0
almanac/qa.py +24 -0
almanac/stash/data_models.py +0 -0
almanac/stash/plugmap_models.py +165 -0
almanac/utils.py +141 -0
sdss_almanac-0.2.1.dist-info/METADATA +201 -0
sdss_almanac-0.2.1.dist-info/RECORD +26 -0
sdss_almanac-0.2.1.dist-info/WHEEL +5 -0
sdss_almanac-0.2.1.dist-info/entry_points.txt +2 -0
sdss_almanac-0.2.1.dist-info/licenses/LICENSE.md +29 -0
sdss_almanac-0.2.1.dist-info/top_level.txt +1 -0

almanac/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+# Package version string.
+__version__ = "0.2.1"
+# Expose the configuration helpers and the logger as package-level names,
+# so that other modules can write e.g. `from almanac import config, logger`.
+from .config import config, get_config_path, ConfigManager
+from .logger import logger

almanac/apogee.py ADDED Viewed

@@ -0,0 +1,300 @@
+import os
+import numpy as np
+from glob import glob
+from subprocess import check_output
+from astropy.table import Table, hstack, unique
+from itertools import groupby
+from typing import Optional, Tuple, Dict, List, Set, Generator, Any, Union
+from scipy.spatial.distance import cdist
+from almanac import config, logger, utils
+from almanac.data_models import Exposure
+from almanac.data_models.types import ImageType
+from almanac.data_models.utils import mjd_to_exposure_prefix, get_exposure_path
+def get_unique_exposure_paths(paths: List[str]) -> List[str]:
+    """
+    Process a list of file paths to find unique exposures and determine which chips are available.
+    :param paths:
+        List of file paths to APOGEE exposure files.
+    :returns:
+        List of exposure paths.
+    """
+    chip_mapping = {}
+    for path in paths:
+        _, observatory, mjd, basename = path.rsplit("/", 3)
+        prefix, chip, exposure_apz = basename.split("-")
+        key = (observatory, mjd, exposure_apz)
+        chip_mapping.setdefault(key, [prefix, [False, False, False]])
+        index = "abc".index(chip)
+        chip_mapping[key][1][index] = True
+    unique_exposure_paths = []
+    for (observatory, mjd, exposure_apz), (prefix, chips) in chip_mapping.items():
+        chip = "abc"[chips.index(True)]
+        path = f"{config.apogee_dir}/{observatory}/{mjd}/{prefix}-{chip}-{exposure_apz}"
+        unique_exposure_paths.append(path)
+    return unique_exposure_paths
+def get_exposures(observatory: str, mjd: int) -> Generator[Exposure, None, None]:
+    """
+    Generate exposures taken from a given observatory on a given MJD.
+    :param observatory:
+        The observatory name (e.g. "apo").
+    :param mjd:
+        The Modified Julian Date.
+    :yields:
+        Exposure instances for each unique exposure found on disk.
+    """
+    paths = glob(get_exposure_path(observatory, mjd, "a?R", "*", "*"))
+    return organize_exposures(map(Exposure.from_path, get_unique_exposure_paths(paths)))
+def get_expected_number_of_exposures(observatory: str, mjd: int) -> int:
+    """
+    Query the SDSS database to get the expected exposures for a given observatory and MJD.
+    This is useful for identifying missing exposures.
+    """
+    if mjd < int(getattr(config.sdssdb_exposure_min_mjd, observatory)):
+        return -1
+    from almanac.database import opsdb
+    from peewee import fn
+    for model in (opsdb.Exposure, opsdb.ExposureFlavor):
+        model._meta.schema = f"opsdb_{observatory}"
+    start, end = map(mjd_to_exposure_prefix, (mjd, mjd + 1))
+    q = (
+        opsdb.Exposure.select(
+            fn.max(opsdb.Exposure.exposure_no)
+        )
+        .where(
+            (opsdb.Exposure.exposure_no > start)
+        &   (opsdb.Exposure.exposure_no < end)
+        )
+        .join(
+            opsdb.ExposureFlavor,
+            on=(opsdb.ExposureFlavor.pk == opsdb.Exposure.exposure_flavor),
+        )
+    )
+    try:
+        return q.scalar() - start
+    except:
+        return -1
+def organize_exposures(exposures: List[Exposure]) -> List[Exposure]:
+    """
+    Identify any missing exposures (based on non-contiguous exposure numbers)
+    and fill them with missing image types.
+    :param exposures:
+        A list of `Exposure` instances.
+    :returns:
+        A list of organized `Exposure` instances.
+    """
+    exposures = sorted(exposures, key=lambda x: x.exposure)
+    if len(exposures) == 0:
+        return []
+    observatory, mjd = (exposures[0].observatory, exposures[0].mjd)
+    n_expected = get_expected_number_of_exposures(observatory, mjd)
+    max_exposure = max(exposures[-1].exposure, n_expected)
+    organized = []
+    for i in range(1, max_exposure + 1):
+        if exposures and exposures[0].exposure == i:
+            organized.append(exposures.pop(0))
+        else:
+            organized.append(
+                Exposure(
+                    observatory=observatory,
+                    exposure=i,
+                    mjd=mjd,
+                    image_type="missing"
+                )
+            )
+    return organized
+def get_sequences(exposures: List[Exposure], image_type: ImageType, fields: Tuple[str, ...]) -> List[Tuple[int, int]]:
+    """
+    Get exposure number ranges for sequences of a specific image type.
+    :param exposures:
+        Astropy Table containing exposure metadata.
+    :param image_type:
+        The image type to search for (e.g., "Object", "ArcLamp").
+    :param fields:
+        Tuple of column names to group exposures by.
+    :param require_contiguous:
+        Whether to require exposure numbers to be contiguous within groups.
+    :returns:
+        List of tuples containing (start_exposure, end_exposure) for each sequence.
+    """
+    s = list(filter(lambda x: x.image_type == image_type, exposures))
+    sequence_exposure_numbers = []
+    for v, group in groupby(s, key=lambda x: tuple(getattr(x, f) for f in fields)):
+        for si, ei in utils.group_contiguous([e.exposure for e in group]):
+            sequence_exposure_numbers.append((si, ei))
+    return sequence_exposure_numbers
+def get_arclamp_sequences(exposures: List[Exposure]) -> List[Tuple[int, int]]:
+    """
+    Return a list of tuples indicating the start and end exposure numbers for
+    a sequence of arc lamp exposures.
+    :param exposures:
+        A list of `Exposure` instances.
+    :returns:
+        List of tuples containing (start_exposure, end_exposure) for each arc lamp sequence.
+    """
+    return get_sequences(exposures, "arclamp", ("dithered_pixels", ))
+def get_science_sequences(exposures: List[Exposure]) -> List[Tuple[int, int]]:
+    """
+    Return a list of tuples indicating the start and end exposure numbers for
+    a sequence of science exposures.
+    :param exposures:
+        A list of `Exposure` instances.
+    :returns:
+        List of tuples containing (start_exposure, end_exposure) for each science sequence.
+    """
+    return get_sequences(exposures, "object", ("field_id", "plate_id", "config_id", "image_type"))
+def get_almanac_data(observatory: str, mjd: int, fibers: bool = False, meta: bool = False):
+    """
+    Return comprehensive almanac data for all exposures taken from a given observatory on a given MJD.
+    :param observatory:
+        The observatory name (e.g. "apo").
+    :param mjd:
+        The Modified Julian Date.
+    :param fibers:
+        Whether to include fiber mapping information.
+    :param xmatch:
+        Whether to perform cross-matching with catalog database.
+    :param kwargs:
+        Additional keyword arguments passed to other functions.
+    :returns:
+        Tuple containing:
+        - observatory name
+        - MJD
+        - A list of exposures
+        - Table of exposure data
+        - dictionary of sequence indices
+        - dictionary of fiber mappings
+    """
+    exposures = get_exposures(observatory, mjd)
+    sequences = {
+        "objects": get_science_sequences(exposures),
+        "arclamps": get_arclamp_sequences(exposures),
+    }
+    if fibers:
+        catalogids, twomass_designations = (set(), set())
+        # We only need to get targets for one exposure in each science sequence.
+        for si, ei in sequences["objects"]:
+            exposure = exposures[si - 1]
+            for target in exposure.targets:
+                if target.expected_to_be_assigned_sdss_id:
+                    if target.catalogid > 0:
+                        catalogids.add(target.catalogid)
+                    else:
+                        twomass_designations.add(target.twomass_designation)
+        if meta:
+            # We will often run `get_almanac_data` in parallel (through multiple processes),
+            # so here we are avoiding opening a database connection until the child process starts.
+            from almanac.database import is_database_available, catalogdb
+            lookup_catalog = {}
+            lookup_twomass = {}
+            if catalogids and is_database_available:
+                q = (
+                    catalogdb.SDSS_ID_flat
+                    .select(
+                        catalogdb.SDSS_ID_flat.sdss_id,
+                        catalogdb.SDSS_ID_flat.catalogid
+                    )
+                    .where(
+                        catalogdb.SDSS_ID_flat.catalogid.in_(tuple(catalogids))
+                    &   (catalogdb.SDSS_ID_flat.rank == 1)
+                    )
+                    .tuples()
+                )
+                for sdss_id, catalogid in q:
+                    lookup_catalog[catalogid] = sdss_id
+            if twomass_designations and is_database_available:
+                q = (
+                    catalogdb.SDSS_ID_flat
+                    .select(
+                        catalogdb.SDSS_ID_flat.sdss_id,
+                        catalogdb.TwoMassPSC.designation
+                    )
+                    .join(
+                        catalogdb.CatalogToTwoMassPSC,
+                        on=(
+                            catalogdb.SDSS_ID_flat.catalogid
+                            == catalogdb.CatalogToTwoMassPSC.catalogid
+                        ),
+                    )
+                    .join(
+                        catalogdb.TwoMassPSC,
+                        on=(
+                            catalogdb.CatalogToTwoMassPSC.target_id
+                            == catalogdb.TwoMassPSC.pts_key
+                        ),
+                    )
+                    .where(
+                        catalogdb.TwoMassPSC.designation.in_(
+                            tuple(twomass_designations)
+                        )
+                    )
+                    .tuples()
+                )
+                for sdss_id, designation in q:
+                    lookup_twomass[designation] = sdss_id
+            # Add sdss_id to targets
+            for si, ei in sequences["objects"]:
+                for i in range(si - 1, ei):
+                    exposure = exposures[i]
+                    for target in exposure.targets:
+                        matches = [
+                            lookup_catalog.get(target.catalogid, -1),
+                            lookup_twomass.get(target.twomass_designation, -1)
+                        ]
+                        for match in matches:
+                            if match > 0:
+                                target.sdss_id = match
+                                break
+    return (observatory, mjd, exposures, sequences)