sparclclient 1.2.1__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,41 @@
1
+ # NOT INTENDED FOR PUBLIC USE!
2
+ #
3
+ # See:
4
+ # https://spectres.readthedocs.io/en/latest/
5
+ import math
6
+ import spectres
7
+ import numpy as np
8
+
9
+ # Local
10
+ import sparcl.client
11
+
12
+
13
+ # Per paper, should be able to pass all flux in one call to spectres
14
+ # https://arxiv.org/pdf/1705.05165.pdf
15
+ # Perhaps users would rather the bins uniform (1,5,20 Angstroms?)
16
def _resample_flux(records, wavstep=1):
    """Resample the flux of all *records* onto one common wavelength grid.

    Parameters:
        records: sequence of records, each exposing ``wavelength`` and
            ``flux`` vectors (as returned by SparclClient.retrieve).
        wavstep: bin width (Angstroms) of the common grid.

    Returns:
        (flux_2d, new_wavs): a float array of shape
        (len(records), len(new_wavs)) holding the resampled flux, and
        the common wavelength grid itself.
    """
    # Grid bounds: cover the full wavelength span of every record.
    smallest = math.floor(min(min(r.wavelength) for r in records))
    largest = math.ceil(max(max(r.wavelength) for r in records))

    new_wavs = np.arange(smallest, largest + 1, wavstep)
    # Fill with NaN explicitly rather than relying on NumPy's implicit
    # None -> NaN cast; every row is overwritten in the loop below.
    flux_2d = np.full([len(records), len(new_wavs)], np.nan, dtype=float)

    for idx, rec in enumerate(records):
        flux_2d[idx] = spectres.spectres(
            new_wavs, rec.wavelength, rec.flux, verbose=False
        )
    return flux_2d, new_wavs
32
+
33
+
34
def _tt0(numrecs=20):
    """Smoke test: fetch *numrecs* BOSS-DR16 records and resample them."""
    client = sparcl.client.SparclClient()
    found = client.find(
        constraints=dict(data_release=["BOSS-DR16"]), limit=numrecs
    )
    results = client.retrieve(found.ids)
    # _resample_flux already returns the (flux_2d, new_wavs) pair.
    return _resample_flux(results.records)
sparcl/sparc.ini ADDED
@@ -0,0 +1,11 @@
1
+ # This config file is for the NOIRLab Astro Data Archive client.
2
+ # It gets data from a server such as: https://specserver.noirlab.edu/
3
+
4
+ [DEFAULT]
5
+ ServerBaseUrl = https://specserver.noirlab.edu
6
+ ServerAliveInterval = 45
7
+
8
+
9
+ [sparc.server]
10
+ # Time limit (seconds) for connecting to NOIRLab Astro Data Archive server
11
+ ServerTimeout = 30
@@ -0,0 +1,418 @@
1
+ # Python Standard Library
2
+ from abc import ABC, abstractmethod
3
+ import copy
4
+
5
+ #!from pprint import pformat
6
+ from enum import Enum, auto
7
+
8
+ # External Packages
9
+ import numpy as np
10
+
11
+ #!import pandas as pd
12
+ from specutils import Spectrum1D
13
+ import astropy.units as u
14
+ from astropy.nddata import InverseVariance
15
+
16
+ # Local Packages
17
+ import sparcl.exceptions as ex
18
+
19
+
20
+ """It would be much better if this were abstracted and easier to
21
+ update with new Data Types and new DataReleases. Perhaps use
22
+ something like the Server "Personalities". I've rejected abstracting
23
+ for now because I think we need operational experience with the DataType
24
+ feature and how it interacts with other features (especially global
25
+ Rename and retrieve(INCLUDE).
26
+
27
+ DataType conversion should be done completely within the Client, not
28
+ on the Server. The obvious reason is Clients are language
29
+ dependent, the Server API is not. But for Client to be able to know
30
+ all about fields names (mapping from original to new names, which ones
31
+ are required) it needs info from the Server. The Client gets such
32
+ tables on instance instantiation through one web-service call that
33
+ grabs everything and pulls it apart into multiple DataField related
34
+ LUTs (LookUpTables, aka dictionaries).
35
+
36
+ Questions abound for use-cases.
37
+
38
+ 1. Is it very important to be able to convert a record LIST to a
39
+ single data structure? Example: for Pandas DataFrame we combine all
40
+ vectors in a record into a 2D DataFrame. What about those across
41
+ records into a 3D DataFrame?
42
+
43
+ 2. Should vectors and scalars be fundamentally separated? (see #1) If
44
+ so, how do we avoid hard coding the distinction for every
45
+ DataRelease?
46
+
47
+ """
48
+
49
+
50
+ # Replace all uses of string rtype with enum @@@
51
class Rtype(Enum):
    """Record types a JSON record may be converted to."""

    JSON = 1
    NUMPY = 2
    PANDAS = 3
    SPECTRUM1D = 4
56
+
57
+
58
class Convert(ABC):
    """Base class for converting a JSON record into a mix of plain
    Python values and a selected data record type.
    """

    @abstractmethod
    def to_numpy(self, record, o2nLUT):
        # Default behavior: hand back an independent copy of the record.
        return copy.deepcopy(record)

    @abstractmethod
    def to_spectrum1d(self, record, o2nLUT):
        # Default behavior: hand back an independent copy of the record.
        return copy.deepcopy(record)
72
+
73
+
74
+ #! @abstractmethod
75
+ #! def to_pandas(self, record, o2nLUT):
76
+ #! newrec = copy.deepcopy(record)
77
+ #! return(newrec)
78
+
79
+
80
class NoopConvert(Convert):
    """Identity converter: every to_* method returns the record unchanged."""

    def to_numpy(self, record, o2nLUT):
        # No conversion performed; record is returned as-is.
        return record

    def to_spectrum1d(self, record, o2nLUT):
        return record

    def to_pandas(self, record, o2nLUT):
        return record
89
+
90
+
91
class SdssDr16(Convert):
    """Converters for SDSS-DR16 records."""

    def to_numpy(self, record, o2nLUT):
        """Convert FitsFile record to a structure that uses Numpy"""
        vector_fields = [
            "spectra.coadd.and_mask",
            "spectra.coadd.flux",
            "spectra.coadd.ivar",
            "spectra.coadd.loglam",
            "spectra.coadd.model",
            "spectra.coadd.or_mask",
            "spectra.coadd.sky",
            "spectra.coadd.wdisp",
        ]
        rows = [record[o2nLUT[fld]] for fld in vector_fields if fld in o2nLUT]
        converted = dict(nparr=np.array(rows))
        # Carry over every renamed field that was not folded into the
        # array; the folded ones would only duplicate the array content.
        converted.update(
            {new: record[new]
             for orig, new in o2nLUT.items()
             if orig not in vector_fields and new in record}
        )
        return converted

    # Sdss
    def to_spectrum1d(self, record, o2nLUT):
        """Convert an SDSS record to a dict holding a Spectrum1D object."""
        consumed = [
            "red_shift",
            "spectra.coadd.flux",
            "spectra.coadd.ivar",
            "spectra.coadd.loglam",
            "spectra.coadd.and_mask",
        ]

        log_wave = record[o2nLUT["spectra.coadd.loglam"]]
        raw_flux = record[o2nLUT["spectra.coadd.flux"]]
        raw_ivar = record[o2nLUT["spectra.coadd.ivar"]]
        and_mask = record[o2nLUT["spectra.coadd.and_mask"]]

        # loglam holds log10(wavelength); recover linear Angstroms.
        spectral_axis = (10 ** np.array(log_wave)) * u.AA
        flux = np.array(raw_flux) * 10**-17 * u.Unit("erg cm-2 s-1 AA-1")
        uncertainty = InverseVariance(np.array(raw_ivar))
        redshift = record.get("red_shift")

        converted = dict(
            # flux, uncertainty, wavelength, mask(and), redshift
            spec1d=Spectrum1D(
                spectral_axis=spectral_axis,
                flux=flux,
                uncertainty=uncertainty,
                redshift=redshift,
                mask=and_mask,
            ),
        )
        converted.update(
            {new: record[new]
             for orig, new in o2nLUT.items()
             if orig not in consumed and new in record}
        )
        return converted
150
+
151
+
152
+ #! def to_pandas(self, record, o2nLUT):
153
+ #! arflds = [
154
+ #! 'spectra.coadd.and_mask',
155
+ #! 'spectra.coadd.flux',
156
+ #! 'spectra.coadd.ivar',
157
+ #! 'spectra.coadd.loglam',
158
+ #! 'spectra.coadd.model',
159
+ #! 'spectra.coadd.or_mask',
160
+ #! 'spectra.coadd.sky',
161
+ #! 'spectra.coadd.wdisp',
162
+ #! ]
163
+ #! dfdict = dict((o2nLUT[f], record[o2nLUT[f]])
164
+ #! for f in arflds if f in o2nLUT)
165
+ #! newrec = dict(df = pd.DataFrame(dfdict))
166
+ #! for orig,new in o2nLUT.items():
167
+ #! if orig in arflds:
168
+ #! continue
169
+ #! if new in record:
170
+ #! newrec[new] = record[new]
171
+ #! return(newrec)
172
+
173
+
174
class BossDr16(Convert):
    """Converters for BOSS-DR16 records (upper-case coadd field names)."""

    def to_numpy(self, record, o2nLUT):
        """Convert a BOSS record to a dict holding a 2D Numpy array."""
        vector_fields = [
            "spectra.coadd.AND_MASK",
            "spectra.coadd.FLUX",
            "spectra.coadd.IVAR",
            "spectra.coadd.LOGLAM",
            "spectra.coadd.MODEL",
            "spectra.coadd.OR_MASK",
            "spectra.coadd.SKY",
            "spectra.coadd.WDISP",
        ]
        rows = [record[o2nLUT[fld]] for fld in vector_fields if fld in o2nLUT]
        converted = dict(nparr=np.array(rows))
        # Don't carry over the fields used to build the new datatype.
        # That would duplicate content already held in the array.
        converted.update(
            {new: record[new]
             for orig, new in o2nLUT.items()
             if orig not in vector_fields and new in record}
        )
        return converted

    # BOSS
    def to_spectrum1d(self, record, o2nLUT):
        """Convert a BOSS record to a dict holding a Spectrum1D object."""
        consumed = [
            "red_shift",
            "spectra.coadd.FLUX",
            "spectra.coadd.IVAR",
            "spectra.coadd.LOGLAM",
            "spectra.coadd.AND_MASK",
        ]
        log_wave = record[o2nLUT["spectra.coadd.LOGLAM"]]
        raw_flux = record[o2nLUT["spectra.coadd.FLUX"]]
        raw_ivar = record[o2nLUT["spectra.coadd.IVAR"]]
        and_mask = record[o2nLUT["spectra.coadd.AND_MASK"]]

        # LOGLAM holds log10(wavelength); recover linear Angstroms.
        spectral_axis = (10 ** np.array(log_wave)) * u.AA
        flux = np.array(raw_flux) * 10**-17 * u.Unit("erg cm-2 s-1 AA-1")
        uncertainty = InverseVariance(np.array(raw_ivar))
        redshift = record.get("red_shift")

        converted = dict(
            # flux, uncertainty, wavelength, mask(and), redshift
            spec1d=Spectrum1D(
                spectral_axis=spectral_axis,
                flux=flux,
                uncertainty=uncertainty,
                redshift=redshift,
                mask=and_mask,
            ),
        )
        converted.update(
            {new: record[new]
             for orig, new in o2nLUT.items()
             if orig not in consumed and new in record}
        )
        return converted
233
+
234
+
235
+ #! def to_pandas(self, record, o2nLUT): # BOSS
236
+ #! arflds = [
237
+ #! 'spectra.coadd.AND_MASK',
238
+ #! 'spectra.coadd.FLUX',
239
+ #! 'spectra.coadd.IVAR',
240
+ #! 'spectra.coadd.LOGLAM',
241
+ #! 'spectra.coadd.MODEL',
242
+ #! 'spectra.coadd.OR_MASK',
243
+ #! 'spectra.coadd.SKY',
244
+ #! 'spectra.coadd.WDISP',
245
+ #! ]
246
+ #! dfdict = dict((o2nLUT[f], record[o2nLUT[f]])
247
+ #! for f in arflds if f in o2nLUT)
248
+ #! newrec = dict(df = pd.DataFrame(dfdict))
249
+ #! for orig,new in o2nLUT.items():
250
+ #! if orig in arflds:
251
+ #! continue
252
+ #! if new in record:
253
+ #! newrec[new] = record[new]
254
+ #! return(newrec)
255
+
256
+
257
class Desi(Convert):
    """Converters for DESI records (one spectrum per b/r/z camera band)."""

    def to_numpy(self, record, o2nLUT):
        """Convert a DESI record to a dict holding a 2D Numpy array.

        All twelve per-band vectors (flux, ivar, mask, wavelength for
        the b, r, z cameras) are stacked into one array under 'nparr'.
        """
        arflds = [
            "spectra.b_flux",
            "spectra.b_ivar",
            "spectra.b_mask",
            "spectra.b_wavelength",
            "spectra.r_flux",
            "spectra.r_ivar",
            "spectra.r_mask",
            "spectra.r_wavelength",
            "spectra.z_flux",
            "spectra.z_ivar",
            "spectra.z_mask",
            "spectra.z_wavelength",
        ]
        lofl = [record[o2nLUT[f]] for f in arflds if f in o2nLUT]
        newrec = dict(nparr=np.array(lofl))
        # Don't carry over the fields used to build the new datatype;
        # their content is already in the array.
        for orig, new in o2nLUT.items():
            if orig in arflds:
                continue
            if new in record:
                newrec[new] = record[new]
        return newrec

    def _band_spectrum1d(self, record, o2nLUT, band, redshift):
        """Build a Spectrum1D for one DESI camera band ('b', 'r' or 'z')."""
        wavelength = (
            np.array(record[o2nLUT[f"spectra.{band}_wavelength"]]) * u.AA
        )
        flux = (
            np.array(record[o2nLUT[f"spectra.{band}_flux"]])
            * 10**-17
            * u.Unit("erg cm-2 s-1 AA-1")
        )
        ivar = InverseVariance(np.array(record[o2nLUT[f"spectra.{band}_ivar"]]))
        mask = record[o2nLUT[f"spectra.{band}_mask"]]
        return Spectrum1D(
            spectral_axis=wavelength,
            flux=flux,
            uncertainty=ivar,
            redshift=redshift,
            mask=mask,
        )

    def to_spectrum1d(self, record, o2nLUT):  # Desi
        """Convert a DESI record to a dict with one Spectrum1D per band.

        Returns a dict with keys 'b_spec1d', 'r_spec1d', 'z_spec1d'
        plus every renamed scalar field not consumed by the conversion.
        """
        arflds = [
            "red_shift",
            "spectra.b_flux",
            "spectra.b_ivar",
            "spectra.b_mask",
            "spectra.b_wavelength",
            "spectra.r_flux",
            "spectra.r_ivar",
            "spectra.r_mask",
            "spectra.r_wavelength",
            "spectra.z_flux",
            "spectra.z_ivar",
            "spectra.z_mask",
            "spectra.z_wavelength",
        ]

        z = record.get("red_shift")

        # The three camera bands only differ by field-name prefix, so
        # one helper builds each flux/uncertainty/wavelength/mask bundle.
        newrec = {
            f"{band}_spec1d": self._band_spectrum1d(record, o2nLUT, band, z)
            for band in ("b", "r", "z")
        }
        for orig, new in o2nLUT.items():
            if orig in arflds:
                continue
            if new in record:
                newrec[new] = record[new]
        return newrec
361
+
362
+
363
class DesiDenali(Desi):
    # Inherits every conversion unchanged from Desi; no overrides needed.
    pass
365
+
366
+
367
class DesiEverest(Desi):
    # Inherits every conversion unchanged from Desi; no overrides needed.
    pass
369
+
370
+
371
# DR Instance LookUp Table: maps a Data Release name to the Convert
# instance that transforms its records.
diLUT = {
    "SDSS-DR16": SdssDr16(),
    "BOSS-DR16": BossDr16(),
    "DESI-denali": DesiDenali(),
    "DESI-everest": DesiEverest(),
    # NOTE: NoopConvert is deliberately not registered, so an unknown
    # Data Release fails validation instead of converting silently.
    #'Unknown': NoopConvert(),
}
379
+
380
+
381
def convert(record, rtype, client, include, verbose=False):
    """Convert one JSON record to the requested record type.

    Parameters:
        record: dict from the server; must contain the '_dr' key
            naming its Data Release (unless rtype is None).
        rtype: one of 'json', 'numpy', 'pandas', 'spectrum1d';
            None (and 'json') return the record unchanged.
        client: client instance supplying orig2newLUT field mappings.
        include: not currently applied (the pruning logic that used it
            is commented out below).
        verbose: unused here; kept for interface compatibility.

    Raises:
        ex.UnkDr: when the record's Data Release has no converter.
        Exception: when rtype is not a recognized record type.
    """
    if rtype is None:
        return record

    dr = record["_dr"]

    # Validate parameters
    if dr not in diLUT:
        allowed = ", ".join(diLUT.keys())
        msg = (
            f'The Data Set associated with a record, "{dr}",'
            f" is not supported for Type Conversion."
            f" Available Data Sets are: {allowed}."
        )
        raise ex.UnkDr(msg)

    # Membership was validated above, so index directly (the previous
    # .get(dr, NoopConvert()) default was unreachable).
    drin = diLUT[dr]

    o2nLUT = copy.copy(client.orig2newLUT[dr])  # orig2newLUT[dr][orig] = new
    o2nLUT["_dr"] = "_dr"
    #!n2oLUT = client.new2origLUT[dr]
    #!required = set(client.required[dr])
    #!if include is not None:
    #!    nuke = set(n2oLUT.keys()).difference(required.union(include))
    #!    for new in nuke:
    #!        del o2nLUT[n2oLUT[new]]

    if rtype == "json":
        return record
    elif rtype == "numpy":
        return drin.to_numpy(record, o2nLUT)
    elif rtype == "pandas":
        # NOTE(review): to_pandas is commented out in every registered
        # converter, so this path raises AttributeError for all current
        # Data Releases — confirm before enabling 'pandas' publicly.
        return drin.to_pandas(record, o2nLUT)
    elif rtype == "spectrum1d":
        return drin.to_spectrum1d(record, o2nLUT)
    else:
        raise Exception(f"Unknown record type ({rtype})")
sparcl/unsupported.py ADDED
@@ -0,0 +1,65 @@
1
+ # End Users should not use anything from this file. All of it is
2
+ # considered experimental and may be broken or changed without notice.
3
+ ############################################
4
+ # Python Standard Library
5
+ from urllib.parse import urlencode
6
+
7
+ #!from urllib.parse import urlparse
8
+ #!from warnings import warn
9
+ import pickle
10
+ import tempfile
11
+ import json
12
+
13
+ ############################################
14
+ # External Packages
15
+ import requests
16
+
17
+ ############################################
18
+ # Local Packages
19
+ #!from sparcl.fields import Fields
20
+ import sparcl.exceptions as ex
21
+
22
+ _STAGE = "https://sparclstage.datalab.noirlab.edu" # noqa: E221
23
+ _PAT = "https://sparc1.datalab.noirlab.edu" # noqa: E221
24
+
25
+ drs = ["SDSS-DR16", "BOSS-DR16", "DESI-EDR"]
26
+
27
+
28
def retrieve(
    ids,
    include=None,
    dataset_list=None,
    server=_PAT,
    svc="spectras",  # or 'retrieve',
    limit=100,
    verbose=True,
):
    """Retrieve spectra records for *ids* directly from a SPARCL server.

    Parameters:
        ids: list of record identifiers to POST to the server.
        include: field names to return; defaults to ['id'].
        dataset_list: Data Sets to search; defaults to ['BOSS-DR16'].
        server: base URL of the server.
        svc: service endpoint name.
        limit: maximum number of records.
        verbose: print the URL and an equivalent curl command.

    Returns:
        The object unpickled from the server response body.

    Raises:
        An exception from ex.genSparclException on any non-200 response.
    """
    # None sentinels avoid the shared-mutable-default-argument pitfall.
    if include is None:
        include = ["id"]
    if dataset_list is None:
        dataset_list = ["BOSS-DR16"]

    uparams = dict(
        include=",".join(include),
        limit=limit,
        dataset_list=",".join(dataset_list),
    )
    qstr = urlencode(uparams)

    url = f"{server}/sparc/{svc}/?{qstr}"
    if verbose:
        print(f"Using ids={ids[:2]}")
        print(f'Using url="{url}"')
        print(f"curl -X POST \"{url}\" -d '{json.dumps(ids)}' > retrieve.pkl")

    res = requests.post(url, json=ids)

    if res.status_code != 200:
        #! if verbose and ('traceback' in res.json()):
        #!     print(f'DBG: Server traceback=\n{res.json()["traceback"]}')
        raise ex.genSparclException(res, verbose=verbose)

    # Unpack the pickled payload from the response body.
    # SECURITY NOTE(review): pickle.load on data fetched over the
    # network is only safe when the server is fully trusted.
    with tempfile.TemporaryFile(mode="w+b") as fp:
        for chunk in res.iter_content(chunk_size=None):
            fp.write(chunk)
        # Rewind so pickle reads from the start of the file.
        fp.seek(0)
        results = pickle.load(fp)

    return results