imap-processing 1.0.0__py3-none-any.whl → 1.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of imap-processing might be problematic. Click here for more details.

Files changed (43)
  1. imap_processing/_version.py +2 -2
  2. imap_processing/cdf/config/imap_codice_global_cdf_attrs.yaml +13 -1
  3. imap_processing/cdf/config/imap_codice_l2-hi-omni_variable_attrs.yaml +635 -0
  4. imap_processing/cdf/config/imap_codice_l2-hi-sectored_variable_attrs.yaml +422 -0
  5. imap_processing/cdf/config/imap_enamaps_l2-common_variable_attrs.yaml +28 -21
  6. imap_processing/cdf/config/imap_enamaps_l2-healpix_variable_attrs.yaml +2 -0
  7. imap_processing/cdf/config/imap_enamaps_l2-rectangular_variable_attrs.yaml +12 -2
  8. imap_processing/cli.py +6 -11
  9. imap_processing/codice/codice_l2.py +640 -127
  10. imap_processing/codice/constants.py +61 -0
  11. imap_processing/ena_maps/ena_maps.py +111 -60
  12. imap_processing/ena_maps/utils/coordinates.py +5 -0
  13. imap_processing/ena_maps/utils/corrections.py +268 -0
  14. imap_processing/ena_maps/utils/map_utils.py +143 -42
  15. imap_processing/hi/hi_l2.py +3 -8
  16. imap_processing/ialirt/constants.py +7 -1
  17. imap_processing/ialirt/generate_coverage.py +1 -1
  18. imap_processing/ialirt/l0/process_codice.py +66 -0
  19. imap_processing/ialirt/utils/create_xarray.py +1 -0
  20. imap_processing/idex/idex_l2a.py +2 -2
  21. imap_processing/idex/idex_l2b.py +1 -1
  22. imap_processing/lo/l1c/lo_l1c.py +61 -3
  23. imap_processing/lo/l2/lo_l2.py +79 -11
  24. imap_processing/mag/l1a/mag_l1a.py +2 -2
  25. imap_processing/mag/l1a/mag_l1a_data.py +71 -13
  26. imap_processing/mag/l1c/interpolation_methods.py +34 -13
  27. imap_processing/mag/l1c/mag_l1c.py +117 -67
  28. imap_processing/mag/l1d/mag_l1d_data.py +3 -1
  29. imap_processing/spice/geometry.py +11 -9
  30. imap_processing/spice/pointing_frame.py +77 -50
  31. imap_processing/swapi/l1/swapi_l1.py +12 -4
  32. imap_processing/swe/utils/swe_constants.py +7 -7
  33. imap_processing/ultra/l1b/extendedspin.py +1 -1
  34. imap_processing/ultra/l1b/ultra_l1b_culling.py +2 -2
  35. imap_processing/ultra/l1b/ultra_l1b_extended.py +1 -1
  36. imap_processing/ultra/l1c/helio_pset.py +1 -1
  37. imap_processing/ultra/l1c/spacecraft_pset.py +2 -2
  38. imap_processing-1.0.1.dist-info/METADATA +121 -0
  39. {imap_processing-1.0.0.dist-info → imap_processing-1.0.1.dist-info}/RECORD +42 -40
  40. imap_processing-1.0.0.dist-info/METADATA +0 -120
  41. {imap_processing-1.0.0.dist-info → imap_processing-1.0.1.dist-info}/LICENSE +0 -0
  42. {imap_processing-1.0.0.dist-info → imap_processing-1.0.1.dist-info}/WHEEL +0 -0
  43. {imap_processing-1.0.0.dist-info → imap_processing-1.0.1.dist-info}/entry_points.txt +0 -0
@@ -10,51 +10,627 @@ dataset = process_codice_l2(l1_filename)
10
10
  """
11
11
 
12
12
  import logging
13
- from pathlib import Path
14
13
 
15
14
  import numpy as np
15
+ import pandas as pd
16
16
  import xarray as xr
17
+ from imap_data_access import ProcessingInputCollection, ScienceFilePath
17
18
 
18
19
  from imap_processing.cdf.imap_cdf_manager import ImapCdfAttributes
19
20
  from imap_processing.cdf.utils import load_cdf
20
- from imap_processing.codice.constants import HALF_SPIN_LUT
21
+ from imap_processing.codice.constants import (
22
+ HALF_SPIN_LUT,
23
+ HI_L2_ELEVATION_ANGLE,
24
+ HI_OMNI_VARIABLE_NAMES,
25
+ HI_SECTORED_VARIABLE_NAMES,
26
+ L2_GEOMETRIC_FACTOR,
27
+ L2_HI_NUMBER_OF_SSD,
28
+ L2_HI_SECTORED_ANGLE,
29
+ LO_NSW_SPECIES_VARIABLE_NAMES,
30
+ LO_SW_PICKUP_ION_SPECIES_VARIABLE_NAMES,
31
+ LO_SW_SPECIES_VARIABLE_NAMES,
32
+ NSW_POSITIONS,
33
+ PUI_POSITIONS,
34
+ SW_POSITIONS,
35
+ )
21
36
 
22
37
  logger = logging.getLogger(__name__)
23
38
  logger.setLevel(logging.INFO)
24
39
 
25
40
 
26
- def process_codice_l2(file_path: Path) -> xr.Dataset:
41
+ def get_geometric_factor_lut(dependencies: ProcessingInputCollection) -> dict:
27
42
  """
28
- Will process CoDICE l1 data to create l2 data products.
43
+ Get the geometric factor lookup table.
29
44
 
30
45
  Parameters
31
46
  ----------
32
- file_path : pathlib.Path
33
- Path to the CoDICE L1 file to process.
47
+ dependencies : ProcessingInputCollection
48
+ The collection of processing input files.
34
49
 
35
50
  Returns
36
51
  -------
37
- l2_dataset : xarray.Dataset
38
- The``xarray`` dataset containing the science data and supporting metadata.
52
+ geometric_factor_lut : dict
53
+ A dict with a full and reduced mode array with shape (esa_steps, position).
54
+ """
55
+ geometric_factors = pd.read_csv(
56
+ dependencies.get_file_paths(descriptor="l2-lo-gfactor")[0]
57
+ )
58
+
59
+ # sort by esa step. They should already be sorted, but just in case
60
+ full = geometric_factors[geometric_factors["mode"] == "full"].sort_values(
61
+ by="esa_step"
62
+ )
63
+ reduced = geometric_factors[geometric_factors["mode"] == "reduced"].sort_values(
64
+ by="esa_step"
65
+ )
66
+
67
+ # Sort position columns to ensure the correct order
68
+ position_names_sorted = sorted(
69
+ [col for col in full if col.startswith("position")],
70
+ key=lambda x: int(x.split("_")[-1]),
71
+ )
72
+
73
+ return {
74
+ "full": full[position_names_sorted].to_numpy(),
75
+ "reduced": reduced[position_names_sorted].to_numpy(),
76
+ }
77
+
78
+
79
+ def get_efficiency_lut(dependencies: ProcessingInputCollection) -> pd.DataFrame:
39
80
  """
40
- logger.info(f"Processing {file_path}")
81
+ Get the efficiency lookup table.
82
+
83
+ Parameters
84
+ ----------
85
+ dependencies : ProcessingInputCollection
86
+ The collection of processing input files.
87
+
88
+ Returns
89
+ -------
90
+ efficiency_lut : pandas.DataFrame
91
+ Contains the efficiency lookup table. Columns are:
92
+ species, product, esa_step, position_1, position_2, ..., position_24.
93
+ """
94
+ return pd.read_csv(dependencies.get_file_paths(descriptor="l2-lo-efficiency")[0])
41
95
 
42
- # Open the l1 file
43
- l1_dataset = load_cdf(file_path)
44
96
 
45
- # Use the logical source as a way to distinguish between data products and
46
- # set some useful distinguishing variables
47
- # TODO: Could clean this up by using imap-data-access methods?
48
- dataset_name = l1_dataset.attrs["Logical_source"]
49
- data_level = dataset_name.removeprefix("imap_codice_").split("_")[0]
50
- dataset_name = dataset_name.replace(data_level, "l2")
97
+ def get_species_efficiency(species: str, efficiency: pd.DataFrame) -> np.ndarray:
98
+ """
99
+ Get the efficiency values for a given species.
51
100
 
52
- # Use the L1 data product as a starting point for L2
53
- l2_dataset = l1_dataset.copy()
101
+ Parameters
102
+ ----------
103
+ species : str
104
+ The species name.
105
+ efficiency : pandas.DataFrame
106
+ The efficiency lookup table.
54
107
 
55
- # Get the L2 CDF attributes
108
+ Returns
109
+ -------
110
+ efficiency : np.ndarray
111
+ A 2D array of efficiencies with shape (epoch, esa_steps).
112
+ """
113
+ species_efficiency = efficiency[efficiency["species"] == species].sort_values(
114
+ by="esa_step"
115
+ )
116
+ # Sort position columns to ensure the correct order
117
+ position_names_sorted = sorted(
118
+ [col for col in species_efficiency if col.startswith("position")],
119
+ key=lambda x: int(x.split("_")[-1]),
120
+ )
121
+ # Shape: (esa_steps, positions)
122
+ return species_efficiency[position_names_sorted].to_numpy()
123
+
124
+
125
+ def compute_geometric_factors(
126
+ dataset: xr.Dataset, geometric_factor_lookup: dict
127
+ ) -> np.ndarray:
128
+ """
129
+ Calculate geometric factors needed for intensity calculations.
130
+
131
+ Geometric factors are determined by comparing the half-spin values per
132
+ esa_step in the HALF_SPIN_LUT to the rgfo_half_spin values in the provided
133
+ L2 dataset.
134
+
135
+ If the half-spin value is less than the corresponding rgfo_half_spin value,
136
+ the geometric factor is set to 0.75 (full mode); otherwise, it is set to 0.5
137
+ (reduced mode).
138
+
139
+ NOTE: Half spin values are associated with ESA steps which corresponds to the
140
+ index of the energy_per_charge dimension that is between 0 and 127.
141
+
142
+ Parameters
143
+ ----------
144
+ dataset : xarray.Dataset
145
+ The L2 dataset containing rgfo_half_spin data variable.
146
+ geometric_factor_lookup : dict
147
+ A dict with a full and reduced mode array with shape (esa_steps, position).
148
+
149
+ Returns
150
+ -------
151
+ geometric_factors : np.ndarray
152
+ A 3D array of geometric factors with shape (epoch, esa_steps, positions).
153
+ """
154
+ # Convert the HALF_SPIN_LUT to a reverse mapping of esa_step to half_spin
155
+ esa_step_to_half_spin_map = {
156
+ val: key for key, vals in HALF_SPIN_LUT.items() for val in vals
157
+ }
158
+
159
+ # Create a list of half_spin values corresponding to ESA steps (0 to 127)
160
+ half_spin_values = np.array(
161
+ [esa_step_to_half_spin_map[step] for step in range(128)]
162
+ )
163
+ # Expand dimensions to compare each rgfo_half_spin value against
164
+ # all half_spin_values
165
+ rgfo_half_spin = dataset.rgfo_half_spin.data[:, np.newaxis] # Shape: (epoch, 1)
166
+ # Perform the comparison and calculate modes
167
+ # Modes will be true (reduced mode) anywhere half_spin >= rgfo_half_spin otherwise
168
+ # false (full mode)
169
+ modes = half_spin_values >= rgfo_half_spin
170
+
171
+ # Get the geometric factors based on the modes
172
+ gf = np.where(
173
+ modes[:, :, np.newaxis], # Shape (epoch, esa_step, 1)
174
+ geometric_factor_lookup["reduced"], # Shape (1, esa_step, 24) - reduced mode
175
+ geometric_factor_lookup["full"], # Shape (1, esa_step, 24) - full mode
176
+ ) # Shape: (epoch, esa_step, positions)
177
+ return gf
178
+
179
+
180
+ def process_lo_species_intensity(
181
+ dataset: xr.Dataset,
182
+ species_list: list,
183
+ geometric_factors: np.ndarray,
184
+ efficiency: pd.DataFrame,
185
+ positions: list,
186
+ ) -> xr.Dataset:
187
+ """
188
+ Process the lo-species L2 dataset to calculate species intensities.
189
+
190
+ Parameters
191
+ ----------
192
+ dataset : xarray.Dataset
193
+ The L2 dataset to process.
194
+ species_list : list
195
+ List of species variable names to calculate intensity.
196
+ geometric_factors : np.ndarray
197
+ The geometric factors array with shape (epoch, esa_steps).
198
+ efficiency : pandas.DataFrame
199
+ The efficiency lookup table.
200
+ positions : list
201
+ A list of position indices to select from the geometric factor and
202
+ efficiency lookup tables.
203
+
204
+ Returns
205
+ -------
206
+ xarray.Dataset
207
+ The updated L2 dataset with species intensities calculated.
208
+ """
209
+ # Select the relevant positions from the geometric factors
210
+ geometric_factors = geometric_factors[:, :, positions]
211
+ # take the mean geometric factor across positions
212
+ geometric_factors = np.nanmean(geometric_factors, axis=-1)
213
+ scaler = len(positions)
214
+ # Calculate the species intensities using the provided geometric factors and
215
+ # efficiency. Species_intensity = species_rate / (gm * eff * esa_step)
216
+ for species in species_list:
217
+ # Select the relevant positions for the species from the efficiency LUT
218
+ # Shape: (epoch, esa_steps, positions)
219
+ species_eff = get_species_efficiency(species, efficiency)[
220
+ np.newaxis, :, positions
221
+ ]
222
+ if species_eff.size == 0:
223
+ logger.warning("No efficiency data found for species {species}. Skipping.")
224
+ continue
225
+ # Take the mean efficiency across positions
226
+ species_eff = np.nanmean(species_eff, axis=-1)
227
+ denominator = (
228
+ scaler * geometric_factors * species_eff * dataset["energy_table"].data
229
+ )
230
+ if species not in dataset:
231
+ logger.warning(
232
+ f"Species {species} not found in dataset. Filling with NaNS."
233
+ )
234
+ dataset[species] = np.full(dataset["energy_table"].data.shape, np.nan)
235
+ else:
236
+ dataset[species] = dataset[species] / denominator[:, :, np.newaxis]
237
+
238
+ return dataset
239
+
240
+
241
+ def process_hi_omni(dependencies: ProcessingInputCollection) -> xr.Dataset:
242
+ """
243
+ Process the hi-omni L1B dataset to calculate omni-directional intensities.
244
+
245
+ See section 11.1.3 of the CoDICE algorithm document for details.
246
+
247
+ The formula for omni-directional intensities is::
248
+
249
+ l1B species data / (
250
+ geometric_factor * number_of_ssd * efficiency * energy_passband
251
+ )
252
+
253
+ Geometric factor is constant for all species which is 0.013.
254
+ Number of SSD is constant for all species which is 12.
255
+ Efficiency is provided in a CSV file for each species and energy bin.
256
+ Energy passband is calculated from L1B variables energy_bin_minus + energy_bin_plus
257
+
258
+ Parameters
259
+ ----------
260
+ dependencies : ProcessingInputCollection
261
+ The collection of processing input files.
262
+
263
+ Returns
264
+ -------
265
+ xarray.Dataset
266
+ The updated L2 dataset with omni-directional intensities calculated.
267
+ """
268
+ l1b_file = dependencies.get_file_paths(descriptor="hi-omni")[0]
269
+ l1b_dataset = load_cdf(l1b_file)
270
+
271
+ # Read the efficiencies data from the CSV file
272
+ efficiencies_file = dependencies.get_file_paths(descriptor="l2-hi-omni-efficiency")[
273
+ 0
274
+ ]
275
+ efficiencies_df = pd.read_csv(efficiencies_file)
276
+ # Omni product has 8 species and each species has different shape.
277
+ # Eg.
278
+ # h - (epoch, 15)
279
+ # c - (epoch, 18)
280
+ # uh - (epoch, 5)
281
+ # etc.
282
+ # Because of that, we need to loop over each species and calculate
283
+ # omni-directional intensities separately.
284
+ for species in HI_OMNI_VARIABLE_NAMES:
285
+ species_data = efficiencies_df[efficiencies_df["species"] == species]
286
+ # Read current species' effificiency
287
+ species_efficiencies = species_data["average_efficiency"].values[np.newaxis, :]
288
+ # Calculate energy passband from L1B data
289
+ energy_passbands = (
290
+ l1b_dataset[f"energy_{species}_plus"]
291
+ + l1b_dataset[f"energy_{species}_minus"]
292
+ ).values[np.newaxis, :]
293
+ # Calculate omni-directional intensities
294
+ omni_direction_intensities = l1b_dataset[species] / (
295
+ L2_GEOMETRIC_FACTOR
296
+ * L2_HI_NUMBER_OF_SSD
297
+ * species_efficiencies
298
+ * energy_passbands
299
+ )
300
+ # Store by replacing existing species data with omni-directional intensities
301
+ l1b_dataset[species].values = omni_direction_intensities
302
+
303
+ # TODO: this may go away once Joey and I fix L1B CDF
304
+ # Update global CDF attributes
56
305
  cdf_attrs = ImapCdfAttributes()
57
- l2_dataset = add_dataset_attributes(l2_dataset, dataset_name, cdf_attrs)
306
+ cdf_attrs.add_instrument_global_attrs("codice")
307
+ cdf_attrs.add_instrument_variable_attrs("codice", "l2-hi-omni")
308
+ l1b_dataset.attrs = cdf_attrs.get_global_attributes("imap_codice_l2_hi-omni")
309
+
310
+ # TODO: ask Joey to add attrs for epoch_delta_plus and epoch_delta_minus
311
+ # and update dimension to be 'epoch' in L1B data
312
+ for variable in l1b_dataset.data_vars:
313
+ if variable in ["epoch_delta_plus", "epoch_delta_minus", "data_quality"]:
314
+ l1b_dataset[variable].attrs = cdf_attrs.get_variable_attributes(
315
+ variable, check_schema=False
316
+ )
317
+ else:
318
+ l1b_dataset[variable].attrs = cdf_attrs.get_variable_attributes(
319
+ variable, check_schema=False
320
+ )
321
+
322
+ # Add these new coordinates
323
+ new_coords = {
324
+ "energy_h": l1b_dataset["energy_h"],
325
+ "energy_h_label": xr.DataArray(
326
+ l1b_dataset["energy_h"].values.astype(str),
327
+ dims=("energy_h",),
328
+ attrs=cdf_attrs.get_variable_attributes(
329
+ "energy_h_label", check_schema=False
330
+ ),
331
+ ),
332
+ "energy_he3": l1b_dataset["energy_he3"],
333
+ "energy_he3_label": xr.DataArray(
334
+ l1b_dataset["energy_he3"].values.astype(str),
335
+ dims=("energy_he3",),
336
+ attrs=cdf_attrs.get_variable_attributes(
337
+ "energy_he3_label", check_schema=False
338
+ ),
339
+ ),
340
+ "energy_he4": l1b_dataset["energy_he4"],
341
+ "energy_he4_label": xr.DataArray(
342
+ l1b_dataset["energy_he4"].values.astype(str),
343
+ dims=("energy_he4",),
344
+ attrs=cdf_attrs.get_variable_attributes(
345
+ "energy_he4_label", check_schema=False
346
+ ),
347
+ ),
348
+ "energy_c": l1b_dataset["energy_c"],
349
+ "energy_c_label": xr.DataArray(
350
+ l1b_dataset["energy_c"].values.astype(str),
351
+ dims=("energy_c",),
352
+ attrs=cdf_attrs.get_variable_attributes(
353
+ "energy_c_label", check_schema=False
354
+ ),
355
+ ),
356
+ "energy_o": l1b_dataset["energy_o"],
357
+ "energy_o_label": xr.DataArray(
358
+ l1b_dataset["energy_o"].values.astype(str),
359
+ dims=("energy_o",),
360
+ attrs=cdf_attrs.get_variable_attributes(
361
+ "energy_o_label", check_schema=False
362
+ ),
363
+ ),
364
+ "energy_ne_mg_si": l1b_dataset["energy_ne_mg_si"],
365
+ "energy_ne_mg_si_label": xr.DataArray(
366
+ l1b_dataset["energy_ne_mg_si"].values.astype(str),
367
+ dims=("energy_ne_mg_si",),
368
+ attrs=cdf_attrs.get_variable_attributes(
369
+ "energy_ne_mg_si_label", check_schema=False
370
+ ),
371
+ ),
372
+ "energy_fe": l1b_dataset["energy_fe"],
373
+ "energy_fe_label": xr.DataArray(
374
+ l1b_dataset["energy_fe"].values.astype(str),
375
+ dims=("energy_fe",),
376
+ attrs=cdf_attrs.get_variable_attributes(
377
+ "energy_fe_label", check_schema=False
378
+ ),
379
+ ),
380
+ "energy_uh": l1b_dataset["energy_uh"],
381
+ "energy_uh_label": xr.DataArray(
382
+ l1b_dataset["energy_uh"].values.astype(str),
383
+ dims=("energy_uh",),
384
+ attrs=cdf_attrs.get_variable_attributes(
385
+ "energy_uh_label", check_schema=False
386
+ ),
387
+ ),
388
+ "energy_junk": l1b_dataset["energy_junk"],
389
+ "energy_junk_label": xr.DataArray(
390
+ l1b_dataset["energy_junk"].values.astype(str),
391
+ dims=("energy_junk",),
392
+ attrs=cdf_attrs.get_variable_attributes(
393
+ "energy_junk_label", check_schema=False
394
+ ),
395
+ ),
396
+ "epoch": xr.DataArray(
397
+ l1b_dataset["epoch"].data,
398
+ dims=("epoch",),
399
+ attrs=cdf_attrs.get_variable_attributes("epoch", check_schema=False),
400
+ ),
401
+ }
402
+ l1b_dataset = l1b_dataset.assign_coords(new_coords)
403
+
404
+ return l1b_dataset
405
+
406
+
407
+ def process_hi_sectored(dependencies: ProcessingInputCollection) -> xr.Dataset:
408
+ """
409
+ Process the hi-omni L1B dataset to calculate omni-directional intensities.
410
+
411
+ See section 11.1.2 of the CoDICE algorithm document for details.
412
+
413
+ The formula for omni-directional intensities is::
414
+
415
+ l1b species data / (geometric_factor * efficiency * energy_passband)
416
+
417
+ Geometric factor is constant for all species and is 0.013.
418
+ Efficiency is provided in a CSV file for each species and energy bin and
419
+ position.
420
+ Energy passband is calculated from energy_bin_minus + energy_bin_plus
421
+
422
+ Parameters
423
+ ----------
424
+ dependencies : ProcessingInputCollection
425
+ The collection of processing input files.
426
+
427
+ Returns
428
+ -------
429
+ xarray.Dataset
430
+ The updated L2 dataset with omni-directional intensities calculated.
431
+ """
432
+ file_path = dependencies.get_file_paths(descriptor="hi-sectored")[0]
433
+ l1b_dataset = load_cdf(file_path)
434
+
435
+ # Update global CDF attributes
436
+ cdf_attrs = ImapCdfAttributes()
437
+ cdf_attrs.add_instrument_global_attrs("codice")
438
+ cdf_attrs.add_instrument_variable_attrs("codice", "l2-hi-sectored")
439
+
440
+ # Overwrite L1B variable attributes with L2 variable attributes
441
+ l2_dataset = xr.Dataset(
442
+ coords={
443
+ "spin_sector": l1b_dataset["spin_sector"],
444
+ "spin_sector_label": xr.DataArray(
445
+ l1b_dataset["spin_sector"].values.astype(str),
446
+ dims=("spin_sector",),
447
+ attrs=cdf_attrs.get_variable_attributes(
448
+ "spin_sector_label", check_schema=False
449
+ ),
450
+ ),
451
+ "energy_h": l1b_dataset["energy_h"],
452
+ "energy_h_label": xr.DataArray(
453
+ l1b_dataset["energy_h"].values.astype(str),
454
+ dims=("energy_h",),
455
+ attrs=cdf_attrs.get_variable_attributes(
456
+ "energy_h_label", check_schema=False
457
+ ),
458
+ ),
459
+ "energy_he3he4": l1b_dataset["energy_he3he4"],
460
+ "energy_he3he4_label": xr.DataArray(
461
+ l1b_dataset["energy_he3he4"].values.astype(str),
462
+ dims=("energy_he3he4",),
463
+ attrs=cdf_attrs.get_variable_attributes(
464
+ "energy_he3he4_label", check_schema=False
465
+ ),
466
+ ),
467
+ "energy_cno": l1b_dataset["energy_cno"],
468
+ "energy_cno_label": xr.DataArray(
469
+ l1b_dataset["energy_cno"].values.astype(str),
470
+ dims=("energy_cno",),
471
+ attrs=cdf_attrs.get_variable_attributes(
472
+ "energy_cno_label", check_schema=False
473
+ ),
474
+ ),
475
+ "energy_fe": l1b_dataset["energy_fe"],
476
+ "energy_fe_label": xr.DataArray(
477
+ l1b_dataset["energy_fe"].values.astype(str),
478
+ dims=("energy_fe",),
479
+ attrs=cdf_attrs.get_variable_attributes(
480
+ "energy_fe_label", check_schema=False
481
+ ),
482
+ ),
483
+ "epoch": l1b_dataset["epoch"],
484
+ "elevation_angle": xr.DataArray(
485
+ HI_L2_ELEVATION_ANGLE,
486
+ dims=("elevation_angle",),
487
+ attrs=cdf_attrs.get_variable_attributes(
488
+ "elevation_angle", check_schema=False
489
+ ),
490
+ ),
491
+ "elevation_angle_label": xr.DataArray(
492
+ HI_L2_ELEVATION_ANGLE.astype(str),
493
+ dims=("elevation_angle",),
494
+ attrs=cdf_attrs.get_variable_attributes(
495
+ "elevation_angle_label", check_schema=False
496
+ ),
497
+ ),
498
+ },
499
+ attrs=cdf_attrs.get_global_attributes("imap_codice_l2_hi-sectored"),
500
+ )
501
+
502
+ efficiencies_file = dependencies.get_file_paths(
503
+ descriptor="l2-hi-sectored-efficiency"
504
+ )[0]
505
+
506
+ # Calculate sectored intensities
507
+ efficiencies_df = pd.read_csv(efficiencies_file)
508
+ # Similar to hi-omni, each species has different shape.
509
+ # Because of that, we need to loop over each species and calculate
510
+ # sectored intensities separately.
511
+ for species in HI_SECTORED_VARIABLE_NAMES:
512
+ # Efficiencies from dataframe maps to different dimension in L1B data.
513
+ # For example:
514
+ # l1b species 'h' has shape:
515
+ # (epoch, 8, 12, 12) -> (time, energy, spin_sector, inst_az)
516
+ # efficiencies 'h' has shape after reading from CSV:
517
+ # (8, 12) -> (energy, inst_az)
518
+ # NOTE: 12 here maps to last 12 in above l1b dimension.
519
+ # Because of this, it's easier to work with the data in xarray.
520
+ # Xarray automatically aligns dimensions and coordinates, making it easier
521
+ # to work with multi-dimensional data. Thus, we convert the efficiencies
522
+ # to xarray.DataArray with dimensions (energy, inst_az)
523
+ species_data = efficiencies_df[efficiencies_df["species"] == species].values
524
+ species_efficiencies = xr.DataArray(
525
+ species_data[:, 2:].astype(
526
+ float
527
+ ), # Skip first two columns (species, energy_bin)
528
+ dims=(f"energy_{species}", "inst_az"),
529
+ coords=l1b_dataset[[f"energy_{species}", "inst_az"]],
530
+ )
531
+
532
+ # energy_passbands has shape:
533
+ # (8,) -> (energy)
534
+ energy_passbands = xr.DataArray(
535
+ l1b_dataset[f"energy_{species}_minus"]
536
+ + l1b_dataset[f"energy_{species}_plus"],
537
+ dims=(f"energy_{species}",),
538
+ coords=l2_dataset[[f"energy_{species}"]],
539
+ name="passband",
540
+ )
541
+
542
+ sectored_intensities = l1b_dataset[species] / (
543
+ L2_GEOMETRIC_FACTOR * species_efficiencies * energy_passbands
544
+ )
545
+
546
+ # Replace existing species data with omni-directional intensities
547
+ l2_dataset[species] = xr.DataArray(
548
+ sectored_intensities.data,
549
+ dims=("epoch", f"energy_{species}", "spin_sector", "elevation_angle"),
550
+ attrs=cdf_attrs.get_variable_attributes(species, check_schema=False),
551
+ )
552
+
553
+ # Calculate spin angle
554
+ # Formula:
555
+ # θ_(k,n) = (θ_(k,0)+30°* n) mod 360°
556
+ # where
557
+ # n is size of L2_HI_SECTORED_ANGLE, 0 to 11,
558
+ # k is size of inst_az from l1b, 0 to 11,
559
+ # Calculate spin angle by adding a base angle from L2_HI_SECTORED_ANGLE
560
+ # for each SSD index and then adding multiple of 30 degrees for each elevation.
561
+ # Then mod by 360 to keep it within 0-360 range.
562
+ elevation_angles = np.arange(len(l2_dataset["elevation_angle"].values)) * 30.0
563
+ spin_angles = (L2_HI_SECTORED_ANGLE[:, np.newaxis] + elevation_angles) % 360.0
564
+
565
+ # Add spin angle variable using the new elevation_angle dimension
566
+ l2_dataset["spin_angles"] = (("spin_sector", "elevation_angle"), spin_angles)
567
+ l2_dataset["spin_angles"].attrs = cdf_attrs.get_variable_attributes(
568
+ "spin_angles", check_schema=False
569
+ )
570
+
571
+ # Now carry over other variables from L1B to L2 dataset
572
+ for variable in l1b_dataset.data_vars:
573
+ if variable.startswith("epoch_") and variable != "epoch":
574
+ # get attrs with just that name
575
+ l2_dataset[variable] = xr.DataArray(
576
+ l1b_dataset[variable].data,
577
+ dims=("epoch",),
578
+ attrs=cdf_attrs.get_variable_attributes(variable, check_schema=False),
579
+ )
580
+ elif variable.startswith("energy_"):
581
+ l2_dataset[variable] = xr.DataArray(
582
+ l1b_dataset[variable].data,
583
+ dims=(f"energy_{variable.split('_')[1]}",),
584
+ attrs=cdf_attrs.get_variable_attributes(variable, check_schema=False),
585
+ )
586
+ elif variable.startswith("unc_"):
587
+ l2_dataset[variable] = xr.DataArray(
588
+ l1b_dataset[variable].data,
589
+ dims=(
590
+ "epoch",
591
+ f"energy_{variable.split('_')[1]}",
592
+ "spin_sector",
593
+ "elevation_angle",
594
+ ),
595
+ attrs=cdf_attrs.get_variable_attributes(variable),
596
+ )
597
+ elif variable == "data_quality":
598
+ l2_dataset[variable] = l1b_dataset[variable]
599
+ l2_dataset[variable].attrs.update(
600
+ cdf_attrs.get_variable_attributes(variable, check_schema=False)
601
+ )
602
+
603
+ l2_dataset["epoch"].attrs.update(
604
+ cdf_attrs.get_variable_attributes("epoch", check_schema=False)
605
+ )
606
+ return l2_dataset
607
+
608
+
609
+ def process_codice_l2(
610
+ descriptor: str, dependencies: ProcessingInputCollection
611
+ ) -> xr.Dataset:
612
+ """
613
+ Will process CoDICE l1 data to create l2 data products.
614
+
615
+ Parameters
616
+ ----------
617
+ descriptor : str
618
+ The descriptor for the CoDICE L1 file to process.
619
+ dependencies : ProcessingInputCollection
620
+ Collection of processing inputs such as ancillary data files.
621
+
622
+ Returns
623
+ -------
624
+ l2_dataset : xarray.Dataset
625
+ The``xarray`` dataset containing the science data and supporting metadata.
626
+ """
627
+ # This should get science files since ancillary or spice doesn't have data_type
628
+ # as data level.
629
+ file_path = dependencies.get_file_paths(descriptor=descriptor)[0]
630
+
631
+ # Now form product name from descriptor
632
+ descriptor = ScienceFilePath(file_path).descriptor
633
+ dataset_name = f"imap_codice_l2_{descriptor}"
58
634
 
59
635
  # TODO: update list of datasets that need geometric factors (if needed)
60
636
  # Compute geometric factors needed for intensity calculations
@@ -62,7 +638,46 @@ def process_codice_l2(file_path: Path) -> xr.Dataset:
62
638
  "imap_codice_l2_lo-sw-species",
63
639
  "imap_codice_l2_lo-nsw-species",
64
640
  ]:
65
- geometric_factors = compute_geometric_factors(l2_dataset)
641
+ l2_dataset = load_cdf(file_path).copy()
642
+
643
+ geometric_factor_lookup = get_geometric_factor_lut(dependencies)
644
+ efficiency_lookup = get_efficiency_lut(dependencies)
645
+ geometric_factors = compute_geometric_factors(
646
+ l2_dataset, geometric_factor_lookup
647
+ )
648
+ if dataset_name == "imap_codice_l2_lo-sw-species":
649
+ # Filter the efficiency lookup table for solar wind efficiencies
650
+ efficiencies = efficiency_lookup[efficiency_lookup["product"] == "sw"]
651
+ # Calculate the pickup ion sunward solar wind intensities using equation
652
+ # described in section 11.2.4 of algorithm document.
653
+ process_lo_species_intensity(
654
+ l2_dataset,
655
+ LO_SW_PICKUP_ION_SPECIES_VARIABLE_NAMES,
656
+ geometric_factors,
657
+ efficiencies,
658
+ PUI_POSITIONS,
659
+ )
660
+ # Calculate the sunward solar wind species intensities using equation
661
+ # described in section 11.2.4 of algorithm document.
662
+ process_lo_species_intensity(
663
+ l2_dataset,
664
+ LO_SW_SPECIES_VARIABLE_NAMES,
665
+ geometric_factors,
666
+ efficiencies,
667
+ SW_POSITIONS,
668
+ )
669
+ else:
670
+ # Filter the efficiency lookup table for non solar wind efficiencies
671
+ efficiencies = efficiency_lookup[efficiency_lookup["product"] == "nsw"]
672
+ # Calculate the non-sunward species intensities using equation
673
+ # described in section 11.2.4 of algorithm document.
674
+ process_lo_species_intensity(
675
+ l2_dataset,
676
+ LO_NSW_SPECIES_VARIABLE_NAMES,
677
+ geometric_factors,
678
+ efficiencies,
679
+ NSW_POSITIONS,
680
+ )
66
681
 
67
682
  if dataset_name in [
68
683
  "imap_codice_l2_hi-counters-singles",
@@ -91,13 +706,13 @@ def process_codice_l2(file_path: Path) -> xr.Dataset:
91
706
  elif dataset_name == "imap_codice_l2_hi-sectored":
92
707
  # Convert the sectored count rates using equation described in section
93
708
  # 11.1.3 of algorithm document.
94
- pass
709
+ l2_dataset = process_hi_sectored(dependencies)
95
710
 
96
711
  elif dataset_name == "imap_codice_l2_hi-omni":
97
712
  # Calculate the omni-directional intensity for each species using
98
713
  # equation described in section 11.1.4 of algorithm document
99
714
  # hopefully this can also apply to hi-ialirt
100
- pass
715
+ l2_dataset = process_hi_omni(dependencies)
101
716
 
102
717
  elif dataset_name == "imap_codice_l2_lo-direct-events":
103
718
  # Convert the following data variables to physical units using
@@ -122,24 +737,7 @@ def process_codice_l2(file_path: Path) -> xr.Dataset:
122
737
  # in section 11.2.3 of algorithm document.
123
738
  pass
124
739
 
125
- elif dataset_name == "imap_codice_l2_lo-sw-species":
126
- # Calculate the sunward solar wind species intensities using equation
127
- # described in section 11.2.4 of algorithm document.
128
- # Calculate the pickup ion sunward solar wind intensities using equation
129
- # described in section 11.2.4 of algorithm document.
130
- # Hopefully this can also apply to lo-ialirt
131
- # TODO: WIP - needs to be completed
132
- l2_dataset = process_lo_sw_species(l2_dataset, geometric_factors)
133
- pass
134
-
135
- elif dataset_name == "imap_codice_l2_lo-nsw-species":
136
- # Calculate the non-sunward solar wind species intensities using
137
- # equation described in section 11.2.4 of algorithm document.
138
- # Calculate the pickup ion non-sunward solar wind intensities using
139
- # equation described in section 11.2.4 of algorithm document.
140
- pass
141
-
142
- logger.info(f"\nFinal data product:\n{l2_dataset}\n")
740
+ # logger.info(f"\nFinal data product:\n{l2_dataset}\n")
143
741
 
144
742
  return l2_dataset
145
743
 
@@ -191,88 +789,3 @@ def add_dataset_attributes(
191
789
  f"attribute manager."
192
790
  )
193
791
  return dataset
194
-
195
-
196
- def compute_geometric_factors(dataset: xr.Dataset) -> np.ndarray:
197
- """
198
- Calculate geometric factors needed for intensity calculations.
199
-
200
- Geometric factors are determined by comparing the half-spin values per
201
- esa_step in the HALF_SPIN_LUT to the rgfo_half_spin values in the provided
202
- L2 dataset.
203
-
204
- If the half-spin value is less than the corresponding rgfo_half_spin value,
205
- the geometric factor is set to 0.75 (full mode); otherwise, it is set to 0.5
206
- (reduced mode).
207
-
208
- NOTE: Half spin values are associated with ESA steps which corresponds to the
209
- index of the energy_per_charge dimension that is between 0 and 127.
210
-
211
- Parameters
212
- ----------
213
- dataset : xarray.Dataset
214
- The L2 dataset containing rgfo_half_spin data variable.
215
-
216
- Returns
217
- -------
218
- geometric_factors : np.ndarray
219
- A 2D array of geometric factors with shape (epoch, esa_steps).
220
- """
221
- # Convert the HALF_SPIN_LUT to a reverse mapping of esa_step to half_spin
222
- esa_step_to_half_spin_map = {
223
- val: key for key, vals in HALF_SPIN_LUT.items() for val in vals
224
- }
225
-
226
- # Create a list of half_spin values corresponding to ESA steps (0 to 127)
227
- half_spin_values = np.array(
228
- [esa_step_to_half_spin_map[step] for step in range(128)]
229
- )
230
-
231
- # Expand dimensions to compare each rgfo_half_spin value against
232
- # all half_spin_values
233
- rgfo_half_spin = dataset.rgfo_half_spin.data[:, np.newaxis] # Shape: (epoch, 1)
234
-
235
- # Perform the comparison and calculate geometric factors
236
- geometric_factors = np.where(half_spin_values < rgfo_half_spin, 0.75, 0.5)
237
-
238
- return geometric_factors
239
-
240
-
241
- def process_lo_sw_species(
242
- dataset: xr.Dataset, geometric_factors: np.ndarray
243
- ) -> xr.Dataset:
244
- """
245
- Process the lo-sw-species L2 dataset to calculate species intensities.
246
-
247
- Parameters
248
- ----------
249
- dataset : xarray.Dataset
250
- The L2 dataset to process.
251
- geometric_factors : np.ndarray
252
- The geometric factors array with shape (epoch, esa_steps).
253
-
254
- Returns
255
- -------
256
- xarray.Dataset
257
- The updated L2 dataset with species intensities calculated.
258
- """
259
- # TODO: WIP - implement intensity calculations
260
- # valid_solar_wind_vars = [
261
- # "hplus",
262
- # "heplusplus",
263
- # "cplus4",
264
- # "cplus5",
265
- # "cplus6",
266
- # "oplus5",
267
- # "oplus6",
268
- # "oplus7",
269
- # "oplus8",
270
- # "ne",
271
- # "mg",
272
- # "si",
273
- # "fe_loq",
274
- # "fe_hiq",
275
- # ]
276
- # valid_pick_up_ion_vars = ["heplus", "cnoplus"]
277
-
278
- return dataset