imap-processing 0.8.0-py3-none-any.whl → 0.9.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.
Files changed (99)
  1. imap_processing/_version.py +2 -2
  2. imap_processing/ccsds/excel_to_xtce.py +2 -0
  3. imap_processing/cdf/config/imap_hi_variable_attrs.yaml +100 -1
  4. imap_processing/cdf/config/imap_hit_global_cdf_attrs.yaml +14 -0
  5. imap_processing/cdf/config/imap_hit_l1a_variable_attrs.yaml +63 -1
  6. imap_processing/cdf/config/imap_idex_global_cdf_attrs.yaml +7 -0
  7. imap_processing/cdf/config/imap_idex_l1a_variable_attrs.yaml +574 -231
  8. imap_processing/cdf/config/imap_idex_l1b_variable_attrs.yaml +326 -0
  9. imap_processing/cdf/config/imap_lo_l1a_variable_attrs.yaml +33 -23
  10. imap_processing/cdf/config/imap_ultra_l1b_variable_attrs.yaml +7 -4
  11. imap_processing/cdf/utils.py +3 -5
  12. imap_processing/cli.py +13 -4
  13. imap_processing/codice/codice_l1a.py +5 -5
  14. imap_processing/codice/constants.py +9 -9
  15. imap_processing/codice/decompress.py +6 -2
  16. imap_processing/glows/l1a/glows_l1a.py +1 -2
  17. imap_processing/hi/l1a/hi_l1a.py +4 -4
  18. imap_processing/hi/l1a/histogram.py +106 -108
  19. imap_processing/hi/l1a/science_direct_event.py +91 -224
  20. imap_processing/hi/packet_definitions/TLM_HI_COMBINED_SCI.xml +3994 -0
  21. imap_processing/hit/l0/constants.py +2 -2
  22. imap_processing/hit/l0/decom_hit.py +12 -101
  23. imap_processing/hit/l1a/hit_l1a.py +164 -23
  24. imap_processing/ialirt/l0/process_codicelo.py +153 -0
  25. imap_processing/ialirt/l0/process_hit.py +5 -5
  26. imap_processing/ialirt/packet_definitions/ialirt_codicelo.xml +281 -0
  27. imap_processing/ialirt/process_ephemeris.py +212 -0
  28. imap_processing/idex/idex_l1a.py +55 -75
  29. imap_processing/idex/idex_l1b.py +192 -0
  30. imap_processing/idex/idex_variable_unpacking_and_eu_conversion.csv +33 -0
  31. imap_processing/idex/packet_definitions/idex_packet_definition.xml +97 -595
  32. imap_processing/lo/l0/decompression_tables/decompression_tables.py +16 -0
  33. imap_processing/lo/l0/lo_science.py +44 -12
  34. imap_processing/lo/l1a/lo_l1a.py +76 -8
  35. imap_processing/lo/packet_definitions/lo_xtce.xml +9877 -87
  36. imap_processing/mag/l1a/mag_l1a.py +1 -2
  37. imap_processing/mag/l1a/mag_l1a_data.py +1 -2
  38. imap_processing/mag/l1b/mag_l1b.py +2 -1
  39. imap_processing/spice/geometry.py +37 -19
  40. imap_processing/spice/time.py +144 -2
  41. imap_processing/swapi/l1/swapi_l1.py +3 -3
  42. imap_processing/swapi/packet_definitions/swapi_packet_definition.xml +1535 -446
  43. imap_processing/swe/l2/swe_l2.py +134 -17
  44. imap_processing/tests/ccsds/test_data/expected_output.xml +1 -1
  45. imap_processing/tests/codice/test_codice_l1a.py +8 -8
  46. imap_processing/tests/codice/test_decompress.py +4 -4
  47. imap_processing/tests/conftest.py +46 -43
  48. imap_processing/tests/hi/test_data/l0/H90_NHK_20241104.bin +0 -0
  49. imap_processing/tests/hi/test_data/l0/H90_sci_cnt_20241104.bin +0 -0
  50. imap_processing/tests/hi/test_data/l0/H90_sci_de_20241104.bin +0 -0
  51. imap_processing/tests/hi/test_hi_l1b.py +2 -2
  52. imap_processing/tests/hi/test_l1a.py +31 -58
  53. imap_processing/tests/hi/test_science_direct_event.py +58 -0
  54. imap_processing/tests/hit/test_data/sci_sample1.ccsds +0 -0
  55. imap_processing/tests/hit/test_decom_hit.py +60 -50
  56. imap_processing/tests/hit/test_hit_l1a.py +327 -12
  57. imap_processing/tests/hit/test_hit_l1b.py +76 -0
  58. imap_processing/tests/hit/validation_data/hskp_sample_eu.csv +89 -0
  59. imap_processing/tests/hit/validation_data/sci_sample_raw1.csv +29 -0
  60. imap_processing/tests/ialirt/test_data/l0/apid01152.tlm +0 -0
  61. imap_processing/tests/ialirt/test_data/l0/imap_codice_l1a_lo-ialirt_20241110193700_v0.0.0.cdf +0 -0
  62. imap_processing/tests/ialirt/unit/test_process_codicelo.py +106 -0
  63. imap_processing/tests/ialirt/unit/test_process_ephemeris.py +109 -0
  64. imap_processing/tests/ialirt/unit/test_process_hit.py +9 -6
  65. imap_processing/tests/idex/conftest.py +1 -1
  66. imap_processing/tests/idex/test_idex_l0.py +1 -1
  67. imap_processing/tests/idex/test_idex_l1a.py +7 -1
  68. imap_processing/tests/idex/test_idex_l1b.py +126 -0
  69. imap_processing/tests/lo/test_lo_l1a.py +7 -16
  70. imap_processing/tests/lo/test_lo_science.py +67 -3
  71. imap_processing/tests/lo/test_pkts/imap_lo_l0_raw_20240803_v002.pkts +0 -0
  72. imap_processing/tests/lo/validation_data/Instrument_FM1_T104_R129_20240803_ILO_SCI_DE_dec_DN_with_fills.csv +1999 -0
  73. imap_processing/tests/mag/test_mag_l1b.py +39 -5
  74. imap_processing/tests/spice/test_geometry.py +32 -6
  75. imap_processing/tests/spice/test_time.py +135 -6
  76. imap_processing/tests/swapi/test_swapi_decom.py +75 -69
  77. imap_processing/tests/swapi/test_swapi_l1.py +4 -4
  78. imap_processing/tests/swe/test_swe_l2.py +64 -8
  79. imap_processing/tests/test_utils.py +1 -1
  80. imap_processing/tests/ultra/test_data/l0/ultra45_raw_sc_ultrarawimg_withFSWcalcs_FM45_40P_Phi28p5_BeamCal_LinearScan_phi2850_theta-000_20240207T102740.csv +3314 -3314
  81. imap_processing/tests/ultra/unit/test_de.py +8 -3
  82. imap_processing/tests/ultra/unit/test_spatial_utils.py +125 -0
  83. imap_processing/tests/ultra/unit/test_ultra_l1b_extended.py +39 -29
  84. imap_processing/tests/ultra/unit/test_ultra_l1c_pset_bins.py +2 -25
  85. imap_processing/ultra/constants.py +4 -0
  86. imap_processing/ultra/l1b/de.py +8 -14
  87. imap_processing/ultra/l1b/ultra_l1b_extended.py +29 -70
  88. imap_processing/ultra/l1c/ultra_l1c_pset_bins.py +1 -36
  89. imap_processing/ultra/utils/spatial_utils.py +221 -0
  90. {imap_processing-0.8.0.dist-info → imap_processing-0.9.0.dist-info}/METADATA +1 -1
  91. {imap_processing-0.8.0.dist-info → imap_processing-0.9.0.dist-info}/RECORD +94 -76
  92. imap_processing/hi/l0/__init__.py +0 -0
  93. imap_processing/hi/l0/decom_hi.py +0 -24
  94. imap_processing/hi/packet_definitions/hi_packet_definition.xml +0 -482
  95. imap_processing/tests/hi/test_decom.py +0 -55
  96. imap_processing/tests/hi/test_l1a_sci_de.py +0 -72
  97. {imap_processing-0.8.0.dist-info → imap_processing-0.9.0.dist-info}/LICENSE +0 -0
  98. {imap_processing-0.8.0.dist-info → imap_processing-0.9.0.dist-info}/WHEEL +0 -0
  99. {imap_processing-0.8.0.dist-info → imap_processing-0.9.0.dist-info}/entry_points.txt +0 -0
@@ -15,7 +15,6 @@ from imap_processing.hit.l0.decom_hit import (
      is_sequential,
      parse_count_rates,
      parse_data,
-     subcom_sectorates,
      update_ccsds_header_dims,
  )
  from imap_processing.utils import packet_file_to_datasets
@@ -201,45 +200,6 @@ def test_assemble_science_frames(sci_dataset):
      assert "pha_raw" in updated_dataset


- def test_subcom_sectorates(sci_dataset):
-     """Test the subcom_sectorates function.
-
-     This function organizes the sector rates data
-     into new variables for each species and adds
-     them to the dataset.
-     """
-
-     # Prepare the input needed for the function to be called
-     sci_dataset = update_ccsds_header_dims(sci_dataset)
-     sci_dataset = assemble_science_frames(sci_dataset)
-     parse_count_rates(sci_dataset)
-
-     # Call the function to be tested
-     subcom_sectorates(sci_dataset)
-
-     # Check if the dataset has the expected new variables
-     for species in ["H", "4He", "CNO", "NeMgSi", "Fe"]:
-         assert species in sci_dataset
-         assert f"{species}_energy_min" in sci_dataset
-         assert f"{species}_energy_max" in sci_dataset
-
-     # Check the shape of the new variables
-     for species in ["H", "4He", "CNO", "NeMgSi", "Fe"]:
-         if species == "H":
-             assert sci_dataset[species].shape == (86, 3, 8, 15)
-             assert sci_dataset[f"{species}_energy_min"].shape == (3,)
-         elif species in ("4He", "CNO", "NeMgSi"):
-             assert sci_dataset[species].shape == (86, 2, 8, 15)
-             assert sci_dataset[f"{species}_energy_min"].shape == (2,)
-         elif species == "Fe":
-             assert sci_dataset[species].shape == (86, 1, 8, 15)
-             assert sci_dataset[f"{species}_energy_min"].shape == (1,)
-         assert (
-             sci_dataset[f"{species}_energy_max"].shape
-             == sci_dataset[f"{species}_energy_min"].shape
-         )
-
-
  @pytest.mark.parametrize(
      "packed, expected",
      [
@@ -266,14 +226,64 @@ def test_decom_hit(sci_dataset):
      This function orchestrates the unpacking and decompression
      of the HIT science data.
      """
-     # TODO: complete this test once the function is complete
      updated_dataset = decom_hit(sci_dataset)
-     # Check if the dataset has the expected new variables
-     # Check that binary science data exists
-     assert "count_rates_raw" in updated_dataset
-     assert "pha_raw" in updated_dataset
-     # Check that sector rates data has been organized
-     for species in ["H", "4He", "CNO", "NeMgSi", "Fe"]:
-         assert species in updated_dataset
-         assert f"{species}_energy_min" in updated_dataset
-         assert f"{species}_energy_max" in updated_dataset
+     # Check if the dataset has the expected data variables
+     sci_fields = [
+         "version",
+         "type",
+         "sec_hdr_flg",
+         "pkt_apid",
+         "seq_flgs",
+         "src_seq_ctr",
+         "pkt_len",
+         "pha_raw",
+         "hdr_unit_num",
+         "hdr_frame_version",
+         "hdr_dynamic_threshold_state",
+         "hdr_leak_conv",
+         "hdr_heater_duty_cycle",
+         "hdr_code_ok",
+         "hdr_minute_cnt",
+         "livetime",
+         "num_trig",
+         "num_reject",
+         "num_acc_w_pha",
+         "num_acc_no_pha",
+         "num_haz_trig",
+         "num_haz_reject",
+         "num_haz_acc_w_pha",
+         "num_haz_acc_no_pha",
+         "sngrates",
+         "nread",
+         "nhazard",
+         "nadcstim",
+         "nodd",
+         "noddfix",
+         "nmulti",
+         "nmultifix",
+         "nbadtraj",
+         "nl2",
+         "nl3",
+         "nl4",
+         "npen",
+         "nformat",
+         "naside",
+         "nbside",
+         "nerror",
+         "nbadtags",
+         "coinrates",
+         "bufrates",
+         "l2fgrates",
+         "l2bgrates",
+         "l3fgrates",
+         "l3bgrates",
+         "penfgrates",
+         "penbgrates",
+         "ialirtrates",
+         "sectorates",
+         "l4fgrates",
+         "l4bgrates",
+     ]
+
+     for field in sci_fields:
+         assert field in updated_dataset
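The hunk above pins down the full set of variables that decom_hit is expected to decommutate from the HIT science APID. For orientation, the new tests later in this diff drive it roughly like this (a minimal sketch stitched together from the imports and calls they use; the .ccsds path is a bundled test fixture, not a public interface):

# Sketch of the decom_hit flow exercised by the updated tests.
# get_datasets_by_apid and decom_hit are imported exactly as in the
# rewritten tests/hit/test_hit_l1a.py below; nothing here is new API.
from imap_processing import imap_module_directory
from imap_processing.hit.hit_utils import HitAPID, get_datasets_by_apid
from imap_processing.hit.l1a.hit_l1a import decom_hit

sci_file = imap_module_directory / "tests/hit/test_data/sci_sample1.ccsds"

# One xarray dataset per APID; select the science APID, then unpack
# and decompress it into the variables listed in sci_fields above.
sci_dataset = get_datasets_by_apid(sci_file)[HitAPID.HIT_SCIENCE]
sci_dataset = decom_hit(sci_dataset)
assert "sectorates" in sci_dataset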
@@ -1,29 +1,344 @@
+ import numpy as np
+ import pandas as pd
  import pytest
  import xarray as xr

  from imap_processing import imap_module_directory
- from imap_processing.hit.l1a.hit_l1a import hit_l1a
+ from imap_processing.hit.hit_utils import (
+     HitAPID,
+     get_datasets_by_apid,
+ )
+ from imap_processing.hit.l1a.hit_l1a import decom_hit, hit_l1a, subcom_sectorates
+
+ # TODO: Packet files are per apid at the moment so the tests currently
+ # reflect this. Eventually, HIT will provide a packet file with all apids
+ # and the tests will need to be updated.


  @pytest.fixture(scope="module")
- def packet_filepath():
+ def hk_packet_filepath():
      """Set path to test data file"""
      return (
          imap_module_directory / "tests/hit/test_data/imap_hit_l0_raw_20100105_v001.pkts"
      )


- def test_hit_l1a(packet_filepath):
-     """Create L1A datasets from a packet file.
+ @pytest.fixture(scope="module")
+ def sci_packet_filepath():
+     """Set path to test data file"""
+     return imap_module_directory / "tests/hit/test_data/sci_sample1.ccsds"
+
+
+ def test_validate_l1a_housekeeping_data(hk_packet_filepath):
+     """Validate the housekeeping dataset created by the L1A processing.
+
+     Compares the processed housekeeping data with expected values from
+     a validation csv file.
+
+     Parameters
+     ----------
+     hk_packet_filepath : str
+         File path to housekeeping ccsds file
+     """
+     datasets = hit_l1a(hk_packet_filepath, "001")
+     hk_dataset = None
+     for dataset in datasets:
+         if dataset.attrs["Logical_source"] == "imap_hit_l1a_hk":
+             hk_dataset = dataset
+
+     # Load the validation data
+     validation_file = (
+         imap_module_directory / "tests/hit/validation_data/hskp_sample_raw.csv"
+     )
+     validation_data = pd.read_csv(validation_file)
+     validation_data.columns = validation_data.columns.str.lower()
+
+     # Get a list of leak columns in ascending order
+     # (LEAK_I_00, LEAK_I_01, ..., LEAK_I_63)
+     # and group values into a single column
+     leak_columns = [col for col in validation_data.columns if col.startswith("leak")][
+         ::-1
+     ]
+     validation_data["leak_i"] = validation_data[leak_columns].apply(
+         lambda row: row.values, axis=1
+     )
+     validation_data.drop(columns=leak_columns, inplace=True)
+
+     # Define the keys that should have dropped from the housekeeping dataset
+     dropped_fields = {
+         "pkt_apid",
+         "sc_tick",
+         "version",
+         "type",
+         "sec_hdr_flg",
+         "seq_flgs",
+         "src_seq_ctr",
+         "pkt_len",
+         "hskp_spare1",
+         "hskp_spare2",
+         "hskp_spare3",
+         "hskp_spare4",
+         "hskp_spare5",
+     }
+
+     # Define the keys that should be ignored in the validation
+     # like ccsds headers
+     ignore_validation_fields = {
+         "ccsds_version",
+         "ccsds_type",
+         "ccsds_sec_hdr_flag",
+         "ccsds_appid",
+         "ccsds_grp_flag",
+         "ccsds_seq_cnt",
+         "ccsds_length",
+         "shcoarse",
+     }
+
+     # Check that dropped variables are not in the dataset
+     assert set(dropped_fields).isdisjoint(set(hk_dataset.data_vars.keys()))
+
+     # Compare the housekeeping dataset with the expected validation data
+     for field in validation_data.columns:
+         if field not in ignore_validation_fields:
+             assert field in hk_dataset.data_vars.keys()
+             for pkt in range(validation_data.shape[0]):
+                 assert np.array_equal(
+                     hk_dataset[field][pkt].data, validation_data[field][pkt]
+                 )
+
+
+ def test_subcom_sectorates(sci_packet_filepath):
+     """Test the subcom_sectorates function.
+
+     This function organizes the sector rates data
+     by species and adds the data as new variables
+     to the dataset.
+     """
+
+     # Unpack and decompress ccsds file to xarray datasets
+     sci_dataset = get_datasets_by_apid(sci_packet_filepath)[HitAPID.HIT_SCIENCE]
+     sci_dataset = decom_hit(sci_dataset)
+
+     # Call the function to be tested
+     subcom_sectorates(sci_dataset)
+
+     # Number of science frames in the dataset
+     frames = sci_dataset["epoch"].shape[0]
+
+     # Check if the dataset has the expected new variables
+     for species in ["h", "he4", "cno", "nemgsi", "fe"]:
+         assert f"{species}_counts_sectored" in sci_dataset
+         assert f"{species}_energy_min" in sci_dataset
+         assert f"{species}_energy_max" in sci_dataset
+
+         # Check the shape of the new data variables
+         if species == "h":
+             assert sci_dataset[f"{species}_counts_sectored"].shape == (frames, 3, 8, 15)
+             assert sci_dataset[f"{species}_energy_min"].shape == (3,)
+         elif species in ("he4", "cno", "nemgsi"):
+             assert sci_dataset[f"{species}_counts_sectored"].shape == (frames, 2, 8, 15)
+             assert sci_dataset[f"{species}_energy_min"].shape == (2,)
+         elif species == "fe":
+             assert sci_dataset[f"{species}_counts_sectored"].shape == (frames, 1, 8, 15)
+             assert sci_dataset[f"{species}_energy_min"].shape == (1,)
+         assert (
+             sci_dataset[f"{species}_energy_max"].shape
+             == sci_dataset[f"{species}_energy_min"].shape
+         )
+
+
+ def test_validate_l1a_counts_data(sci_packet_filepath):
+     """Compare the output of the L1A processing to the validation data.
+
+     This test compares the counts data product with the validation data.
+     The PHA data product is not validated since it's not being decommutated.
+
+     Parameters
+     ----------
+     sci_packet_filepath : str
+         Path to ccsds file for science data
+     """
+     # Process the sample data
+     processed_datasets = hit_l1a(sci_packet_filepath, "001")
+     l1a_counts_data = processed_datasets[0]
+
+     # Read in the validation data
+     validation_data = pd.read_csv(
+         imap_module_directory / "tests/hit/validation_data/sci_sample_raw1.csv"
+     )
+
+     # Helper functions for this test
+     def consolidate_rate_columns(data, rate_columns):
+         # The validation data isn't organized by arrays.
+         # Each value is in a separate column.
+         # Aggregate related data into arrays.
+         for new_col, prefix in rate_columns.items():
+             columns = [col for col in data.columns if prefix in col]
+             data[new_col] = data[columns].apply(lambda row: row.values, axis=1)
+             if new_col == "sectorates":
+                 # Differentiate between the sectorate columns with three digits
+                 # in the name and those with an extra digit appended. The
+                 # three-digit columns contain the sectorate values for the
+                 # science frame; the columns with the extra digit carry the
+                 # mod value, which determines the species and energy range
+                 # for that science frame.
+                 sectorates_three_digits = data.filter(
+                     regex=r"^SECTORATES_\d{3}$"
+                 ).columns
+                 sectorates_five_digits = data.filter(
+                     regex=r"^SECTORATES_\d{3}_\d{1}$"
+                 ).columns
+                 data["sectorates"] = data[sectorates_three_digits].apply(
+                     lambda row: row.values.reshape(8, 15), axis=1
+                 )
+                 data["sectorates_by_mod_val"] = data[sectorates_five_digits].apply(
+                     lambda row: row.values, axis=1
+                 )
+             data.drop(columns=columns, inplace=True)
+         return data
+
+     def process_single_rates(data):
+         # Combine the single rates for high and low gain into a 2D array
+         data["sngrates"] = data.apply(
+             lambda row: np.array([row["sngrates_hg"], row["sngrates_lg"]]), axis=1
+         )
+         data.drop(columns=["sngrates_hg", "sngrates_lg"], inplace=True)
+         return data
+
+     def process_sectorates(data):
+         # Add species and energy index to the data frame for each science frame.
+         # First find the mod value for each science frame, which equals the first
+         # index in the sectorates_by_mod_val array that has a value instead of a
+         # blank space.
+         data["mod_10"] = data["sectorates_by_mod_val"].apply(
+             lambda row: next((i for i, value in enumerate(row) if value != " "), None)
+         )
+         # Mapping of mod value to species and energy index
+         species_energy = {
+             0: {"species": "H", "energy_idx": 0},
+             1: {"species": "H", "energy_idx": 1},
+             2: {"species": "H", "energy_idx": 2},
+             3: {"species": "He4", "energy_idx": 0},
+             4: {"species": "He4", "energy_idx": 1},
+             5: {"species": "CNO", "energy_idx": 0},
+             6: {"species": "CNO", "energy_idx": 1},
+             7: {"species": "NeMgSi", "energy_idx": 0},
+             8: {"species": "NeMgSi", "energy_idx": 1},
+             9: {"species": "Fe", "energy_idx": 0},
+         }
+         # Use the mod 10 value to determine the species and energy index
+         # for each science frame and add this information to the data frame
+         data["species"] = data["mod_10"].apply(
+             lambda row: species_energy[row]["species"].lower()
+             if row is not None
+             else None
+         )
+         data["energy_idx"] = data["mod_10"].apply(
+             lambda row: species_energy[row]["energy_idx"] if row is not None else None
+         )
+         data.drop(columns=["sectorates_by_mod_val", "mod_10"], inplace=True)
+         return data
+
+     def compare_data(expected_data, actual_data, skip):
+         # Compare the processed data to the validation data
+         for field in expected_data.columns:
+             if field not in [
+                 "sc_tick",
+                 "hdr_status_bits",
+                 "species",
+                 "energy_idx",
+             ]:
+                 assert field in actual_data.data_vars.keys()
+             if field not in skip:
+                 for frame in range(expected_data.shape[0]):
+                     if field == "species":
+                         species = expected_data[field][frame]
+                         energy_idx = expected_data["energy_idx"][frame]
+                         assert np.array_equal(
+                             actual_data[f"{species}_counts_sectored"][frame][
+                                 energy_idx
+                             ].data,
+                             expected_data["sectorates"][frame],
+                         )
+                     else:
+                         assert np.array_equal(
+                             actual_data[field][frame].data, expected_data[field][frame]
+                         )
+
+     rate_columns = {
+         "coinrates": "COINRATES_",
+         "bufrates": "BUFRATES_",
+         "l2fgrates": "L2FGRATES_",
+         "l2bgrates": "L2BGRATES_",
+         "l3fgrates": "L3FGRATES_",
+         "l3bgrates": "L3BGRATES_",
+         "penfgrates": "PENFGRATES_",
+         "penbgrates": "PENBGRATES_",
+         "sectorates": "SECTORATES_",
+         "l4fgrates": "L4FGRATES_",
+         "l4bgrates": "L4BGRATES_",
+         "ialirtrates": "IALIRTRATES_",
+         "sngrates_hg": "SNGRATES_HG_",
+         "sngrates_lg": "SNGRATES_LG_",
+     }
+
+     # Prepare validation data for comparison with processed data
+     validation_data.columns = validation_data.columns.str.strip()
+     validation_data = consolidate_rate_columns(validation_data, rate_columns)
+     validation_data = process_single_rates(validation_data)
+     validation_data = process_sectorates(validation_data)
+
+     # Fields to skip in the comparison: CCSDS headers plus a few others that
+     # are not relevant. The CCSDS header fields contain data per packet in the
+     # dataset, but the validation data has a value per science frame, so skip
+     # the comparison for now.
+     ignore = [
+         "version",
+         "type",
+         "sec_hdr_flg",
+         "pkt_apid",
+         "seq_flgs",
+         "src_seq_ctr",
+         "pkt_len",
+         "sc_tick",
+         "hdr_status_bits",
+         "energy_idx",
+     ]
+
+     # Compare processed data to validation data
+     validation_data.columns = validation_data.columns.str.lower()
+     compare_data(validation_data, l1a_counts_data, ignore)
+
+     # TODO: add validation for hdr_status_bits once validation data has been updated
+     # to include this field broken out into its subfields
+
+     # TODO: add validation for CCSDS fields? Currently the validation data only has
+     # one value per frame while the processed data has one value per packet.
+
+
+ def test_hit_l1a(hk_packet_filepath, sci_packet_filepath):
+     """Create L1A datasets from packet files.

      Parameters
      ----------
-     packet_filepath : str
-         Path to ccsds file
+     hk_packet_filepath : str
+         Path to ccsds file for housekeeping data
+     sci_packet_filepath : str
+         Path to ccsds file for science data
      """
-     processed_datasets = hit_l1a(packet_filepath, "001")
-     # TODO: update assertions after science data processing is completed
-     assert isinstance(processed_datasets, list)
-     assert len(processed_datasets) == 1
-     assert isinstance(processed_datasets[0], xr.Dataset)
-     assert processed_datasets[0].attrs["Logical_source"] == "imap_hit_l1a_hk"
+     for packet_filepath in [hk_packet_filepath, sci_packet_filepath]:
+         processed_datasets = hit_l1a(packet_filepath, "001")
+         assert isinstance(processed_datasets, list)
+         assert all(isinstance(ds, xr.Dataset) for ds in processed_datasets)
+         if packet_filepath == hk_packet_filepath:
+             assert len(processed_datasets) == 1
+             assert processed_datasets[0].attrs["Logical_source"] == "imap_hit_l1a_hk"
+         else:
+             assert len(processed_datasets) == 2
+             assert (
+                 processed_datasets[0].attrs["Logical_source"]
+                 == "imap_hit_l1a_count-rates"
+             )
+             assert (
+                 processed_datasets[1].attrs["Logical_source"]
+                 == "imap_hit_l1a_pulse-height-events"
+             )
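The subcommutation that process_sectorates reverse-engineers from the validation CSV deserves a worked example: each science frame carries a single 8x15 sector-count grid, and the frame's position in a repeating 10-frame cycle (the mod-10 value) selects which species and energy range that grid belongs to, which is why H ends up with 3 energy rows, He4/CNO/NeMgSi with 2, and Fe with 1. A self-contained sketch of that decode (the mapping table is copied from the test above; the function itself is illustrative, not the packaged subcom_sectorates):

import numpy as np

# Mod-10 slot -> (species, energy index), as tabulated in process_sectorates.
SPECIES_ENERGY = {
    0: ("h", 0), 1: ("h", 1), 2: ("h", 2),
    3: ("he4", 0), 4: ("he4", 1),
    5: ("cno", 0), 6: ("cno", 1),
    7: ("nemgsi", 0), 8: ("nemgsi", 1),
    9: ("fe", 0),
}
# Energy ranges per species (matches the shape asserts in the tests).
N_ENERGY = {"h": 3, "he4": 2, "cno": 2, "nemgsi": 2, "fe": 1}

def subcommutate(sectorates, first_mod10=0):
    """Distribute per-frame 8x15 grids into (n_frames, n_energy, 8, 15) arrays.

    Frames that did not carry a given species/energy slot stay NaN.
    """
    n_frames = sectorates.shape[0]
    out = {
        sp: np.full((n_frames, n_en, 8, 15), np.nan) for sp, n_en in N_ENERGY.items()
    }
    for frame in range(n_frames):
        species, energy_idx = SPECIES_ENERGY[(first_mod10 + frame) % 10]
        out[species][frame, energy_idx] = sectorates[frame]
    return out

# Ten frames cover one full cycle: every slot in the table fires once.
counts = subcommutate(np.arange(10 * 8 * 15).reshape(10, 8, 15))
assert counts["h"].shape == (10, 3, 8, 15)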
@@ -1,3 +1,4 @@
+ import pandas as pd
  import pytest
  import xarray as xr

@@ -165,6 +166,81 @@ def test_hit_l1b_hk_dataset_attributes(hk_dataset):
      assert hk_dataset.coords.keys() == dataset_coords_dims


+ def test_validate_l1b_housekeeping_data(hk_dataset):
+     """Validate the housekeeping dataset created by the L1B processing.
+
+     Parameters
+     ----------
+     hk_dataset : xr.Dataset
+         Housekeeping dataset created by the L1B processing.
+     """
+     # TODO: finish test. HIT will provide an updated validation file to fix issues:
+     # - some fields have strings as values but in the processed data they're integers
+     # - some columns have blank cells where there should be data
+
+     # Load the validation data
+     validation_file = (
+         imap_module_directory / "tests/hit/validation_data/hskp_sample_eu.csv"
+     )
+     validation_data = pd.read_csv(validation_file)
+     validation_data.columns = validation_data.columns.str.lower().str.strip()
+
+     # Get a list of leak columns in ascending order
+     # (LEAK_I_00, LEAK_I_01, ..., LEAK_I_63)
+     # and group values into a single column
+     leak_columns = [
+         col for col in validation_data.columns if col.startswith("leak_i_")
+     ][::-1]
+     validation_data["leak_i"] = validation_data[leak_columns].apply(
+         lambda row: row.values, axis=1
+     )
+     validation_data.drop(columns=leak_columns, inplace=True)
+
+     # Define the keys that should have dropped from the housekeeping dataset
+     dropped_fields = {
+         "pkt_apid",
+         "sc_tick",
+         "version",
+         "type",
+         "sec_hdr_flg",
+         "seq_flgs",
+         "src_seq_ctr",
+         "pkt_len",
+         "hskp_spare1",
+         "hskp_spare2",
+         "hskp_spare3",
+         "hskp_spare4",
+         "hskp_spare5",
+     }
+
+     # Check that dropped variables are not in the dataset
+     assert set(dropped_fields).isdisjoint(set(hk_dataset.data_vars.keys()))
+
+     # TODO: uncomment block after new validation data is provided
+     # Define the keys that should be ignored in the validation
+     # like ccsds headers
+     # ignore_validation_fields = {
+     #     "ccsds_version",
+     #     "ccsds_type",
+     #     "ccsds_sec_hdr_flag",
+     #     "ccsds_appid",
+     #     "ccsds_grp_flag",
+     #     "ccsds_seq_cnt",
+     #     "ccsds_length",
+     #     "sc_tick",
+     # }
+
+     # # Compare the housekeeping dataset with the expected validation data
+     # for field in validation_data.columns:
+     #     if field not in ignore_validation_fields:
+     #         assert field in hk_dataset.data_vars.keys()
+     #         for pkt in range(validation_data.shape[0]):
+     #             assert np.array_equal(
+     #                 hk_dataset[field][pkt].data, validation_data[field][pkt]
+     #             )


  def test_hit_l1b(dependencies):
      """Test creating L1B CDF files
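Both housekeeping validation tests (L1A above and this L1B one) rely on the same pandas idiom: fold the 64 per-channel LEAK_I_NN columns of the CSV into one array-valued leak_i column, so each row can be compared against the dataset's leak_i variable with np.array_equal. In isolation, with a fabricated two-packet, four-channel frame standing in for the validation CSV:

import numpy as np
import pandas as pd

# Stand-in for the validation CSV; the real files carry LEAK_I_00..LEAK_I_63.
# The [::-1] mirrors the tests, which reverse the CSV's column order so the
# channels come out ascending.
validation_data = pd.DataFrame(
    {
        "leak_i_03": [13, 23],
        "leak_i_02": [12, 22],
        "leak_i_01": [11, 21],
        "leak_i_00": [10, 20],
    }
)

# Reverse to ascending channel order, then pack each row into one array.
leak_columns = [c for c in validation_data.columns if c.startswith("leak_i_")][::-1]
validation_data["leak_i"] = validation_data[leak_columns].apply(
    lambda row: row.values, axis=1
)
validation_data.drop(columns=leak_columns, inplace=True)

# Each cell is now a length-4 array, directly comparable per packet, e.g.
# np.array_equal(hk_dataset["leak_i"][pkt].data, validation_data["leak_i"][pkt]).
assert np.array_equal(validation_data["leak_i"][0], [10, 11, 12, 13])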