tmplummer
diff --git a/‎imap_processing/cdf/global_attrs.py‎
Lines changed: 4 additions & 0 deletions b/‎imap_processing/cdf/global_attrs.py‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎imap_processing/cdf/utils.py‎
Lines changed: 52 additions & 3 deletions b/‎imap_processing/cdf/utils.py‎
Lines changed: 52 additions & 3 deletions
diff --git a/‎imap_processing/idex/tests/test_l1_cdfs.py‎
Lines changed: 1 addition & 1 deletion b/‎imap_processing/idex/tests/test_l1_cdfs.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎imap_processing/swe/__init__.py‎
Lines changed: 1 addition & 0 deletions b/‎imap_processing/swe/__init__.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎imap_processing/swe/l1a/swe_l1a.py‎
Lines changed: 43 additions & 13 deletions b/‎imap_processing/swe/l1a/swe_l1a.py‎
Lines changed: 43 additions & 13 deletions
diff --git a/‎imap_processing/swe/l1a/swe_science.py‎
Lines changed: 84 additions & 48 deletions b/‎imap_processing/swe/l1a/swe_science.py‎
Lines changed: 84 additions & 48 deletions
@@ -250,6 +250,7 @@ class ScienceAttrs(AttrBase):
     depend_0: str = None
     depend_1: str = None
     depend_2: str = None
+    depend_3: str = None
     variable_purpose: str = None
     var_notes: str = None
 
@@ -276,6 +277,9 @@ def output(self):
         if self.depend_2 is not None:
             endval["DEPEND_2"] = self.depend_2
 
+        if self.depend_3 is not None:
+            endval["DEPEND_3"] = self.depend_3
+
         if self.variable_purpose is not None:
             endval["VARIABLE_PURPOSE"] = self.variable_purpose
 
 
@@ -5,7 +5,37 @@
 from cdflib.xarray import xarray_to_cdf
 
 
-def write_cdf(data: xr.Dataset, description: str = "", directory: str = ""):
+def calc_start_time(shcoarse_time: int):
+    """Calculate the datetime64 from the CCSDS secondary header information.
+
+    Since all instruments have SHCOARSE or MET seconds, we need to convert
+    them to UTC. Took this from IDEX code.
+
+    Parameters
+    ----------
+    shcoarse_time: int
+        Number of seconds since epoch (nominally the launch time)
+
+    Returns
+    -------
+    np.datetime64
+        The time of the event
+
+    TODO
+    ----
+    This conversion is temporary for now, and will need SPICE in the future.
+    Nick Dutton mentioned that the s/c clock start epoch is
+        2010-01-01T00:01:06.184 ET
+    We will use this for now.
+    """
+    # Get the datetime of Jan 1 2010 as the start date
+    launch_time = np.datetime64("2010-01-01T00:01:06.184")
+    return launch_time + np.timedelta64(shcoarse_time, "s")
+
+
+def write_cdf(
+    data: xr.Dataset, description: str = "", mode: str = "", directory: str = ""
+):
     """Write the contents of "data" to a CDF file using cdflib.xarray_to_cdf.
 
     This function determines the file name to use from the global attributes,
@@ -20,6 +50,7 @@ def write_cdf(data: xr.Dataset, description: str = "", directory: str = ""):
         data (xarray.Dataset): The dataset object to convert to a CDF
         description (str): The description to insert into the file name after the
                             orbit, before the SPICE field.  No underscores allowed.
+        mode (str): Instrument mode
         directory (str): The directory to write the file to
 
     Returns
@@ -29,7 +60,17 @@ def write_cdf(data: xr.Dataset, description: str = "", directory: str = ""):
     """
     # Determine the start date of the data in the file,
     # based on the time of the first dust impact
-    file_start_date = data["Epoch"][0].data
+    file_start_date = None
+    if "idex" in data.attrs["Logical_source"]:
+        file_start_date = data["Epoch"][0].data
+    elif "swe" in data.attrs["Logical_source"]:
+        start_time = data["Epoch"].data[0]
+        file_start_date = calc_start_time(start_time)
+    if file_start_date is None:
+        raise ValueError(
+            "Unable to determine file start date. Check Logical_source value"
+        )
+
     date_string = np.datetime_as_string(file_start_date, unit="D").replace("-", "")
 
     # Determine the optional "description" field
@@ -38,13 +79,21 @@ def write_cdf(data: xr.Dataset, description: str = "", directory: str = ""):
         if (description.startswith("_") or not description)
         else f"_{description}"
     )
+    mode = mode if (mode.startswith("_") or not mode) else f"_{mode}"
 
     # Determine the file name based on the attributes in the xarray
+    # Set file name based on this convention:
+    # imap_<instrument>_<datalevel>_<mode>_<descriptor>_<startdate>_
+    # <version>.cdf
+    # data.attrs["Logical_source"] has the mission, instrument, and level
+    # like this:
+    #   imap_idex_l1
     filename = (
         data.attrs["Logical_source"]
+        + mode
+        + description
         + "_"
         + date_string
-        + description
         + f"_v{data.attrs['Data_version']}.cdf"
     )
     filename_and_path = os.path.join(directory, filename)
 
@@ -77,7 +77,7 @@ def test_descriptor_in_file_name(decom_test_data, temp_path):
     date_to_test = "20250724"
     assert file_name == os.path.join(
         temp_path,
-        f"{decom_test_data.data.attrs['Logical_source']}_{date_to_test}_impact-lab-test001_v{idex.__version__}.cdf",
+        f"{decom_test_data.data.attrs['Logical_source']}_impact-lab-test001_{date_to_test}_v{idex.__version__}.cdf",
     )
     assert Path(file_name).exists()
 
 
@@ -0,0 +1 @@
+__version__ = "01"
@@ -1,10 +1,16 @@
 import logging
 
-from imap_processing.swe.l0 import decom_swe
+from imap_processing.cdf.utils import write_cdf
 from imap_processing.swe.l1a.swe_science import swe_science
+from imap_processing.swe.utils.swe_utils import (
+    SWEAPID,
+    create_dataset,
+    filename_descriptors,
+)
+from imap_processing.utils import group_by_apid, sort_by_time
 
 
-def swe_l1a(packet_file: str):
+def swe_l1a(packets, cdf_filepath):
     """Process SWE l0 data into l1a data.
 
     Receive all L0 data file. Based on appId, it
@@ -13,15 +19,39 @@ def swe_l1a(packet_file: str):
 
     Parameters
     ----------
-    packet_file : str
-        The path and filename to the L0 file to read
+    packets: list
+        Decom data list that contains all appIds
+    cdf_filepath: str
+        Folder path of where to write CDF file
+
+    Returns
+    -------
+    str
+        Path name of where CDF file was created.
+        This is used to upload file from local to s3.
+        TODO: test this later.
     """
-    decom_data = decom_swe.decom_packets(packet_file)
-    logging.info(f"Unpacking data from {packet_file}")
-
-    # If appId is science, then the file should contain all data of science appId
-    if decom_data[0].header["PKT_APID"].raw_value == 1344:
-        logging.info("Processing science data")
-        return swe_science(decom_data=decom_data)
-    else:
-        return decom_data
+    # group data by appId
+    grouped_data = group_by_apid(packets)
+
+    for apid in grouped_data.keys():
+        # If appId is science, then the file should contain all data of science appId
+        if apid == SWEAPID.SWE_SCIENCE:
+            # sort data by acquisition time
+            sorted_packets = sort_by_time(grouped_data[apid], "ACQ_START_COARSE")
+            logging.debug(
+                "Processing science data for [%s] packets", len(sorted_packets)
+            )
+            data = swe_science(decom_data=sorted_packets)
+        else:
+            # If it's not science, we unpack, organize and save it as a dataset.
+            sorted_packets = sort_by_time(grouped_data[apid], "SHCOARSE")
+            data = create_dataset(packets=sorted_packets)
+
+        # write data to CDF
+        return write_cdf(
+            data,
+            mode=f"{data['APP_MODE'].data[0]}" if apid == SWEAPID.SWE_APP_HK else "",
+            description=filename_descriptors.get(apid),
+            directory=cdf_filepath,
+        )
@@ -1,11 +1,18 @@
 import collections
+import dataclasses
 
 import numpy as np
 import xarray as xr
 
+from imap_processing.cdf.global_attrs import ConstantCoordinates
+from imap_processing.swe import swe_cdf_attrs
+from imap_processing.swe.utils.swe_utils import (
+    add_metadata_to_array,
+)
 
-def uncompress_counts(cem_count):
-    """Uncompress counts from the CEMs.
+
+def decompressed_counts(cem_count):
+    """Decompressed counts from the CEMs.
 
     Parameters
     ----------
@@ -15,16 +22,16 @@ def uncompress_counts(cem_count):
     Returns
     -------
     int
-        uncompressed count. Eg. 40959
+        decompressed count. Eg. 40959
     """
     # index is the first four bits of input data
     # multi is the last four bits of input data
     index = cem_count // 16
     multi = cem_count % 16
 
     # This is look up table for the index to get
-    # base and step_size to calculate the uncompressed count.
-    uncompress_table = {
+    # base and step_size to calculate the decompressed count.
+    decompress_table = {
         0: {"base": 0, "step_size": 1},
         1: {"base": 16, "step_size": 1},
         2: {"base": 32, "step_size": 2},
@@ -43,36 +50,18 @@ def uncompress_counts(cem_count):
         15: {"base": 33792, "step_size": 2048},
     }
 
-    # uncompression formula from SWE algorithm document CN102D-D0001 and page 16.
+    # Decompression formula from SWE algorithm document CN102D-D0001, page 16.
     # N = base[index] + multi * step_size[index] + (step_size[index] - 1) / 2
     # NOTE: for (step_size[index] - 1) / 2, we only keep the whole number part of
     # the quotient
 
     return (
-        uncompress_table[index]["base"]
-        + (multi * uncompress_table[index]["step_size"])
-        + ((uncompress_table[index]["step_size"] - 1) // 2)
+        decompress_table[index]["base"]
+        + (multi * decompress_table[index]["step_size"])
+        + ((decompress_table[index]["step_size"] - 1) // 2)
     )
 
 
-def add_metadata_to_array(data_packet, metadata_arrays):
-    """Add metadata to the metadata_arrays.
-
-    Parameters
-    ----------
-    data_packet : space_packet_parser.parser.Packet
-        SWE data packet
-    metadata_arrays : dict
-        metadata arrays
-    """
-    for key, value in data_packet.header.items():
-        metadata_arrays.setdefault(key, []).append(value.raw_value)
-
-    for key, value in data_packet.data.items():
-        if key != "SCIENCE_DATA":
-            metadata_arrays.setdefault(key, []).append(value.raw_value)
-
-
 def swe_science(decom_data):
     """SWE L1a science processing.
 
@@ -116,7 +105,7 @@ def swe_science(decom_data):
 
     # We know we can only have 8 bit numbers input, so iterate over all
     # possibilities once up front
-    decompression_table = np.array([uncompress_counts(i) for i in range(256)])
+    decompression_table = np.array([decompressed_counts(i) for i in range(256)])
 
     for data_packet in decom_data:
         # read raw data
@@ -129,51 +118,98 @@ def swe_science(decom_data):
         # convert bytes to numpy array of uint8
         raw_counts = np.frombuffer(byte_data, dtype=np.uint8)
 
-        # Uncompress counts. Uncompressed data is a list of 1260
-        # where 1260 = 15 seconds x 12 energy steps x 7 CEMs
+        # Decompress counts. Decompressed data holds 1260 values
+        # where 1260 = 180 x 7 CEMs
         # Take the "raw_counts" indices/counts mapping from
         # decompression_table and then reshape the return
-        uncompress_data = np.take(decompression_table, raw_counts).reshape(15, 12, 7)
-        raw_counts = raw_counts.reshape(15, 12, 7)
+        uncompress_data = np.take(decompression_table, raw_counts).reshape(180, 7)
+        # Save raw counts data as well
+        raw_counts = raw_counts.reshape(180, 7)
 
         # Save data with its metadata field to attrs and DataArray of xarray.
-        science_array.append(uncompress_data)
-        raw_science_array.append(raw_counts)
-        add_metadata_to_array(data_packet, metadata_arrays)
+        # Save data as np.int64 to be compliant with ISTP's FILLVAL
+        science_array.append(uncompress_data.astype(np.int64))
+        raw_science_array.append(raw_counts.astype(np.int64))
+        metadata_arrays = add_metadata_to_array(data_packet, metadata_arrays)
 
-    met_time = xr.DataArray(
+    epoch_time = xr.DataArray(
         metadata_arrays["SHCOARSE"],
-        name="met_time",
-        dims=["met_time"],
-        attrs=dict(
-            description="Mission elapsed time",
-            units="seconds since start of the mission",
-        ),
+        name="Epoch",
+        dims=["Epoch"],
+        attrs=ConstantCoordinates.EPOCH,
+    )
+
+    # TODO: add more descriptive description
+    energy = xr.DataArray(
+        np.arange(180),
+        name="Energy",
+        dims=["Energy"],
+        attrs=dataclasses.replace(
+            swe_cdf_attrs.int_base,
+            catdesc="Energy's index value in the lookup table",
+            fieldname="Energy Bins",
+            label_axis="Energy Bins",
+            units="",
+        ).output(),
+    )
+
+    counts = xr.DataArray(
+        np.arange(7),
+        name="Counts",
+        dims=["Counts"],
+        attrs=dataclasses.replace(
+            swe_cdf_attrs.int_base,
+            catdesc="Counts",
+            fieldname="Counts",
+            label_axis="Counts",
+            units="int",
+        ).output(),
     )
 
     science_xarray = xr.DataArray(
         science_array,
-        dims=["met_time", "seconds", "energy_steps", "cem_counts"],
+        dims=["Epoch", "Energy", "Counts"],
+        attrs=swe_cdf_attrs.l1a_science_attrs.output(),
     )
+
     raw_science_xarray = xr.DataArray(
         raw_science_array,
-        dims=["met_time", "seconds", "energy_steps", "cem_counts"],
+        dims=["Epoch", "Energy", "Counts"],
+        attrs=swe_cdf_attrs.l1a_science_attrs.output(),
     )
 
     dataset = xr.Dataset(
-        {"SCIENCE_DATA": science_xarray},
-        coords={"met_time": met_time},
+        coords={
+            "Epoch": epoch_time,
+            "Energy": energy,
+            "Counts": counts,
+        },
+        attrs=swe_cdf_attrs.swe_l1a_global_attrs.output(),
     )
-
+    dataset["SCIENCE_DATA"] = science_xarray
     dataset["RAW_SCIENCE_DATA"] = raw_science_xarray
 
     # create xarray dataset for each metadata field
     for key, value in metadata_arrays.items():
         if key == "SHCOARSE":
             continue
+        # TODO: figure out how to add more descriptive
+        # description for each metadata field
+        #
+        # int_attrs["CATDESC"] = int_attrs["FIELDNAM"] = int_attrs["LABLAXIS"] = key
+        # # get int32's max since most of metadata is under 32-bits
+        # int_attrs["VALIDMAX"] = np.iinfo(np.int32).max
+        # int_attrs["DEPEND_0"] = "Epoch"
         dataset[key] = xr.DataArray(
             value,
-            dims=["met_time"],
+            dims=["Epoch"],
+            attrs=dataclasses.replace(
+                swe_cdf_attrs.swe_metadata_attrs,
+                catdesc=key,
+                fieldname=key,
+                label_axis=key,
+                depend_0="Epoch",
+            ).output(),
         )
 
     return dataset
Original file line number	Diff line number	Diff line change
`@@ -77,7 +77,7 @@ def test_descriptor_in_file_name(decom_test_data, temp_path):`
`77`	`77`	`date_to_test = "20250724"`
`78`	`78`	`assert file_name == os.path.join(`
`79`	`79`	`temp_path,`
`80`		`- f"{decom_test_data.data.attrs['Logical_source']}_{date_to_test}_impact-lab-test001_v{idex.__version__}.cdf",`
	`80`	`+ f"{decom_test_data.data.attrs['Logical_source']}_impact-lab-test001_{date_to_test}_v{idex.__version__}.cdf",`
`81`	`81`	`)`
`82`	`82`	`assert Path(file_name).exists()`
`83`	`83`