# Source code for romancal.ramp_fitting.ramp_fit_step

#! /usr/bin/env python
#
from __future__ import annotations

import copy
import logging
from typing import TYPE_CHECKING

import asdf
import numpy as np
from astropy.utils.decorators import deprecated
from roman_datamodels import datamodels as rdm
from roman_datamodels.dqflags import group, pixel
from stcal.jump.jump_class import JumpData
from stcal.ramp_fitting import ols_cas22_fit
from stcal.ramp_fitting.likely_fit import likely_ramp_fit
from stcal.ramp_fitting.ols_cas22 import Parameter, Variance

from romancal.datamodels.fileio import open_dataset
from romancal.stpipe import RomanStep

# Square root of two, computed once at import time.
# NOTE(review): no use of SQRT2 is visible in the code reviewed here --
# confirm it is still needed before relying on it or removing it.
SQRT2 = np.sqrt(2)

# ClassVar is only needed for annotations, so it is imported for static type
# checkers only (annotations are lazy via ``from __future__ import annotations``).
if TYPE_CHECKING:
    from typing import ClassVar

# Module-level logger; its level is explicitly set to DEBUG here.
log = logging.getLogger(__name__)
log.setLevel(logging.DEBUG)

# Names exported by ``from ... import *``.
__all__ = ["RampFitStep"]



class RampFitStep(RomanStep):
    """Fit a straight line to counts versus time for every pixel.

    The fitted slope is the mean count rate of the pixel.  Two fitting
    algorithms can be selected through the ``algorithm`` step parameter:
    ``'likely'`` (the default) and the deprecated ``'ols_cas22'``.
    """

    class_alias = "ramp_fit"

    spec = """
        algorithm = option('ols_cas22', 'likely', default='likely')  # Algorithm to use to fit. Note: `ols_cas22` is deprecated and will be removed in a future version
        suffix = string(default='rampfit')  # Default suffix of results
        rejection_threshold = float(default=4.5,min=0) # CR sigma rejection threshold
        use_ramp_jump_detection = boolean(default=True) # Use jump detection during ramp fitting
        threshold_intercept = float(default=None) # Override the intercept parameter for the threshold function in the jump detection algorithm.
        threshold_constant = float(default=None) # Override the constant parameter for the threshold function in the jump detection algorithm.
        include_var_rnoise = boolean(default=False) # include var_rnoise in output (can be reconstructed from err and other variances)
        maximum_cores = string(default='1') # cores for multiprocessing. Can be an integer, 'half', 'quarter', or 'all'
        expand_large_events = boolean(default=False) # Turns on Snowball detection
        min_sat_area = float(default=1.0) # minimum required area for the central saturation of snowballs
        min_jump_area = float(default=6.0) # minimum area to trigger large events processing
        expand_factor = float(default=1.9) # The expansion factor for the enclosing circles or ellipses
        sat_required_snowball = boolean(default=True) # Require the center of snowballs to be saturated
        min_sat_radius_extend = float(default=0.5) # The min radius of the sat core to trigger the extension of the core
        sat_expand = integer(default=2) # Number of pixels to add to the radius of the saturated core of snowballs
        edge_size = integer(default=0) # Distance from detector edge where a saturated core is not required for snowball detection
     """

    weighting = "optimal"  # Only weighting allowed for OLS

    reference_file_types: ClassVar = ["readnoise", "gain"]

    def process(self, dataset):
        """Run ramp fitting on ``dataset`` and return the fitted model.

        Parameters
        ----------
        dataset : object
            Anything accepted by ``open_dataset``; it is opened into the
            input model that holds the ramps.

        Returns
        -------
        out_model : datamodel
            The model produced by the selected fitting function.  If the
            algorithm name is not recognised, the input model is returned
            with ``meta.cal_step.ramp_fit`` set to ``"SKIPPED"``.
        """
        input_model = open_dataset(dataset, update_version=self.update_version)

        # Retrieve reference info
        # NOTE(review): the reference models opened below are not explicitly
        # closed in this method -- confirm whether that is intentional.
        readnoise_filename = self.get_reference_file(input_model, "readnoise")
        gain_filename = self.get_reference_file(input_model, "gain")
        log.info("Using READNOISE reference file: %s", readnoise_filename)
        readnoise_model = rdm.open(readnoise_filename, mode="r")
        log.info("Using GAIN reference file: %s", gain_filename)
        gain_model = rdm.open(gain_filename, mode="r")

        # Do the fitting based on the algorithm selected.
        algorithm = self.algorithm.lower()
        if algorithm == "ols_cas22":
            out_model = ols_cas22(
                input_model,
                readnoise_model,
                gain_model,
                include_var_rnoise=self.include_var_rnoise,
                use_jump=self.use_ramp_jump_detection,
                threshold_intercept=self.threshold_intercept,
                threshold_constant=self.threshold_constant,
            )
        elif algorithm == "likely":
            # Snowball / multiprocessing options forwarded to _setup_jump_data.
            jump_kw = dict(
                maximum_cores=self.maximum_cores,
                expand_large_events=self.expand_large_events,
                min_sat_area=self.min_sat_area,
                min_jump_area=self.min_jump_area,
                expand_factor=self.expand_factor,
                sat_required_snowball=self.sat_required_snowball,
                min_sat_radius_extend=self.min_sat_radius_extend,
                sat_expand=self.sat_expand,
                edge_size=self.edge_size,
            )

            out_model = likely(
                input_model,
                readnoise_model,
                gain_model,
                # Forward the step parameter so that a user override is
                # honoured; the step default equals the function default.
                rejection_threshold=self.rejection_threshold,
                include_var_rnoise=self.include_var_rnoise,
                jump_kw=jump_kw,
            )
        else:
            # Supply the algorithm name for the %s placeholder.
            log.error("Algorithm %s is not supported. Skipping step.", algorithm)
            out_model = input_model
            out_model.meta.cal_step.ramp_fit = "SKIPPED"

        return out_model




@deprecated("0.22.0")
def ols_cas22(
    input_model,
    readnoise_model,
    gain_model,
    include_var_rnoise=False,
    use_jump=True,
    threshold_intercept=None,
    threshold_constant=None,
):
    """Perform optimal linear fitting on arbitrarily spaced resultants.

    Parameters
    ----------
    input_model : RampModel
        Model containing ramps.  It is not modified.

    readnoise_model : ReadnoiseRefModel
        Model with the read noise reference information.

    gain_model : GainRefModel
        Model with the gain reference information.

    include_var_rnoise : bool
        If True, include var_rnoise in the output model.

    use_jump : bool
        If True, fit jumps as part of ramp fitting.

    threshold_intercept : float
        y-intercept to use for jump significance equation.  Only forwarded
        to the fitter when it is not None.

    threshold_constant : float
        slope to use for jump significance equation.  Only forwarded to the
        fitter when it is not None.

    Returns
    -------
    out_model : ImageModel
        Model containing a count-rate image.

    Raises
    ------
    RuntimeError
        If the number of read-pattern entries differs from the number of
        resultants.
    """
    jump_message = (
        "Jump detection as part of ramp fitting is enabled."
        if use_jump
        else "Jump detection as part of ramp fitting is disabled."
    )
    log.info(jump_message)

    # Only pass on the threshold overrides that were actually supplied.
    threshold_overrides = {
        key: value
        for key, value in (
            ("threshold_intercept", threshold_intercept),
            ("threshold_constant", threshold_constant),
        )
        if value is not None
    }

    gain = gain_model.data
    frame_time = input_model.meta.exposure.frame_time

    # Scale by the gain on fresh arrays so that input_model stays untouched.
    scaled_resultants = input_model.data * gain
    scaled_read_noise = readnoise_model.data * gain
    group_dq = input_model.groupdq

    # The fitter needs plain nested lists, not LNodes.
    read_pattern = [list(reads) for reads in input_model.meta.exposure.read_pattern]
    if len(read_pattern) != scaled_resultants.shape[0]:
        raise RuntimeError("mismatch between resultants shape and read_pattern.")

    fit = ols_cas22_fit.fit_ramps_casertano(
        scaled_resultants,
        group_dq,
        scaled_read_noise,
        frame_time,
        read_pattern=read_pattern,
        use_jump=use_jump,
        **threshold_overrides,
    )

    # Undo the gain scaling: slopes by gain, variances by gain squared.
    slopes = fit.parameters[..., Parameter.slope] / gain
    var_rnoise = fit.variances[..., Variance.read_var] / gain**2
    var_poisson = fit.variances[..., Variance.poisson_var] / gain**2
    err = np.sqrt(var_poisson + var_rnoise)
    fitted_dq = fit.dq.astype(np.uint32)

    # Collapse the per-resultant flags into per-pixel flags.
    ramp_dq = get_pixeldq_flags(fitted_dq, input_model.pixeldq, slopes, err, gain)

    image_info = dict(
        slope=slopes,
        dq=ramp_dq,
        var_poisson=var_poisson,
        var_rnoise=var_rnoise,
        err=err,
    )
    image_model = _create_image_model(
        input_model, image_info, include_var_rnoise=include_var_rnoise
    )
    image_model.meta.cal_step.ramp_fit = "COMPLETE"
    return image_model


def likely(
    input_model,
    readnoise_model,
    gain_model,
    rejection_threshold=4.5,
    include_var_rnoise=False,
    jump_kw=None,
):
    """Fit ramps with the maximum likelihood algorithm.

    Note that ``input_model`` is modified in place: extra entries are added
    to it and a leading axis is prepended to its ``data`` and ``groupdq``.

    Parameters
    ----------
    input_model : RampModel
        Model containing ramps.

    readnoise_model : ReadnoiseRefModel
        Model with the read noise reference information.

    gain_model : GainRefModel
        Model with the gain reference information.

    rejection_threshold : float
        Reject CRs at this SNR

    include_var_rnoise : bool
        if True, include var_rnoise estimates in the output data model

    jump_kw : dict
        Additional keywords to control jump detection; see _setup_jump_data.
        ``None`` means no extra keywords.

    Returns
    -------
    out_model : ImageModel
        Model containing a count-rate image.
    """
    # Entries the fitting code expects to find on the model.
    for key, value in (
        ("flags_do_not_use", pixel.DO_NOT_USE),
        ("flags_saturated", pixel.SATURATED),
        ("rejection_threshold", rejection_threshold),
        ("flags_jump_det", pixel.JUMP_DET),
    ):
        input_model[key] = value

    # Prepend an axis to match the JWST data cube layout.
    input_model.data = input_model.data[None, :, :, :]
    input_model.groupdq = input_model.groupdq[None, :, :, :]

    # Ancillary information needed by the likelihood fitting.
    input_model.read_pattern = _get_readtimes(input_model)
    input_model.zeroframe = None
    cube_shape = input_model.data.shape
    input_model.average_dark_current = np.zeros((cube_shape[2], cube_shape[3]))

    # Jump data handles snowballs and other special situations handled by
    # the likelihood algorithm.
    jump_options = {} if jump_kw is None else jump_kw
    jump_data = _setup_jump_data(
        input_model, readnoise_model, gain_model, **jump_options
    )

    image_info, _, _ = likely_ramp_fit(
        input_model, readnoise_model.data, gain_model.data, jump_data=jump_data
    )

    # Flag pixels with at most one resultant that is neither saturated nor
    # marked do-not-use.
    unusable_bits = group.SATURATED | group.DO_NOT_USE
    usable = (input_model.groupdq[0] & unusable_bits) == 0
    too_few_resultants = np.sum(usable, axis=0) <= 1
    # we need to revisit the pixeldq handling!
    image_info["dq"] |= pixel.DO_NOT_USE * too_few_resultants

    out_model = _create_image_model(
        input_model, image_info, include_var_rnoise=include_var_rnoise
    )
    out_model.meta.cal_step.ramp_fit = "COMPLETE"
    return out_model


def _setup_jump_data(
    result,
    rnoise_m,
    gain_m,
    expand_large_events=False,
    min_jump_area=6,
    min_sat_area=1,
    expand_factor=1.9,
    sat_required_snowball=True,
    min_sat_radius_extend=0.5,
    sat_expand=2,
    edge_size=0,
    maximum_cores="1",
):
    """
    Build the JumpData instance used by STCAL jump.

    Parameters
    ----------
    result : RampModel
        The ramp model input from the previous step.

    rnoise_m : ReadNoise model
        Readnoise reference model

    gain_m : GainModel
        Gain reference model

    expand_large_events : bool
        if True, identify and flag potential snowballs

    min_jump_area : int
        minimum area to trigger large event processing

    min_sat_area : float
        minimum required area for the central saturation of snowballs

    expand_factor : float
        The expansion factor for the enclosing circles or ellipses

    sat_required_snowball : bool
        Require the center of snowballs to be saturated

    min_sat_radius_extend : float
        The min radius of the sat core to trigger the extension of the core

    sat_expand : int
        Number of pixels to add to the radius of the saturated core of
        snowballs.  The value is doubled before it is handed to JumpData.

    edge_size : int
        Distance from detector edge where a saturated core is not required for snowball detection

    maximum_cores : string
        str(int) giving the maximum number of cores to use, or 'quarter', 'half', or 'all'

    Returns
    -------
    jump_data : JumpData
        The data container to be used to run the STCAL detect_jumps_data.
    """
    # Populate a JumpData container from the ramp model and reference arrays.
    container = JumpData(result, gain_m.data, rnoise_m.data, pixel)

    # Snowball detection settings, in the positional order expected by
    # set_snowball_info; sat_expand is passed at twice its input value.
    snowball_settings = (
        expand_large_events,
        min_jump_area,
        min_sat_area,
        expand_factor,
        sat_required_snowball,
        min_sat_radius_extend,
        sat_expand * 2,
        edge_size,
    )
    container.set_snowball_info(*snowball_settings)

    # Performance setup
    container.max_cores = maximum_cores

    return container


# #########
# Utilities
# #########
def _create_image_model(input_model, image_info, include_var_rnoise=False):
    """Build the output ImageModel from the arrays computed by ramp fitting.

    Parameters
    ----------
    input_model : `~roman_datamodels.datamodels.RampModel`
        Input ``RampModel`` for which the output ``ImageModel`` is created.

    image_info : dict
        The ramp fitting arrays needed for the ``ImageModel``.  The keys
        read here are ``"slope"``, ``"dq"``, ``"err"``, ``"var_poisson"``,
        ``"var_rnoise"`` (only when requested) and, optionally, ``"chisq"``.

    include_var_rnoise : bool
        If True, include var_rnoise in the output model.

    Returns
    -------
    out_model : `~roman_datamodels.datamodels.ImageModel`
        The output ``ImageModel`` to be returned from the ramp fit step.

    """

    def _science_region(array):
        # Drop the 4-pixel border on every side and return a copy.
        return array[4:-4, 4:-4].copy()

    model = rdm.ImageModel()
    # use getitem here to avoid copying the DNode
    model.meta = copy.deepcopy(input_model["meta"])
    model.meta.model_type = "ImageModel"
    # The nodes were copied, so clear any "read" tags they still carry.
    for node in asdf.treeutil.iter_tree(model):
        if node._read_tag is not None:
            node._read_tag = None
    model.meta.product_type = "l2"

    # Rebuild cal_step with every required step, defaulting to "INCOMPLETE".
    model.meta.cal_step = {}
    required_steps = model.schema_info("required")["roman"]["meta"]["cal_step"][
        "required"
    ].info
    for step_name in required_steps:
        model.meta.cal_step[step_name] = input_model.meta.cal_step.get(
            step_name, "INCOMPLETE"
        )

    model.meta.cal_logs = []
    model.meta.photometry = {
        "conversion_megajanskys": -999999,
        "conversion_megajanskys_uncertainty": -999999,
        "pixel_area": -999999,
    }

    # Carry over copies of the amp33 and border reference pixel arrays.
    for name in (
        "amp33",
        "border_ref_pix_left",
        "border_ref_pix_right",
        "border_ref_pix_top",
        "border_ref_pix_bottom",
        "dq_border_ref_pix_left",
        "dq_border_ref_pix_right",
        "dq_border_ref_pix_top",
        "dq_border_ref_pix_bottom",
    ):
        setattr(model, name, getattr(input_model, name).copy())

    # Science data, dq, err and variances have the border pixels trimmed off.
    model.data = _science_region(image_info["slope"])
    dq = image_info["dq"]
    if dq is None:
        model.dq = np.zeros(model.data.shape, dtype="u4")
    else:
        model.dq = _science_region(dq)

    model.err = _science_region(image_info["err"]).astype("float16")
    model.var_poisson = _science_region(image_info["var_poisson"]).astype("float16")
    if include_var_rnoise:
        model.var_rnoise = _science_region(image_info["var_rnoise"]).astype(
            "float16"
        )

    # chisq and dumo are required fields.  chisq is filled with zeroes when
    # image_info has no "chisq" entry or that entry is None.
    chisq = image_info.get("chisq")
    if chisq is None:
        model.chisq = np.zeros(model.data.shape, dtype=np.float16)
    else:
        model.chisq = _science_region(chisq).astype("float16")

    # Add dumo to the optimal-weighted slopes to get the uniform-weighted slopes.
    uniform_slopes = slopes_uniform_weights(input_model)
    model.dumo = (uniform_slopes[4:-4, 4:-4] - model.data).astype("float16")

    return model


def slopes_uniform_weights(input_model):
    """
    Compute ramp slopes with uniform (read-noise-limited) weighting.

    Parameters
    ----------
    input_model : RampModel
        Model containing ramps.  ``data`` may be 3-D, or 4-D in which case
        only its first element along the leading axis is used.

    Returns
    -------
    slopes : ndarray
        The slope for each pixel under uniform weighting, which is optimal
        in the read noise limit.  All flags, including saturation and
        jump, will be ignored.

    Raises
    ------
    ValueError
        If ``input_model.data`` is neither 3-D nor 4-D.
    """
    # Per-resultant weights for uniform weighting, i.e. a diagonal covariance
    # matrix consisting only of read noise.
    readtimes = _get_readtimes(input_model)

    reads_per_resultant = np.array([len(times) for times in readtimes])
    mean_time = np.array([np.mean(times) for times in readtimes])
    n_total = np.sum(reads_per_resultant)
    sum_t = np.sum(reads_per_resultant * mean_time)
    sum_tt = np.sum(reads_per_resultant * mean_time**2)
    weights = (
        n_total * reads_per_resultant * mean_time - sum_t * reads_per_resultant
    ) / (n_total * sum_tt - sum_t**2)

    # Pick the 3-D cube of resultants, then take the weighted sum over reads.
    rank = len(input_model.data.shape)
    if rank == 3:
        cube = input_model.data
    elif rank == 4:
        cube = input_model.data[0]
    else:
        raise ValueError("Unexpected shape for input_model.data")
    return np.sum(weights[:, None, None] * cube, axis=0)


def get_pixeldq_flags(groupdq, pixeldq, slopes, err, gain):
    """Build the output pixeldq from the input dq arrays and the fit results.

    Starting from a copy of ``pixeldq``, the following flags are added:

    - JUMP_DET where any resultant has a jump flagged
    - SATURATED where every resultant is saturated
    - DO_NOT_USE where every resultant is saturated or do-not-use, where
      the slope is not finite, or where the error is not positive
    - NO_GAIN_VALUE where the gain is negative or not finite

    Parameters
    ----------
    groupdq : np.ndarray
        dq flags for each resultant
    pixeldq : np.ndarray
        dq flags for each pixel
    slopes : np.ndarray
        derived slopes for each pixel
    err : np.ndarray
        derived total uncertainty for each pixel
    gain : np.ndarray
        gains for each pixel

    Returns
    -------
    pixeldq : np.ndarray
        Updated pixeldq array combining information from input dq and slopes.

    """
    has_jump = np.any(groupdq & group.JUMP_DET, axis=0)
    all_saturated = np.all(groupdq & group.SATURATED, axis=0)

    # Unusable: nothing but saturated/do-not-use resultants, a non-finite
    # slope, or a non-positive error.
    unusable = np.all(groupdq & (group.SATURATED | group.DO_NOT_USE), axis=0)
    unusable |= ~np.isfinite(slopes) | (err <= 0)

    bad_gain = (gain < 0) | ~np.isfinite(gain)

    # Existing pixel flags are passed forward; new ones are OR-ed on top.
    combined = pixeldq.copy()
    for mask, flag in (
        (has_jump, pixel.JUMP_DET),
        (all_saturated, pixel.SATURATED),
        (unusable, pixel.DO_NOT_USE),
        (bad_gain, pixel.NO_GAIN_VALUE),
    ):
        combined |= (mask * flag).astype(np.uint32)

    return combined


def _get_readtimes(ramp_data):
    """Get the read times needed to compute the covariance matrices.

    Each entry of ``ramp_data.meta.exposure.read_pattern`` is multiplied by
    ``ramp_data.meta.exposure.frame_time``.  The number of resultants is
    logged at INFO level.

    Parameters
    ----------
    ramp_data : RampData
        Input data necessary for computing ramp fitting.

    Returns
    -------
    readtimes : list
        A list with one inner list per read-pattern entry, holding that
        entry's values scaled by the frame time.

    """
    exposure = ramp_data.meta.exposure
    log.info("Number of resultants: %d ", exposure.nresultants)

    return [
        list(np.array(reads) * exposure.frame_time)
        for reads in exposure.read_pattern
    ]