# Module-level logger for the resample code.
log = logging.getLogger(__name__)
log.setLevel(logging.DEBUG)

# Public API of this module.
# Every entry must be followed by a comma: adjacent string literals are
# implicitly concatenated, which would silently merge two names into a
# single, non-existent export.
__all__ = [
    "compute_wcs_pixel_area",
    "OutputTooLargeError",
    "Resample",
    # NOTE(review): no definition of this name is visible in this part of
    # the file -- confirm it is defined further down, otherwise
    # ``from stcal.resample.resample import *`` will fail.
    "resampled_wcs_from_models",
    "UnsupportedWCSError",
]
def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square",
             fillval=0.0, wht_type="ivm", good_bits=0,
             output_wcs=None, output_model=None,
             accumulate=False, enable_ctx=True, enable_var=True,
             compute_err=None,
             allowed_memory=None):
    """
    Set up resampling parameters, the output WCS and the output model.

    Parameters
    ----------
    n_input_models : int, None, optional
        Number of input models expected to be resampled. When provided,
        this is used to estimate memory requirements and optimize memory
        allocation for the context array.

    pixfrac : float, optional
        The fraction of a pixel that the pixel flux is confined to. The
        default value of 1 has the pixel flux evenly spread across the
        image. A value of 0.5 confines it to half a pixel in the linear
        dimension, so the flux is confined to a quarter of the pixel area
        when the square kernel is used.

    kernel : {"square", "gaussian", "point", "turbo", "lanczos2", "lanczos3"}, optional
        The name of the kernel used to combine the input. The choice of
        kernel controls the distribution of flux over the kernel.
        The square kernel is the default.

        .. warning::
           The "gaussian" and "lanczos2/3" kernels **DO NOT**
           conserve flux.

    fillval : float, None, str, optional
        The value of output pixels that did not have contributions from
        input images' pixels. When ``fillval`` is either `None` or
        ``"INDEF"`` and ``out_img`` is provided, the values of ``out_img``
        will not be modified. When ``fillval`` is either `None` or
        ``"INDEF"`` and ``out_img`` is **not provided**, the values of
        ``out_img`` will be initialized to `numpy.nan`. If ``fillval``
        is a string that can be converted to a number, then the output
        pixels with no contributions from input images will be set to this
        ``fillval`` value.

    wht_type : {"exptime", "ivm"}, optional
        The weighting type for adding models' data. For ``wht_type="ivm"``
        (the default), the weighting will be determined per-pixel using
        the inverse of the read noise (VAR_RNOISE) array stored in each
        input image. If the ``VAR_RNOISE`` array does not exist,
        the variance is set to 1 for all pixels (i.e., equal weighting).
        If ``wht_type="exptime"``, the weight will be set equal
        to the measurement time (``TMEASURE``) when available and to
        the exposure time (``EFFEXPTM``) otherwise.

    good_bits : int, str, None, optional
        An integer bit mask, `None`, a Python list of bit flags, a comma-,
        or ``'|'``-separated, ``'+'``-separated string list of integer
        bit flags or mnemonic flag names that indicate what bits in models'
        DQ bitfield array should be *ignored* (i.e., zeroed).

        When co-adding models using :py:meth:`add_model`, any pixels with
        a non-zero DQ values are assigned a weight of zero and therefore
        they do not contribute to the output (resampled) data.
        ``good_bits`` provides a means to ignore some of the DQ bitflags.

        When ``good_bits`` is an integer, it must be
        the sum of all the DQ bit values from the input model's
        DQ array that should be considered "good" (or ignored). For
        example, if pixels in the DQ array can be
        combinations of 1, 2, 4, and 8 flags and one wants to consider DQ
        "defects" having flags 2 and 4 as being acceptable, then
        ``good_bits`` should be set to 2+4=6. Then a pixel with DQ values
        2,4, or 6 will be considered a good pixel, while a pixel with
        DQ value, e.g., 1+2=3, 4+8=12, etc. will be flagged as
        a "bad" pixel.

        Alternatively, when ``good_bits`` is a string, it can be a
        comma-separated or '+' separated list of integer bit flags that
        should be summed to obtain the final "good" bits. For example,
        both "4,8" and "4+8" are equivalent to integer ``good_bits=12``.

        Finally, instead of integers, ``good_bits`` can be a string of
        comma-separated mnemonics. For example, for JWST, all the following
        specifications are equivalent:

        `"12" == "4+8" == "4, 8" == "JUMP_DET, DROPOUT"`

        In order to "translate" mnemonic code to integer bit flags,
        ``Resample.dq_flag_name_map`` attribute must be set to either
        a dictionary (with keys being mnemonic codes and the values being
        integer flags) or a `~astropy.nddata.BitFlagNameMap`.

        In order to reverse the meaning of the flags
        from indicating values of the "good" DQ flags
        to indicating the "bad" DQ flags, prepend '~' to the string
        value. For example, in order to exclude pixels with
        DQ flags 4 and 8 for computations and to consider
        as "good" all other pixels (regardless of their DQ flag),
        use a value of ``~4+8``, or ``~4,8``. A string value of
        ``~0`` would be equivalent to a setting of ``None``.

        | Default value (0) will make *all* pixels with non-zero DQ
          values be considered "bad" pixels, and the corresponding data
          pixels will be assigned zero weight and thus these pixels
          will not contribute to the output resampled data array.

        | Set `good_bits` to `None` to turn off the use of model's DQ
          array.

        For more details, see documentation for
        `astropy.nddata.bitmask.extend_bit_flag_map`.

    output_wcs : dict, WCS object, None
        Specifies output WCS either directly as a WCS or a dictionary
        with keys ``'wcs'`` (WCS object) and ``'pixel_scale'``
        (pixel scale in arcseconds). ``'pixel_scale'``, when provided,
        will be used for computation of drizzle scaling factor. When it is
        not provided, output pixel scale will be *estimated* from the
        provided WCS object. An optional ``'pixel_scale_ratio'`` key is
        also read from the dictionary. ``output_wcs`` object is required
        when ``output_model`` is `None`. ``output_wcs`` is ignored when
        ``output_model`` is provided.

    output_model : dict, None, optional
        A dictionary containing data arrays and other attributes that
        will be used to add new models to. Use
        :py:meth:`Resample.output_model_attributes` to get the list of
        keywords that must be present. When ``accumulate`` is `False`,
        only the WCS object of the model will be used. When ``accumulate``
        is `True`, new models will be added to the existing data in the
        ``output_model``.

        When ``output_model`` is `None`, a new model will be created.

    accumulate : bool, optional
        Indicates whether resampled models should be added to the
        provided ``output_model`` data or if new arrays should be
        created.

    enable_ctx : bool, optional
        Indicates whether to create a context image. It also determines
        whether a provided ``output_model`` is required to have the
        context-related keywords.

    enable_var : bool, optional
        Indicates whether to resample variance arrays.

    compute_err : {"from_var", "driz_err"}, None, optional
        - ``"from_var"``: compute output model's error array from
          all (Poisson, flat, readout) resampled variance arrays.
          Setting ``compute_err`` to ``"from_var"`` will assume
          ``enable_var`` was set to `True` regardless of actual
          value of the parameter ``enable_var``.
        - ``"driz_err"``: compute output model's error array by drizzling
          together all input models' error arrays.

        Error array will be assigned to ``'err'`` key of the output model.

        .. note::
            At this time, output error array is not equivalent to
            error propagation results.

    allowed_memory : float, None
        Fraction of memory allowed to be used for resampling. If
        ``allowed_memory`` is `None` then no check for available memory
        will be performed.

    Raises
    ------
    ValueError
        When ``wht_type`` is not supported, when neither ``output_wcs``
        nor ``output_model`` is provided, or when the output shape is
        undefined or has a zero-length dimension.

    """
    # to see if setting up arrays and drizzle is needed
    self._finalized = False
    self._n_res_models = 0

    self._n_predicted_input_models = n_input_models
    self.allowed_memory = allowed_memory
    self._output_model = output_model
    # NOTE(review): despite its name this flag is True when an output
    # model *was* supplied. It is not read anywhere in the visible part of
    # the file, so the expression is kept as-is -- confirm the intent.
    self._create_new_output_model = output_model is not None

    self._enable_ctx = enable_ctx
    self._enable_var = enable_var
    self._compute_err = compute_err
    self._accumulate = accumulate

    # these are attributes that are used only for information purpose
    # and are added to the created output_model only if they are
    # not already present there:
    self._pixel_scale_ratio = None
    self._output_pixel_scale = None  # in arcsec

    # resample parameters
    self.pixfrac = pixfrac
    self.kernel = kernel
    self.fillval = fillval
    self.good_bits = good_bits

    if wht_type not in ("ivm", "exptime"):
        # 'self.weight_type' is not set on this path, so report the
        # offending argument itself.
        raise ValueError(f"Unexpected weight type: '{wht_type}'")
    self.weight_type = wht_type

    self._output_wcs = output_wcs

    self.input_file_names = []
    self._group_ids = []

    # determine output WCS and set-up output model if needed:
    if output_model is None:
        if output_wcs is None:
            raise ValueError(
                "Output WCS must be provided either through the "
                "'output_wcs' parameter or the 'output_model' parameter."
            )

        if isinstance(output_wcs, dict):
            self._output_pixel_scale = output_wcs.get("pixel_scale")
            self._pixel_scale_ratio = output_wcs.get("pixel_scale_ratio")
            self._output_wcs = output_wcs.get("wcs")
        else:
            self._output_wcs = output_wcs

        self.check_output_wcs(self._output_wcs)

    else:
        self.validate_output_model(
            output_model=output_model,
            accumulate=accumulate,
            enable_ctx=enable_ctx,
            enable_var=enable_var,
        )
        self._output_model = output_model
        self._output_wcs = output_model["wcs"]
        self._output_pixel_scale = output_model.get("pixel_scale")
        # explicit None test: do not rely on the truthiness of a WCS object
        if output_wcs is not None:
            log.warning(
                "'output_wcs' will be ignored. Using the 'wcs' supplied "
                "by the 'output_model' instead."
            )

    if self._output_pixel_scale is None:
        self._output_pixel_scale = 3600.0 * np.rad2deg(
            math.sqrt(compute_wcs_pixel_area(self._output_wcs))
        )
        log.info(
            "Computed output pixel scale: "
            f"{self._output_pixel_scale} arcsec."
        )
    else:
        log.info(
            f"Output pixel scale: {self._output_pixel_scale} arcsec."
        )

    self._output_array_shape = self._output_wcs.array_shape

    # Check that the output data shape is defined and has no zero length
    # dimensions
    if self._output_array_shape is None:
        raise ValueError(
            "Invalid output frame shape: 'array_shape' of the output "
            "WCS is not set."
        )
    npix = np.prod(self._output_array_shape)
    if not npix:
        raise ValueError(
            "Invalid output frame shape: "
            f"{tuple(self._output_array_shape)}"
        )

    log.info(f"Driz parameter kernel: {self.kernel}")
    log.info(f"Driz parameter pixfrac: {self.pixfrac}")
    log.info(f"Driz parameter fillval: {self.fillval}")
    log.info(f"Driz parameter weight_type: {self.weight_type}")
    log.debug(
        f"Output mosaic size (nx, ny): {self._output_wcs.pixel_shape}"
    )

    # set up an empty (don't allocate arrays at this time) output model:
    if self._output_model is None:
        self._output_model = self.create_output_model()

    self.reset_arrays(reset_output=False, n_input_models=n_input_models)
def check_memory_requirements(self, output_model, allowed_memory,
                              n_input_models=None):
    """ Verify that there is enough memory to hold the output arrays.

    The estimate is the per-pixel size of every supported output array
    present in ``output_model`` (plus the pixel map), multiplied by the
    number of output pixels. It is compared with the sum of available
    virtual memory and total swap reported by ``psutil``.

    Parameters
    ----------
    output_model : dict
        A dictionary describing the output model. Only the *presence* of
        the array keys listed in ``output_array_types`` is used here.

    allowed_memory : float, None
        Fraction of memory allowed to be used for resampling. When `None`,
        the value of the ``DMODEL_ALLOWED_MEMORY`` environment variable
        is used if it is set; otherwise no check is performed.

    n_input_models : int, None, optional
        Number of input models expected to be resampled. It is used to
        estimate the number of planes of the context array. When `None`,
        no check is performed.

    Raises
    ------
    OutputTooLargeError
        When the estimated size of the output arrays exceeds the allowed
        fraction of the memory.

    """
    if allowed_memory is None:
        # presumably the environment variable holds the same kind of
        # fraction as the 'allowed_memory' argument -- TODO confirm
        allowed_memory = os.environ.get("DMODEL_ALLOWED_MEMORY")

    if allowed_memory is None or n_input_models is None:
        return

    allowed_memory = float(allowed_memory)

    # get the available memory
    available_memory = (
        psutil.virtual_memory().available + psutil.swap_memory().total
    )

    # compute the output array size
    npix = np.prod(self._output_array_shape)
    # one context plane per 32 input models (rounded up)
    nconpl = n_input_models // 32 + (1 if n_input_models % 32 else 0)

    bytes_per_pixel = 0
    for arr, arr_type in self.output_array_types.items():
        if arr not in output_model:
            continue

        if arr == "con":
            f = nconpl
        elif arr == "err" and self._compute_err == "from_var":
            f = 2  # data and weight arrays
        elif arr.startswith("var"):
            f = 3  # variance data, weight, and total arrays
        else:
            f = 1

        # 'itemsize' must be read from a dtype instance: on a scalar
        # *class* such as np.float32 it is a descriptor, not a number.
        bytes_per_pixel += f * np.dtype(arr_type).itemsize

    # add pixmap itemsize:
    bytes_per_pixel += 2 * np.dtype(float).itemsize
    required_memory = bytes_per_pixel * npix

    # compare used to available
    used_fraction = required_memory / available_memory
    if used_fraction > allowed_memory:
        raise OutputTooLargeError(
            f'Combined ImageModel size {self._output_wcs.array_shape} '
            f'requires {bytes2human(required_memory)}. '
            f'Model cannot be instantiated.'
        )
def validate_output_model(self, output_model, accumulate,
                          enable_ctx, enable_var):
    """ Check that ``output_model`` has all the required keywords.

    The set of required keywords is obtained from
    :py:meth:`output_model_attributes` based on the values of
    ``accumulate``, ``enable_ctx``, ``enable_var`` and on the
    ``compute_err`` setting stored on the instance (if any).

    Parameters
    ----------
    output_model : dict, None
        The output model to validate. `None` is accepted only when
        ``accumulate`` is `False`.

    accumulate : bool
        Indicates whether resampled models will be added to the existing
        data of ``output_model``.

    enable_ctx : bool
        Indicates whether a context image is used.

    enable_var : bool
        Indicates whether variance arrays are resampled.

    Raises
    ------
    ValueError
        When ``output_model`` is `None` while ``accumulate`` is `True`,
        when a required keyword is missing, or when the shapes of the
        arrays are not consistent with the shape of the WCS/data.

    """
    if output_model is None:
        if accumulate:
            raise ValueError(
                "'output_model' must be defined when 'accumulate' is True."
            )
        return

    required_attributes = self.output_model_attributes(
        accumulate=accumulate,
        enable_ctx=enable_ctx,
        enable_var=enable_var,
        # 'compute_err' is a required argument of
        # 'output_model_attributes'; use the value stored by __init__.
        compute_err=getattr(self, "_compute_err", None),
    )

    # sorted() makes the reported missing keyword deterministic
    for attr in sorted(required_attributes):
        if attr not in output_model:
            raise ValueError(
                f"'output_model' dictionary must have '{attr}' set."
            )

    model_wcs = output_model["wcs"]
    self.check_output_wcs(model_wcs, estimate_output_shape=False)
    wcs_shape = model_wcs.array_shape
    if accumulate and wcs_shape is None:
        raise ValueError(
            "Output model's 'wcs' must have 'array_shape' attribute "
            "set when 'accumulate' parameter is True."
        )

    data = output_model["data"]
    if data is None:
        # an output model may carry no data array (only its WCS is used);
        # fall back to the WCS shape as the reference
        ref_shape = wcs_shape
    else:
        ref_shape = data.shape
        # compare shapes as tuples: np.array_equiv() broadcasts and would
        # accept e.g. (3,) as "consistent" with (3, 3)
        if wcs_shape is None or tuple(wcs_shape) != tuple(ref_shape):
            raise ValueError(
                "Output model's 'wcs.array_shape' value is not consistent "
                "with the shape of the data array."
            )

    if ref_shape is None:
        # nothing to compare the remaining arrays against
        return

    ref_shape = tuple(ref_shape)
    for attr in sorted(required_attributes.difference(["data", "wcs"])):
        value = output_model[attr]
        if isinstance(value, np.ndarray) and value.shape != ref_shape:
            raise ValueError(
                "'output_wcs.array_shape' value is not consistent "
                f"with the shape of the '{attr}' array."
            )

    # TODO: also check "pixfrac", "kernel", "fillval", "weight_type"
    # with initializer parameters. log a warning if different.
def _get_intensity_scale(self, model):
    """
    Compute an intensity scale from the input and output pixel area.

    For imaging data, the scaling is used to account for differences
    between the nominal pixel area and the average pixel area for
    the input data.

    For spectral data, the scaling is used to account for flux
    conservation with non-unity pixel scale ratios, when the
    data units are flux density.

    As a side effect, the first time the pixel area of an imaging model
    is computed, the pixel scale ratio (output pixel scale divided by the
    input pixel scale) is stored on the instance and, if not yet set,
    in the ``"pixel_scale_ratio"`` entry of the output model.

    Parameters
    ----------
    model : dict
        The input data model. The keys read here are
        ``"pixelarea_steradians"``, ``"wcs"``, ``"data"`` and, depending
        on the branch taken, ``"bunit_data"`` and ``"filename"``.

    Returns
    -------
    iscale : float
        The scale to apply to the input data before drizzling. It is 1.0
        when the model's ``"pixelarea_steradians"`` is not set (falsy).

    Raises
    ------
    ValueError
        When the pixel area cannot be computed from the WCS of an
        imaging model.

    """
    input_pixflux_area = model["pixelarea_steradians"]
    wcs = model["wcs"]

    if input_pixflux_area:
        if 'SPECTRAL' in wcs.output_frame.axes_type:
            # Use the nominal area as is
            input_pixel_area = input_pixflux_area

            # If input image is in flux density units, correct the
            # flux for the user-specified change to the spatial dimension
            # NOTE(review): '_is_flux_density' and 'self.pscale_ratio' are
            # not defined in the visible part of this file; the rest of
            # the class uses 'self._pixel_scale_ratio' -- confirm that
            # both names exist, otherwise this branch raises.
            if _is_flux_density(model["bunit_data"]):
                input_pixel_area *= self.pscale_ratio
        else:
            input_pixel_area = compute_wcs_pixel_area(
                wcs,
                shape=model["data"].shape
            )
            if input_pixel_area is None:
                # NOTE(review): "filename" is not among the keys checked
                # by 'validate_input_model' -- a model without it would
                # raise KeyError here instead of the ValueError below.
                model_name = model["filename"]
                if not model_name:
                    model_name = "Unknown"
                raise ValueError(
                    "Unable to compute input pixel area from WCS of input "
                    f"image {repr(model_name)}."
                )

            if self._pixel_scale_ratio is None:
                # pixel scale in arcsec: the square root of the pixel area
                # converted from radians to degrees and then to arcsec
                input_pscale = 3600.0 * np.rad2deg(
                    math.sqrt(input_pixel_area)
                )

                self._pixel_scale_ratio = (
                    self._output_pixel_scale / input_pscale
                )

                # update output model if "pixel_scale_ratio" was never
                # set previously:
                if (self._output_model is not None and
                        self._output_model["pixel_scale_ratio"] is None):
                    self._output_model["pixel_scale_ratio"] = self._pixel_scale_ratio

        iscale = math.sqrt(input_pixflux_area / input_pixel_area)

    else:
        iscale = 1.0

    return iscale
def validate_input_model(self, model):
    """ Verify that ``model`` provides every key needed for processing.

    The list of required keys depends on the settings stored on the
    `Resample` object at initialization: variance arrays are required when
    variance resampling is enabled, the error array is required when
    errors are drizzled, and the read-noise variance is required for
    "ivm" weighting even when variance resampling is disabled.

    Parameters
    ----------
    model : dict
        A dictionary containing data arrays and other meta attributes
        and values of actual models used by pipelines.

    Raises
    ------
    KeyError
        A `KeyError` is raised when ``model`` does not have a required
        keyword.

    """
    # TODO: do we need this to just raise a custom
    assert isinstance(model, dict)

    required_keys = [
        # arrays:
        "data", "dq",
        # meta:
        "group_id", "s_region", "wcs",
        # timing:
        "exposure_time", "start_time", "end_time", "duration",
        "measurement_time", "effective_exposure_time",
        "elapsed_exposure_time",
        # pixel area ("pixelarea_arcsecsq" is not required):
        "pixelarea_steradians",
        # sky level and whether it was already subtracted:
        "level", "subtracted",
    ]

    if self._enable_var:
        required_keys.extend(("var_rnoise", "var_poisson", "var_flat"))
    elif (self.weight_type is not None and
            self.weight_type.startswith('ivm')):
        ivm_needs_rnoise = True
    else:
        ivm_needs_rnoise = False

    if self._compute_err == "driz_err":
        required_keys.append("err")

    # keep the original ordering: "var_rnoise" for ivm weighting comes last
    if not self._enable_var and ivm_needs_rnoise:
        required_keys.append("var_rnoise")

    first_missing = next(
        (key for key in required_keys if key not in model),
        None,
    )
    if first_missing is not None:
        raise KeyError(
            f"Attempt to access non-existent key '{first_missing}' "
            "in a data model."
        )
+ ) + self.validate_input_model(model) + self._n_res_models += 1 + + data = model["data"] + wcs = model["wcs"] + + # Check that input models are 2D images + if data.ndim != 2: + raise RuntimeError( + f"Input model '{model['filename']}' is not a 2D image." + ) + + self._output_model["n_coadds"] += 1 + + if (group_id := model["group_id"]) not in self._group_ids: + self.update_time(model) + self._group_ids.append(group_id) + self.output_model["pointings"] += 1 + + iscale = self._get_intensity_scale(model) + log.debug(f'Using intensity scale iscale={iscale}') + + pixmap = calc_pixmap( + wcs, + self.output_model["wcs"], + data.shape, + ) + + log.info("Resampling science and variance data") + + weight = self.build_driz_weight( + model, + weight_type=self.weight_type, + good_bits=self.good_bits, + ) + + # apply sky subtraction + blevel = model["level"] + if not model["subtracted"] and blevel is not None: + data = data - blevel + # self._output_model["subtracted"] = True + + xmin, xmax, ymin, ymax = resample_range( + data.shape, + wcs.bounding_box + ) + + add_image_kwargs = { + 'exptime': model["exposure_time"], + 'pixmap': pixmap, + 'scale': iscale, + 'weight_map': weight, + 'wht_scale': 1.0, # hard-coded for JWST count-rate data + 'pixfrac': self.pixfrac, + 'in_units': 'cps', # TODO: get units from data model + 'xmin': xmin, + 'xmax': xmax, + 'ymin': ymin, + 'ymax': ymax, + } + + self._driz.add_image(data, **add_image_kwargs) + + if self._compute_err == "driz_err": + self._driz_error.add_image(model["err"], **add_image_kwargs) + + if self._enable_var: + self.resample_variance_arrays(model, pixmap, iscale, weight, + xmin, xmax, ymin, ymax) + + # update output model (variance is too expensive so it's omitted) + self._output_model["data"] = self._driz.out_img + self._output_model["wht"] = self._driz.out_wht + if self._driz.out_ctx is not None: + self._output_model["con"] = self._driz.out_ctx + + if self._compute_err == "driz_err": + # use resampled error + 
self.output_model["err"] = self._driz_error.out_img + + def finalize(self, free_memory=True): + """ Finalizes all computations and frees temporary objects. + + ``finalize`` calls :py:meth:`~Resample.finalize_resample_variance` and + :py:meth:`~Resample.finalize_time_info`. + + .. warning:: + If ``enable_var=True`` and :py:meth:`~Resample.finalize` is called + with ``free_memory=True`` then intermediate arrays holding variance + weights will be lost and so continuing adding new models after + a call to :py:meth:`~Resample.finalize` will result in incorrect + variance. + + """ + if self._finalized: + # can't finalize twice + return + self._finalized = free_memory + + self._output_model["pointings"] = len(self.group_ids) + + # assign resampled arrays to the output model dictionary: + self._output_model["data"] = self._driz.out_img + self._output_model["wht"] = self._driz.out_wht + if self._driz.out_ctx is not None: + # Since the context array is dynamic, it must be re-assigned + # back to the product's `con` attribute. 
def resample_variance_arrays(self, model, pixmap, iscale,
                             weight_map, xmin, xmax, ymin, ymax):
    """ Resample and co-add variance arrays using appropriate weights
    and update total weights.

    The read-noise variance is resampled first because it may be needed to
    build inverse-variance weights. Each available variance component
    (``var_rnoise``, ``var_poisson``, ``var_flat``) is then resampled and
    added, weighted by ``weight**2``, to its running sum
    (``self._<name>_wsum``); the weights themselves are accumulated in
    ``self._<name>_weight``.

    Parameters
    ----------
    model : dict
        A dictionary containing data arrays and other meta attributes
        and values of actual models used by pipelines.

    pixmap : 3D array
        A mapping from input image (``data``) coordinates to resampled
        (``out_img``) coordinates, of shape ``(Ny, Nx, 2)``.

    iscale : float
        The scale to apply to the input variance data before drizzling.

    weight_map : 2D array, None
        Pixel-by-pixel weighting passed to the drizzle step.

    xmin, xmax, ymin, ymax : float
        Bounding rectangle on the input image; forwarded unchanged to
        ``_resample_one_variance_array``.

    Notes
    -----
    When no usable read-noise variance is available, or when
    ``weight_type`` is neither an ``"ivm"`` variant nor ``"exptime"``,
    uniform weights of 1 are used so that the Poisson and flat variances
    can still be co-added (previously this raised because ``weight`` was
    never assigned).

    """
    pars = {
        'pixmap': pixmap,
        'iscale': iscale,
        'weight_map': weight_map,
        'xmin': xmin,
        'xmax': xmax,
        'ymin': ymin,
        'ymax': ymax,
    }
    shape = self.output_array_shape

    # Do the read noise variance first, so it can be
    # used for weights if needed
    rn_var = None
    if self._check_var_array(model, "var_rnoise"):
        rn_var = self._resample_one_variance_array(
            "var_rnoise",
            model=model,
            **pars,
        )

    # Set the weight for the image from the weight type. Always end up
    # with a defined weight array, whatever inputs are available.
    weight_type = self.weight_type or ""
    if weight_type == "exptime":
        t, _ = get_tmeasure(model)
        weight = np.full(shape, t)
    else:
        weight = np.ones(shape)
        if weight_type.startswith("ivm") and rn_var is not None:
            # only strictly positive, finite variances can be inverted
            valid = (rn_var > 0) & np.isfinite(rn_var)
            weight[valid] = np.reciprocal(rn_var[valid])

    for noise_type in ("var_rnoise", "var_poisson", "var_flat"):
        if noise_type == "var_rnoise":
            var = rn_var
        elif self._check_var_array(model, noise_type):
            var = self._resample_one_variance_array(
                noise_type,
                model=model,
                **pars,
            )
        else:
            var = None

        if var is None:
            continue

        # Update only pixels (in the running sum) with valid new values
        # (zero is a valid value; negative, inf, or NaN are not).
        mask = (var >= 0) & np.isfinite(var) & (weight > 0)
        wsum = getattr(self, f"_{noise_type}_wsum")
        total_weight = getattr(self, f"_{noise_type}_weight")

        # Note: floating point overflow is an issue if variance weights
        # are used - the weight can't be squared before multiplication
        wsum[mask] = np.nansum(
            [
                wsum[mask],
                var[mask] * weight[mask] * weight[mask]
            ],
            axis=0
        )
        total_weight[mask] += weight[mask]
+ with warnings.catch_warnings(): + warnings.filterwarnings("ignore", "invalid value*", RuntimeWarning) + warnings.filterwarnings("ignore", "divide by zero*", RuntimeWarning) + + output_variance = ( + self._var_rnoise_wsum / self._var_rnoise_weight / + self._var_rnoise_weight + ).astype( + dtype=self.output_array_types["var_rnoise"] + ) + output_model["var_rnoise"] = output_variance + + output_variance = ( + self._var_poisson_wsum / self._var_poisson_weight / + self._var_poisson_weight + ).astype( + dtype=self.output_array_types["var_poisson"] + ) + output_model["var_poisson"] = output_variance + + output_variance = ( + self._var_flat_wsum / self._var_flat_weight / + self._var_flat_weight + ).astype( + dtype=self.output_array_types["var_flat"] + ) + output_model["var_flat"] = output_variance + + if free_memory: + self._finalized = True + del ( + self._var_rnoise_wsum, + self._var_poisson_wsum, + self._var_flat_wsum, + self._var_rnoise_weight, + self._var_poisson_weight, + self._var_flat_weight, + ) + + def _resample_one_variance_array(self, name, model, iscale, + weight_map, pixmap, + xmin=None, xmax=None, ymin=None, + ymax=None): + """Resample one variance image from an input model. + + The error image is passed to drizzle instead of the variance, to + better match kernel overlap and user weights to the data, in the + pixel averaging process. The drizzled error image is squared before + returning. + """ + variance = model.get(name) + if variance is None or variance.size == 0: + log.debug( + f"No data for '{name}' for model " + f"{repr(model['filename'])}. Skipping ..." + ) + return + + elif variance.shape != model["data"].shape: + log.warning( + f"Data shape mismatch for '{name}' for model " + f"{repr(model['filename'])}. Skipping ..." + ) + return + + output_shape = self.output_array_shape + + # Resample the error array. Fill "unpopulated" pixels with NaNs. 
+ driz = Drizzle( + out_shape=output_shape, + kernel=self.kernel, + fillval=np.nan, + disable_ctx=True + ) + + # Call 'drizzle' to perform image combination + log.info(f"Drizzling {variance.shape} --> {output_shape}") + + driz.add_image( + data=np.sqrt(variance), + exptime=model["exposure_time"], + pixmap=pixmap, + scale=iscale, + weight_map=weight_map, + wht_scale=1.0, # hard-coded for JWST count-rate data + pixfrac=self.pixfrac, + in_units="cps", # TODO: get units from data model + xmin=xmin, + xmax=xmax, + ymin=ymin, + ymax=ymax, + ) + + return driz.out_img ** 2 + + def build_driz_weight(self, model, weight_type=None, good_bits=None): + """ Create a weight map for use by drizzle. + + Parameters + ---------- + wht_type : {"exptime", "ivm"}, optional + The weighting type for adding models' data. For ``wht_type="ivm"`` + (the default), the weighting will be determined per-pixel using + the inverse of the read noise (VAR_RNOISE) array stored in each + input image. If the ``VAR_RNOISE`` array does not exist, + the variance is set to 1 for all pixels (i.e., equal weighting). + If ``weight_type="exptime"``, the weight will be set equal + to the measurement time (``TMEASURE``) when available and to + the exposure time (``EFFEXPTM``) otherwise. + + good_bits : int, str, None, optional + An integer bit mask, `None`, a Python list of bit flags, a comma-, + or ``'|'``-separated, ``'+'``-separated string list of integer + bit flags or mnemonic flag names that indicate what bits in models' + DQ bitfield array should be *ignored* (i.e., zeroed). 
+ + See `Resample` for more information + + """ + data = model["data"] + dq = model["dq"] + + dqmask = bitfield_to_boolean_mask( + dq, + good_bits, + good_mask_value=1, + dtype=np.uint8, + flag_name_map=self.dq_flag_name_map, + ) + + if weight_type and weight_type.startswith('ivm'): + weight_type = weight_type.strip() + selective_median = weight_type.startswith('ivm-smed') + bitvalue = interpret_bit_flags( + good_bits, + flag_name_map=self.dq_flag_name_map + ) + if bitvalue is None: + bitvalue = 0 + + # disable selective median if SATURATED flag is included + # in good_bits: + try: + saturation = self.dq_flag_name_map["SATURATED"] + if selective_median and not (bitvalue & saturation): + selective_median = False + weight_type = 'ivm' + except AttributeError: + pass + + var_rnoise = model["var_rnoise"] + if (var_rnoise is not None and var_rnoise.shape == data.shape): + with np.errstate(divide="ignore", invalid="ignore"): + inv_variance = var_rnoise**-1 + + inv_variance[~np.isfinite(inv_variance)] = 1 + + if weight_type != 'ivm': + ny, nx = data.shape + + # apply a median filter to smooth the weight at saturated + # (or high read-out noise) single pixels. keep kernel size + # small to still give lower weight to extended CRs, etc. + ksz = weight_type[8 if selective_median else 7:] + if ksz: + kernel_size = int(ksz) + if not (kernel_size % 2): + raise ValueError( + 'Kernel size of the median filter in IVM ' + 'weighting must be an odd integer.' 
def init_time_counters(self):
    """ Initialize variables/arrays needed to process exposure time.

    The running totals are seeded from the current output model so that,
    when adding to an existing co-add, previously accumulated times are
    preserved. Totals stored as `None` in the output model are treated
    as 0 so that they can be incremented later.

    Sets ``_total_exposure_time``, ``_duration``,
    ``_total_measurement_time``, ``_exptime_start``, ``_exptime_end`` and
    ``_measurement_time_success``.

    """
    output_model = self.output_model

    def _zero_if_none(value):
        return 0.0 if value is None else value

    self._total_exposure_time = _zero_if_none(output_model["exposure_time"])
    self._duration = _zero_if_none(output_model["duration"])
    self._total_measurement_time = _zero_if_none(
        output_model["measurement_time"]
    )

    # Start/end times are kept as lists so that the final values can be
    # computed with min()/max() over all contributing exposures.
    start_time = output_model.get("start_time", None)
    self._exptime_start = [] if start_time is None else [start_time]

    end_time = output_model.get("end_time", None)
    self._exptime_end = [] if end_time is None else [end_time]

    self._measurement_time_success = []
+ + """ + assert self._n_res_models + # basic exposure time attributes: + self._output_model["exposure_time"] = self._total_exposure_time + self._output_model["start_time"] = min(self._exptime_start) + self._output_model["end_time"] = max(self._exptime_end) + # Update other exposure time keywords: + # XPOSURE (identical to the total effective exposure time,EFFEXPTM) + self._output_model["effective_exposure_time"] = self._total_exposure_time + # DURATION (identical to TELAPSE, elapsed time) + self._output_model["duration"] = self._duration + self._output_model["elapsed_exposure_time"] = self._duration + + if all(self._measurement_time_success): + self._output_model["measurement_time"] = self._total_measurement_time + + def _check_var_array(self, model, array_name): + """ Check that a variance array has the same shape as the model's + data array. + + """ + array_data = model.get(array_name, None) + sci_data = model["data"] + model_name = _get_model_name(model) + + if array_data is None or array_data.size == 0: + log.debug( + f"No data for '{array_name}' for model " + f"{repr(model_name)}. Skipping ..." + ) + return False + + elif array_data.shape != sci_data.shape: + log.warning( + f"Data shape mismatch for '{array_name}' for model " + f"{repr(model_name)}. Skipping ..." + ) + return False + + return True + + +def _get_model_name(model): + model_name = model.get("filename") + if model_name is None or not model_name.strip(): + model_name = "Unknown" + return model_name + + +def _is_flux_density(bunit): + """ + Differentiate between surface brightness and flux density data units. + + Parameters + ---------- + bunit : str or `~astropy.units.Unit` + Data units, e.g. 'MJy' (is flux density) or 'MJy/sr' (is not). + + Returns + ------- + bool + True if the units are equivalent to flux density units. 
def resample_range(data_shape, bbox=None):
    """ Find the range of input pixels to resample.

    Parameters
    ----------
    data_shape : tuple of int
        Shape of the input image, indexed as ``(ny, nx)``.

    bbox : tuple, None, optional
        Bounding box given as ``((x1, x2), (y1, y2))``. When `None`, the
        whole image is used.

    Returns
    -------
    xmin, xmax, ymin, ymax : int
        Inclusive pixel index limits. With a bounding box, each limit is
        ``int(value + 0.5)`` clipped to the image: lower limits are not
        less than 0 and upper limits do not exceed the last pixel index.

    """
    if bbox is None:
        return 0, data_shape[1] - 1, 0, data_shape[0] - 1

    (x_lo, x_hi), (y_lo, y_hi) = bbox

    col_start = max(0, int(x_lo + 0.5))
    row_start = max(0, int(y_lo + 0.5))
    col_stop = min(data_shape[1] - 1, int(x_hi + 0.5))
    row_stop = min(data_shape[0] - 1, int(y_hi + 0.5))

    return col_start, col_stop, row_start, row_stop
def build_mask(dqarr, bitvalue, flag_name_map=None):
    """Build a bit mask from an input DQ array and a bitvalue flag

    In the returned bit mask, 1 is good, 0 is bad

    Parameters
    ----------
    dqarr : numpy.ndarray
        Integer data-quality bit-field array.

    bitvalue : int, str, list, None
        Specification of the bits to be ignored when deciding whether a
        pixel is good; interpreted with
        `~astropy.nddata.bitmask.interpret_bit_flags`. `None` means that
        all pixels are good.

    flag_name_map : optional
        Passed through to ``interpret_bit_flags``.

    Returns
    -------
    numpy.ndarray
        ``uint8`` array with the shape of ``dqarr``.

    """
    bitvalue = interpret_bit_flags(bitvalue, flag_name_map=flag_name_map)

    if bitvalue is None:
        return np.ones(dqarr.shape, dtype=np.uint8)

    # Invert the flags in the DQ array's own dtype: ``~`` applied to a
    # Python int yields a negative number, which cannot be combined with
    # unsigned DQ arrays under NumPy 2 promotion rules.
    bitvalue = np.array(bitvalue).astype(dqarr.dtype)
    return np.logical_not(np.bitwise_and(dqarr, ~bitvalue)).astype(np.uint8)
def bytes2human(n):
    """Convert bytes to human-readable format

    Taken from the `psutil` library which references
    http://code.activestate.com/recipes/578019

    Parameters
    ----------
    n : int
        Number to convert

    Returns
    -------
    readable : str
        A string with units attached. Values below 1024 are returned
        unscaled with a ``B`` suffix; larger values are divided by the
        largest power of 1024 that does not exceed them and shown with
        one decimal.

    Examples
    --------
    >>> bytes2human(10000)
    '9.8K'

    >>> bytes2human(100001221)
    '95.4M'
    """
    symbols = ('K', 'M', 'G', 'T', 'P', 'E', 'Z', 'Y')
    # walk from the largest unit down so the first match is the best fit
    for exponent in range(len(symbols), 0, -1):
        threshold = 1 << (exponent * 10)
        if n >= threshold:
            return f"{float(n) / threshold:.1f}{symbols[exponent - 1]}"
    return f"{n}B"
+ ) + + valid_polygon = False + spatial_idx = np.where( + np.array(wcs.output_frame.axes_type) == 'SPATIAL' + )[0] + + ny, nx = shape + + if wcs.bounding_box is None: + ((xmin, xmax), (ymin, ymax)) = ((-0.5, nx - 0.5), (-0.5, ny - 0.5)) + else: + ((xmin, xmax), (ymin, ymax)) = wcs.bounding_box + + xmin = max(0, int(xmin + 0.5)) + xmax = min(nx - 1, int(xmax - 0.5)) + ymin = max(0, int(ymin + 0.5)) + ymax = min(ny - 1, int(ymax - 0.5)) + if xmin > xmax: + (xmin, xmax) = (xmax, xmin) + if ymin > ymax: + (ymin, ymax) = (ymax, ymin) + + k = 0 + dxy = [1, -1, -1, 1] + + while xmin < xmax and ymin < ymax: + try: + (x, y, image_area, center, b, r, t, l) = _get_boundary_points( + xmin=xmin, + xmax=xmax, + ymin=ymin, + ymax=ymax, + dx=min((xmax - xmin) // 4, 15), + dy=min((ymax - ymin) // 4, 15) + ) + except ValueError: + return None + + world = wcs(x, y) + ra = world[spatial_idx[0]] + dec = world[spatial_idx[1]] + + limits = [ymin, xmax, ymax, xmin] + + for j in range(4): + sl = [b, r, t, l][k] + if not (np.all(np.isfinite(ra[sl])) and + np.all(np.isfinite(dec[sl]))): + limits[k] += dxy[k] + ymin, xmax, ymax, xmin = limits + k = (k + 1) % 4 + break + k = (k + 1) % 4 + else: + valid_polygon = True + break + + ymin, xmax, ymax, xmin = limits + + if not valid_polygon: + return None + + world = wcs(*center) + wcenter = (world[spatial_idx[0]], world[spatial_idx[1]]) + + sky_area = SphericalPolygon.from_radec(ra, dec, center=wcenter).area() + if sky_area > 2 * np.pi: + log.warning( + "Unexpectedly large computed sky area for an image. 
" + "Setting area to: 4*Pi - area" + ) + sky_area = 4 * np.pi - sky_area + pix_area = sky_area / image_area + + return pix_area + + +def _get_boundary_points(xmin, xmax, ymin, ymax, dx=None, dy=None, + shrink=0): # noqa: E741 + """ + xmin, xmax, ymin, ymax - integer coordinates of pixel boundaries + step - distance between points along an edge + shrink - number of pixels by which to reduce `shape` + + Returns a list of points and the area of the rectangle + """ + nx = xmax - xmin + 1 + ny = ymax - ymin + 1 + + if dx is None: + dx = nx + if dy is None: + dy = ny + + if nx - 2 * shrink < 1 or ny - 2 * shrink < 1: + raise ValueError("Image size is too small.") + + sx = max(1, int(np.ceil(nx / dx))) + sy = max(1, int(np.ceil(ny / dy))) + + xmin += shrink + xmax -= shrink + ymin += shrink + ymax -= shrink + + size = 2 * sx + 2 * sy + x = np.empty(size) + y = np.empty(size) + + b = np.s_[0:sx] # bottom edge + r = np.s_[sx:sx + sy] # right edge + t = np.s_[sx + sy:2 * sx + sy] # top edge + l = np.s_[2 * sx + sy:2 * sx + 2 * sy] # noqa: E741 left edge + + x[b] = np.linspace(xmin, xmax, sx, False) + y[b] = ymin + x[r] = xmax + y[r] = np.linspace(ymin, ymax, sy, False) + x[t] = np.linspace(xmax, xmin, sx, False) + y[t] = ymax + x[l] = xmin + y[l] = np.linspace(ymax, ymin, sy, False) + + area = (xmax - xmin) * (ymax - ymin) + center = (0.5 * (xmin + xmax), 0.5 * (ymin + ymax)) + + return x, y, area, center, b, r, t, l From 47a2a93749cf434707f714861c0557a3483f81fd Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Wed, 27 Nov 2024 16:21:27 -0500 Subject: [PATCH 02/13] remove unused imports --- src/stcal/resample/resample.py | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index b9891d3d..8b3602a1 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -2,14 +2,11 @@ import math import os import warnings -import json -import abc -from copy import deepcopy import sys 
import numpy as np -from scipy.ndimage import median_filter import psutil +from scipy.ndimage import median_filter from astropy import units as u from astropy.nddata.bitmask import ( From 669bb30473e4fe868362b4f8ead93adc6d47f219 Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Wed, 27 Nov 2024 16:27:13 -0500 Subject: [PATCH 03/13] remove available memory check --- src/stcal/resample/resample.py | 96 +--------------------------------- 1 file changed, 1 insertion(+), 95 deletions(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index 8b3602a1..bb402eae 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -1,11 +1,9 @@ import logging import math -import os import warnings import sys import numpy as np -import psutil from scipy.ndimage import median_filter from astropy import units as u @@ -15,11 +13,9 @@ ) from drizzle.utils import calc_pixmap from drizzle.resample import Drizzle -from stdatamodels.jwst.library.basic_utils import bytes2human from stcal.resample.utils import ( - bytes2human, compute_wcs_pixel_area, get_tmeasure, resample_range, @@ -84,8 +80,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", fillval=0.0, wht_type="ivm", good_bits=0, output_wcs=None, output_model=None, accumulate=False, enable_ctx=True, enable_var=True, - compute_err=None, - allowed_memory=None): + compute_err=None): """ Parameters ---------- @@ -238,18 +233,12 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", At this time, output error array is not equivalent to error propagation results. - allowed_memory : float, None - Fraction of memory allowed to be used for resampling. If - ``allowed_memory`` is `None` then no check for available memory - will be performed. 
- """ # to see if setting up arrays and drizzle is needed self._finalized = False self._n_res_models = 0 self._n_predicted_input_models = n_input_models - self.allowed_memory = allowed_memory self._output_model = output_model self._create_new_output_model = output_model is not None @@ -435,79 +424,6 @@ def output_model_attributes(cls, accumulate, enable_ctx, enable_var, return attributes - def check_memory_requirements(self, output_model, allowed_memory, - n_input_models=None): - """ Called just before `create_output_model` returns to verify - that there is enough memory to hold the output. - - Parameters - ---------- - allowed_memory : float, None - Fraction of memory allowed to be used for resampling. If - - output_model : dict, None, optional - A dictionary containing data arrays and other attributes that - will be used to add new models to. use - :py:meth:`Resample.output_model_attributes` to get the list of - keywords that must be present. When ``accumulate`` is `False`, - only the WCS object of the model will be used. When ``accumulate`` - is `True`, new models will be added to the existing data in the - ``output_model``. - - When ``output_model`` is `None`, a new model will be created. - - n_input_models : int, None, optional - Number of input models expected to be resampled. When provided, - this is used to estimate memory requirements and optimize memory - allocation for the context array. 
- - - """ - if ((allowed_memory is None and - "DMODEL_ALLOWED_MEMORY" not in os.environ) or - n_input_models is None): - return - - allowed_memory = float(allowed_memory) - - # get the available memory - available_memory = ( - psutil.virtual_memory().available + psutil.swap_memory().total - ) - - # compute the output array size - npix = np.prod(self._output_array_shape) - nconpl = n_input_models // 32 + (1 if n_input_models % 32 else 0) # context planes - required_memory = 0 - for arr in self.output_array_types: - if arr in output_model: - if arr == "con": - f = nconpl - elif arr == "err": - if self._compute_err == "from_var": - f = 2 # data and weight arrays - elif self._compute_err == "driz_err": - f = 1 - elif arr.startswith("var"): - f = 3 # variance data, weight, and total arrays - else: - f = 1 - - required_memory += f * self.output_array_types[arr].itemsize - - # add pixmap itemsize: - required_memory += 2 * np.dtype(float).itemsize - required_memory *= npix - - # compare used to available - used_fraction = required_memory / available_memory - if used_fraction > allowed_memory: - raise OutputTooLargeError( - f'Combined ImageModel size {self._output_wcs.array_shape} ' - f'requires {bytes2human(required_memory)}. ' - f'Model cannot be instantiated.' - ) - def check_output_wcs(self, output_wcs, estimate_output_shape=True): """ Check that provided WCS has expected properties and that its @@ -607,9 +523,6 @@ def validate_output_model(self, output_model, accumulate, def create_output_model(self): """ Create a new "output model": a dictionary of data and meta fields. - Check that there is enough memory to hold all arrays by calling - `check_memory_requirements`. 
- """ assert self._output_wcs is not None assert np.array_equiv( @@ -672,13 +585,6 @@ def create_output_model(self): if self._compute_err is not None: output_model["err"] = None - if self.allowed_memory: - self.check_memory_requirements( - output_model, - self.allowed_memory, - n_input_models=self._n_predicted_input_models, - ) - return output_model @property From c5f378ae8aa9c0216810ee15dd687b3a54f4588b Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Tue, 3 Dec 2024 11:41:24 -0500 Subject: [PATCH 04/13] Changes to accomodate outlier detection and spec in jwst --- changes/320.apichange.rst | 1 + src/stcal/resample/resample.py | 45 +++++++++++++++++++++++++++++++--- 2 files changed, 43 insertions(+), 3 deletions(-) create mode 100644 changes/320.apichange.rst diff --git a/changes/320.apichange.rst b/changes/320.apichange.rst new file mode 100644 index 00000000..caaf8bd9 --- /dev/null +++ b/changes/320.apichange.rst @@ -0,0 +1 @@ +Added ``resample`` submodule. diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index bb402eae..87318bfe 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -440,6 +440,14 @@ def check_output_wcs(self, output_wcs, estimate_output_shape=True): """ naxes = output_wcs.output_frame.naxes + if 'SPECTRAL' in output_wcs.output_frame.axes_type: + if naxes != 3: + raise UnsupportedWCSError( + "Output spectral WCS needs 3 coordinate axes but the " + f"supplied WCS has {naxes} axes." + ) + return + if naxes != 2: raise UnsupportedWCSError( "Output WCS needs 2 coordinate axes but the " @@ -599,10 +607,38 @@ def output_array_shape(self): def output_wcs(self): return self._output_wcs + @property + def pixel_scale_ratio(self): + return self._pixel_scale_ratio + + @property + def output_pixel_scale(self): + return self._output_pixel_scale # in arcsec + @property def group_ids(self): return self._group_ids + @property + def enable_ctx(self): + """ Indicates whether context array is enabled. 
""" + return self._enable_ctx + + @property + def enable_var(self): + """ Indicates whether variance arrays are resampled. """ + return self._enable_var + + @property + def compute_err(self): + """ Indicates whether error array is computed and how it is computed. """ + return self._compute_err + + @property + def is_in_accumulate_mode(self): + """ Indicates whether resample is continuing adding to previous co-adds. """ + return self._accumulate + def _get_intensity_scale(self, model): """ Compute an intensity scale from the input and output pixel area. @@ -637,7 +673,9 @@ def _get_intensity_scale(self, model): # If input image is in flux density units, correct the # flux for the user-specified change to the spatial dimension if _is_flux_density(model["bunit_data"]): - input_pixel_area *= self.pscale_ratio + iscale = 1.0 / math.sqrt(self.pixel_scale_ratio) + else: + iscale = 1.0 else: input_pixel_area = compute_wcs_pixel_area( wcs, @@ -667,7 +705,7 @@ def _get_intensity_scale(self, model): self._output_model["pixel_scale_ratio"] is None): self._output_model["pixel_scale_ratio"] = self._pixel_scale_ratio - iscale = math.sqrt(input_pixflux_area / input_pixel_area) + iscale = math.sqrt(input_pixflux_area / input_pixel_area) else: iscale = 1.0 @@ -971,8 +1009,9 @@ def finalize(self, free_memory=True): # set those values to NaN instead all_nan = np.all(np.isnan(var_components), axis=0) self._output_model["err"][all_nan] = np.nan + del all_nan - del var_components, all_nan + del var_components self._finalized = True From aa00c23218757485b32613acc2ae81cfe6027756 Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Tue, 3 Dec 2024 13:25:03 -0500 Subject: [PATCH 05/13] make code more robust --- src/stcal/resample/resample.py | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index 87318bfe..581a44e5 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -1445,12 
+1445,16 @@ def update_time(self, model): self._exptime_start.append(model["start_time"]) self._exptime_end.append(model["end_time"]) + if (exposure_time := model["exposure_time"]) is not None: + self._total_exposure_time += exposure_time + t, success = get_tmeasure(model) - self._total_exposure_time += model["exposure_time"] self._measurement_time_success.append(success) - self._total_measurement_time += t + if t is not None: + self._total_measurement_time += t - self._duration += model["duration"] + if (duration := model["duration"]) is not None: + self._duration += duration def finalize_time_info(self): """ Perform final computations for the total time and update relevant From 0bca7a35cb7498dfdd0829cb8ec65093ae425f1c Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Tue, 3 Dec 2024 13:42:41 -0500 Subject: [PATCH 06/13] fix type --- src/stcal/resample/resample.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index 581a44e5..7aef0092 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -74,7 +74,7 @@ class Resample: "err": np.float32, } - dq_flag_name_map = {} + dq_flag_name_map = {} # type: dict[str, int] def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", fillval=0.0, wht_type="ivm", good_bits=0, From b5844aa88b757d3e91b4b1c3af434a5618ea26ce Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Tue, 3 Dec 2024 14:07:23 -0500 Subject: [PATCH 07/13] fix imports --- pyproject.toml | 2 +- src/stcal/resample/utils.py | 1 - 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 1b2c79e9..42d00d37 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -14,7 +14,7 @@ classifiers = [ ] dependencies = [ "astropy >=5.0.4", - "drizzle>=1.15.0", + "drizzle>=2.0.0", "scipy >=1.7.2", "scikit-image>=0.19", "numpy >=1.21.2", diff --git a/src/stcal/resample/utils.py b/src/stcal/resample/utils.py index 
7175af4b..6968a817 100644 --- a/src/stcal/resample/utils.py +++ b/src/stcal/resample/utils.py @@ -1,6 +1,5 @@ from copy import deepcopy import logging -import math import asdf import numpy as np From 5079e69dba9dcc1aedede330e37e8994f1ce0d48 Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Thu, 12 Dec 2024 21:23:34 -0500 Subject: [PATCH 08/13] address reviewers' comments - part 1 --- src/stcal/resample/__init__.py | 2 -- src/stcal/resample/resample.py | 46 +++++++++++++++------------------- 2 files changed, 20 insertions(+), 28 deletions(-) diff --git a/src/stcal/resample/__init__.py b/src/stcal/resample/__init__.py index 7152f15c..545841f6 100644 --- a/src/stcal/resample/__init__.py +++ b/src/stcal/resample/__init__.py @@ -1,12 +1,10 @@ from .resample import ( - OutputTooLargeError, Resample, compute_wcs_pixel_area, UnsupportedWCSError, ) __all__ = [ - "OutputTooLargeError", "Resample", "compute_wcs_pixel_area", "UnsupportedWCSError", diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index 7aef0092..09cd178b 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -27,17 +27,12 @@ __all__ = [ "compute_wcs_pixel_area" - "OutputTooLargeError", "Resample", "resampled_wcs_from_models", "UnsupportedWCSError", ] -class OutputTooLargeError(RuntimeError): - """Raised when the output is too large for in-memory instantiation""" - - class UnsupportedWCSError(RuntimeError): """ Raised when provided output WCS has an unexpected number of axes or has an unsupported structure. 
@@ -77,7 +72,7 @@ class Resample: dq_flag_name_map = {} # type: dict[str, int] def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", - fillval=0.0, wht_type="ivm", good_bits=0, + fillval=0.0, weight_type="ivm", good_bits=0, output_wcs=None, output_model=None, accumulate=False, enable_ctx=True, enable_var=True, compute_err=None): @@ -116,15 +111,15 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", pixels with no contributions from input images will be set to this ``fillval`` value. - wht_type : {"exptime", "ivm"}, optional - The weighting type for adding models' data. For ``wht_type="ivm"`` - (the default), the weighting will be determined per-pixel using - the inverse of the read noise (VAR_RNOISE) array stored in each - input image. If the ``VAR_RNOISE`` array does not exist, - the variance is set to 1 for all pixels (i.e., equal weighting). - If ``weight_type="exptime"``, the weight will be set equal - to the measurement time (``TMEASURE``) when available and to - the exposure time (``EFFEXPTM``) otherwise. + weight_type : {"exptime", "ivm"}, optional + The weighting type for adding models' data. For + ``weight_type="ivm"`` (the default), the weighting will be + determined per-pixel using the inverse of the read noise + (VAR_RNOISE) array stored in each input image. If the + ``VAR_RNOISE`` array does not exist, the variance is set to 1 for + all pixels (i.e., equal weighting). If ``weight_type="exptime"``, + the weight will be set equal to the measurement time (``TMEASURE``) + when available and to the exposure time (``EFFEXPTM``) otherwise. 
good_bits : int, str, None, optional An integer bit mask, `None`, a Python list of bit flags, a comma-, @@ -247,7 +242,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", self._compute_err = compute_err self._accumulate = accumulate - # these are attributes that are used only for information purpose + # these attributes are used only for informational purposes # and are added to created the output_model only if they are # not already present there: self._pixel_scale_ratio = None @@ -259,8 +254,8 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", self.fillval = fillval self.good_bits = good_bits - if wht_type in ["ivm", "exptime"]: - self.weight_type = wht_type + if weight_type in ["ivm", "exptime"]: + self.weight_type = weight_type else: raise ValueError("Unexpected weight type: '{self.weight_type}'") @@ -269,12 +264,12 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", self.input_file_names = [] self._group_ids = [] - # determine output WCS and set-up output model if needed: + # determine output WCS and set up output model if needed: if output_model is None: if output_wcs is None: raise ValueError( "Output WCS must be provided either through the " - "'output_wcs' parameter or the 'ouput_model' parameter. " + "'output_wcs' parameter or the 'output_model' parameter. 
" ) else: if isinstance(output_wcs, dict): @@ -319,7 +314,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", self._output_array_shape = self._output_wcs.array_shape - # Check that the output data shape has no zero length dimensions + # Check that the output data shape has no zero-length dimensions npix = np.prod(self._output_array_shape) if not npix: raise ValueError( @@ -335,7 +330,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", f"Output mosaic size (nx, ny): {self._output_wcs.pixel_shape}" ) - # set up an empty (don't allocate arrays at this time) output model: + # set up an empty output model (don't allocate arrays at this time): if self._output_model is None: self._output_model = self.create_output_model() @@ -737,7 +732,7 @@ def reset_arrays(self, reset_output=True, n_input_models=None): """ self._n_predicted_input_models = n_input_models - # set up an empty (don't allocate arrays at this time) output model: + # set up an empty output model (don't allocate arrays at this time): if reset_output or getattr(self, "_output_model", None) is None: self._output_model = self.create_output_model() @@ -908,7 +903,6 @@ def add_model(self, model): blevel = model["level"] if not model["subtracted"] and blevel is not None: data = data - blevel - # self._output_model["subtracted"] = True xmin, xmax, ymin, ymax = resample_range( data.shape, @@ -1292,8 +1286,8 @@ def build_driz_weight(self, model, weight_type=None, good_bits=None): Parameters ---------- - wht_type : {"exptime", "ivm"}, optional - The weighting type for adding models' data. For ``wht_type="ivm"`` + weight_type : {"exptime", "ivm"}, optional + The weighting type for adding models' data. For ``weight_type="ivm"`` (the default), the weighting will be determined per-pixel using the inverse of the read noise (VAR_RNOISE) array stored in each input image. 
If the ``VAR_RNOISE`` array does not exist, From 06bd2fc74a719b82784b56555ebc8743b6444b0b Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Thu, 12 Dec 2024 21:24:59 -0500 Subject: [PATCH 09/13] Update src/stcal/resample/resample.py Co-authored-by: Ned Molter --- src/stcal/resample/resample.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index 09cd178b..e9a603f6 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -1231,8 +1231,8 @@ def _resample_one_variance_array(self, name, model, iscale, ymax=None): """Resample one variance image from an input model. - The error image is passed to drizzle instead of the variance, to - better match kernel overlap and user weights to the data, in the + The error image is passed to drizzle instead of the variance in order to + better match kernel overlap and user weights to the data during the pixel averaging process. The drizzled error image is squared before returning. """ From c86aee01bac82cf1658432c4ad88bda8a1fceef3 Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Thu, 12 Dec 2024 21:25:12 -0500 Subject: [PATCH 10/13] Update src/stcal/resample/resample.py Co-authored-by: Ned Molter --- src/stcal/resample/resample.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index e9a603f6..fa25fef2 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -837,12 +837,12 @@ def validate_input_model(self, model): ) def add_model(self, model): - """ Resamples model image and either variance data (if ``enable_var`` - was `True`) or error data (if ``enable_err`` was `True`) and adds - them using appropriate weighting to the corresponding - arrays of the output model. It also updates resampled data weight, - the context array (if ``enable_ctx`` is `True`), relevant output - model's values such as "n_coadds". 
+ """ Resamples model image, variance data (if ``enable_var`` + is `True`) , and error data (if ``enable_err`` is `True`), and adds + them to the corresponding + arrays of the output model using appropriate weighting. + It also updates the weight array and context array (if ``enable_ctx`` is `True`) + of the resampled data, as well as relevant metadata such as "n_coadds". Whenever ``model`` has a unique group ID that was never processed before, the "pointings" value of the output model is incremented and From 2b2dd3b78f52c4509d1bab4c26b1a1af06d78d7f Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Sun, 15 Dec 2024 05:51:56 -0500 Subject: [PATCH 11/13] add more docs --- docs/conf.py | 10 +- docs/stcal/package_index.rst | 1 + docs/stcal/resample/description.rst | 142 +++++++++++++++ docs/stcal/resample/index.rst | 19 ++ docs/stcal/resample/utils.rst | 10 ++ src/stcal/resample/__init__.py | 4 +- src/stcal/resample/resample.py | 270 +++++++++++++++++++++------- src/stcal/resample/utils.py | 144 ++++++++++++--- 8 files changed, 504 insertions(+), 96 deletions(-) create mode 100644 docs/stcal/resample/description.rst create mode 100644 docs/stcal/resample/index.rst create mode 100644 docs/stcal/resample/utils.rst diff --git a/docs/conf.py b/docs/conf.py index 53c05d50..659bc9c7 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -39,6 +39,10 @@ "gwcs": ("https://gwcs.readthedocs.io/en/latest/", None), "astropy": ("https://docs.astropy.org/en/stable/", None), "tweakwcs": ("https://tweakwcs.readthedocs.io/en/latest/", None), + "drizzle": ( + "https://spacetelescope-drizzle.readthedocs.io/en/latest/", + None + ), } nitpick_ignore = [("py:class", "optional"), ("py:class", "np.ndarray")] @@ -75,4 +79,8 @@ html_use_index = True # Enable nitpicky mode - which ensures that all references in the docs resolve. 
-nitpicky = True +nitpicky = False + +nitpick_ignore = [ + ('py:obj', 'type'), +] diff --git a/docs/stcal/package_index.rst b/docs/stcal/package_index.rst index e1db02b0..3d3e3ba2 100644 --- a/docs/stcal/package_index.rst +++ b/docs/stcal/package_index.rst @@ -9,3 +9,4 @@ Package Index alignment/index.rst tweakreg/index.rst outlier_detection/index.rst + resample/index.rst diff --git a/docs/stcal/resample/description.rst b/docs/stcal/resample/description.rst new file mode 100644 index 00000000..fd5c396f --- /dev/null +++ b/docs/stcal/resample/description.rst @@ -0,0 +1,142 @@ +Description +=========== + +:Classes: `stcal.resample.Resample` +:Alias: resample + +This routine will resample each input 2D image based on the WCS and +distortion information, and will combine multiple resampled images +into a single undistorted product. + +This step uses the interface to the C-based cdriz routine to do the +resampling via the drizzle method. The input-to-output pixel +mapping is determined via a mapping function derived from the +WCS of each input image and the WCS of the defined output product. +This mapping function gets passed to cdriz to drive the actual +drizzling to create the output product. + + +Error Propagation +----------------- + +The error associated with each resampled pixel can in principle be derived +from the variance components associated with each input pixel, weighted by +the square of the input user weights and the square of the overlap between +the input and output pixels. In practice, the ``cdriz`` routine does not +currently support propagating variance data alongside science images, so +the output error cannot be precisely calculated. + +To approximate the error on a resampled pixel, the variance arrays associated +with each input model are resampled individually, then combined with a weighted +sum. The process is: + +#. For each input model, take the square root of each of the read noise variance + array to make an error image. + +#. 
Drizzle the read noise error image onto the output WCS, with drizzle + parameters matching those used for the science data. + +#. Square the resampled read noise to make a variance array. + + a. If the resampling `weight_type` is an inverse variance map (`ivm`), weight + the resampled variance by the square of its own inverse. + + #. If the `weight_type` is the exposure time (`exptime`), weight the + resampled variance by the square of the exposure time for the image. + +#. Add the weighted, resampled read noise variance to a running sum across all + images. Add the weights (unsquared) to a separate running sum across + all images. + +#. Perform the same steps for the Poisson noise variance and the flat variance. + For these components, the weight for the sum is either the resampled read + noise variance or else the exposure time. + +#. For each variance component (read noise, Poisson, and flat), divide the + weighted variance sum by the total weight, squared. + +After each variance component is resampled and summed, the final error +array is computed as the square root of the sum of the three independent +variance components. This error image is stored in the ``err`` attribute +in the output data model. Alternatively, the error array of the resampled +image can be computed by resampling the error array associated with input +data. + +It is expected that the output errors computed in this way will +generally overestimate the true error on the resampled data. The magnitude +of the overestimation depends on the details of the pixel weights +and error images. Note, however, that drizzling error images produces +a much better estimate of the output error than directly drizzling +the variance images, since the kernel overlap weights do not need to be +squared for combining error values. + + +Context Image +------------- + +In addition to image data, the resample step also creates a "context image" stored +in the ``con`` attribute in the output data model.
Each pixel in the context +image is a bit field that encodes +information about which input image has contributed to the corresponding +pixel in the resampled data array. Context image uses 32 bit integers to encode +this information and hence it can keep track of only 32 input images. +First bit corresponds to the first input image, second bit corresponds to the +second input image, and so on. If the number of input images is larger than 32, +then it is necessary to have multiple context images ("planes") to hold +information about all input images +with the first plane encoding which of the first 32 images contributed +to the output data pixel, second plane representing next 32 input images +(number 33-64), etc. For this reason, context array is a 3D array of the type +`numpy.int32` and shape ``(np, ny, nx)`` where ``nx`` and ``ny`` +are dimensions of image's data. ``np`` is the number of "planes" equal to +``(number of input images - 1) // 32 + 1``. If a bit at position ``k`` in a +pixel with coordinates ``(p, y, x)`` is 0 then input image number +``32 * p + k`` (0-indexed) did not contribute to the output data pixel +with array coordinates ``(y, x)`` and if that bit is 1 then input image number +``32 * p + k`` did contribute to the pixel ``(y, x)`` in the resampled image. + +As an example, let's assume we have 8 input images. Then, when ``'CON'`` pixel +values are displayed using binary representation (and decimal in parentheses), +one could see values like this:: + + 00000001 (1) - only first input image contributed to this output pixel; + 00000010 (2) - 2nd input image contributed; + 00000100 (4) - 3rd input image contributed; + 10000000 (128) - 8th input image contributed; + 10000100 (132=128+4) - 3rd and 8th input images contributed; + 11001101 (205=1+4+8+64+128) - input images 1, 3, 4, 7, 8 have contributed + to this output pixel. + +In order to test if a specific input image contributed to an output pixel, +one needs to use bitwise operations.
Using the example above, to test whether +input images number 4 and 5 have contributed to the output pixel whose +corresponding ``'CON'`` value is 205 (11001101 in binary form) we can do +the following: + +>>> bool(205 & (1 << (5 - 1))) # (205 & 16) = 0 (== 0 => False): did NOT contribute +False +>>> bool(205 & (1 << (4 - 1))) # (205 & 8) = 8 (!= 0 => True): did contribute +True + +In general, to get a list of all input images that have contributed to an +output resampled pixel with image coordinates ``(x, y)``, and given a +context array ``con``, one can do something like this: + +.. doctest-skip:: + + >>> import numpy as np + >>> np.flatnonzero([v & (1 << k) for v in con[:, y, x] for k in range(32)]) + +For convenience, this functionality was implemented in the +:py:func:`~drizzle.utils.decode_context` function. + + +References +---------- + +A full description of the drizzling algorithm can be found in +`Fruchter and Hook, PASP 2002 `_. +A description of the inverse variance map method can be found in +`Casertano et al., AJ 2000 `_, see Appendix A2. +A description of the drizzle parameters and other useful drizzle-related +resources can be found at `DrizzlePac Handbook `_. diff --git a/docs/stcal/resample/index.rst b/docs/stcal/resample/index.rst new file mode 100644 index 00000000..6ff35c6e --- /dev/null +++ b/docs/stcal/resample/index.rst @@ -0,0 +1,19 @@ +.. _resample_module: + +======== +Resample +======== + +.. toctree:: + :maxdepth: 1 + + description.rst + +**Also See:** + +.. toctree:: + :maxdepth: 1 + + utils.rst + +.. 
automodapi:: stcal.resample diff --git a/docs/stcal/resample/utils.rst b/docs/stcal/resample/utils.rst new file mode 100644 index 00000000..af1f0a9a --- /dev/null +++ b/docs/stcal/resample/utils.rst @@ -0,0 +1,10 @@ +================= +Utility Functions +================= + +The ``utils`` module provides helpful functions for `Resample` such as creating image mask from model's DQ array, computing average pixel area, loading a custom WCS from an ASDF file, etc. + +.. currentmodule:: stcal.resample.utils + +.. automodapi:: stcal.resample.utils + :noindex: diff --git a/src/stcal/resample/__init__.py b/src/stcal/resample/__init__.py index 545841f6..9c717832 100644 --- a/src/stcal/resample/__init__.py +++ b/src/stcal/resample/__init__.py @@ -1,11 +1,11 @@ from .resample import ( Resample, - compute_wcs_pixel_area, + compute_mean_pixel_area, UnsupportedWCSError, ) __all__ = [ "Resample", - "compute_wcs_pixel_area", + "compute_mean_pixel_area", "UnsupportedWCSError", ] diff --git a/src/stcal/resample/resample.py b/src/stcal/resample/resample.py index fa25fef2..8c7930f1 100644 --- a/src/stcal/resample/resample.py +++ b/src/stcal/resample/resample.py @@ -16,7 +16,7 @@ from stcal.resample.utils import ( - compute_wcs_pixel_area, + compute_mean_pixel_area, get_tmeasure, resample_range, ) @@ -26,9 +26,7 @@ log.setLevel(logging.DEBUG) __all__ = [ - "compute_wcs_pixel_area" "Resample", - "resampled_wcs_from_models", "UnsupportedWCSError", ] @@ -40,20 +38,25 @@ class UnsupportedWCSError(RuntimeError): class Resample: - """ - This is the controlling routine for the resampling process. - - Notes - ----- - This routine performs the following operations:: - - 1. Extracts parameter settings from input model, such as pixfrac, - weight type, exposure time (if relevant), and kernel, and merges - them with any user-provided values. - 2. Creates output WCS based on input images and define mapping function - between all input arrays and the output array. - 3. 
Updates output data model with output arrays from drizzle, including - a record of metadata from all input models. + """ Base class for resampling images. + + The main purpose of this class is to resample and add input images + (data, variance array) to an output image defined by an output WCS. + + In particular, this class performs the following operations: + + 1. Sets up output arrays based on arguments used at initialization. + 2. Based on information about the input images and user arguments, computes + scale factors needed to obtain correctly convert resampled counts to + fluxes. + 3. For each input image computes coordinate transformations (``pixmap``) + from coordinate system of the input image to the coordinate system of + the output image. + 4. For each input image computes weight image. + 5. Calls :py:class:`~drizzle.resample.Drizzle` methods to resample and + combine input images and their variance/error arrays. + 6. Keeps track of total exposure time and other time-related quantities. + """ resample_suffix = 'i2d' resample_file_ext = '.fits' @@ -91,7 +94,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", dimension, so the flux is confined to a quarter of the pixel area when the square kernel is used. - kernel: {"square", "gaussian", "point", "turbo", "lanczos2", "lanczos3"}, optional + kernel : {"square", "gaussian", "point", "turbo", "lanczos2", "lanczos3"}, optional The name of the kernel used to combine the input. The choice of kernel controls the distribution of flux over the kernel. The square kernel is the default. @@ -100,7 +103,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", The "gaussian" and "lanczos2/3" kernels **DO NOT** conserve flux. - fillval: float, None, str, optional + fillval : float, None, str, optional The value of output pixels that did not have contributions from input images' pixels. 
When ``fillval`` is either `None` or ``"INDEF"`` and ``out_img`` is provided, the values of ``out_img`` @@ -111,7 +114,7 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", pixels with no contributions from input images will be set to this ``fillval`` value. - weight_type : {"exptime", "ivm"}, optional + weight_type : {"ivm", "exptime"}, optional The weighting type for adding models' data. For ``weight_type="ivm"`` (the default), the weighting will be determined per-pixel using the inverse of the read noise @@ -168,12 +171,12 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", use a value of ``~4+8``, or ``~4,8``. A string value of ``~0`` would be equivalent to a setting of ``None``. - | Default value (0) will make *all* pixels with non-zero DQ + Default value (0) will make *all* pixels with non-zero DQ values be considered "bad" pixels, and the corresponding data pixels will be assigned zero weight and thus these pixels will not contribute to the output resampled data array. - | Set `good_bits` to `None` to turn off the use of model's DQ + Set `good_bits` to `None` to turn off the use of model's DQ array. For more details, see documentation for @@ -301,7 +304,9 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", if self._output_pixel_scale is None: self._output_pixel_scale = 3600.0 * np.rad2deg( - math.sqrt(compute_wcs_pixel_area(self._output_wcs)) + math.sqrt( + self.get_output_model_pixel_area({"wcs": self._output_wcs}) + ) ) log.info( "Computed output pixel scale: " @@ -336,6 +341,67 @@ def __init__(self, n_input_models=None, pixfrac=1.0, kernel="square", self.reset_arrays(reset_output=False, n_input_models=n_input_models) + def get_input_model_pixel_area(self, model): + """ + Computes or retrieves pixel area of an input model. Currently, + this is the average pixel area of input model's pixels within either + the bounding box (if available) or the entire data array. 
+ + This value is used to compute a scale factor that will be applied + to input image data. This scale factor takes into account the + difference in the definition of the pixel area reported in model's + ``meta`` and the pixel area at the location used to construct + output WCS from the WCS of input models using ``pixel_scale_ratio``. + + Intensity scale factor is computed elsewhere as the ratio of the value + of the pixel area in the meta to the area returned by this function. + + Subclasses can override this method to return the most appropriate + pixel area value. + + Parameters + ---------- + + model : dict, None + A dictionary containing data arrays and other meta attributes + and values of actual models used by pipelines. In particular, it + must have a keyword "wcs" and a WCS associated with it. + + Returns + ------- + pix_area : float + Pixel area in steradians. + + """ + pixel_area = compute_mean_pixel_area( + model["wcs"], + shape=model["data"].shape + ) + return pixel_area + + def get_output_model_pixel_area(self, model): + """ + Computes or retrieves pixel area of the output model. Currently, + this is the average pixel area of the model's pixels within either + the bounding box (if available) or the entire data array. + + Parameters + ---------- + + model : dict, None + A dictionary containing data arrays and other meta attributes + and values of actual models used by pipelines. In particular, it + must have a keyword "wcs" and a WCS associated with it. + + Returns + ------- + pix_area : float + Pixel area in steradians. + + """ + pixel_area = compute_mean_pixel_area(model["wcs"]) + return pixel_area + @classmethod def output_model_attributes(cls, accumulate, enable_ctx, enable_var, compute_err): @@ -374,6 +440,13 @@ def output_model_attributes(cls, accumulate, enable_ctx, enable_var, At this time, output error array is not equivalent to error propagation results. 
+ Returns + ------- + + attributes : set + A set of attributes that an output model must have when it + is provided as an input to `Resample.__init__` initializer. + """ # always required: attributes = { @@ -422,7 +495,7 @@ def output_model_attributes(cls, accumulate, enable_ctx, enable_var, def check_output_wcs(self, output_wcs, estimate_output_shape=True): """ Check that provided WCS has expected properties and that its - ``array_shape`` property is defined. + ``array_shape`` property is defined. May modify ``output_wcs``. Parameters ---------- @@ -430,8 +503,12 @@ def check_output_wcs(self, output_wcs, estimate_output_shape=True): A WCS object corresponding to the output (resampled) image. estimate_output_shape : bool, optional - Indicates whether to *estimate* pixel scale of the ``output_wcs`` - from + Indicates whether to *estimate* output image shape of the + ``output_wcs`` from other available attributes such as + ``bounding_box`` when ``output_wcs.array_shape`` is `None`. + If ``estimate_output_shape`` is `True` and + ``output_wcs.array_shape`` is `None`, upon return + ``output_wcs.array_shape`` will be assigned an estimated value. 
""" naxes = output_wcs.output_frame.naxes @@ -451,9 +528,6 @@ def check_output_wcs(self, output_wcs, estimate_output_shape=True): # make sure array_shape and pixel_shape are set: if output_wcs.array_shape is None and estimate_output_shape: - # if wcs_pars and "output_shape" in wcs_pars: - # output_wcs.array_shape = wcs_pars["output_shape"] - # else: if output_wcs.bounding_box: halfpix = 0.5 + sys.float_info.epsilon output_wcs.array_shape = ( @@ -473,10 +547,33 @@ def check_output_wcs(self, output_wcs, estimate_output_shape=True): def validate_output_model(self, output_model, accumulate, enable_ctx, enable_var): """ Checks that ``output_model`` dictionary has all the required - keywords that the code would expect it to have based on the values + keywords that the code expects it to have based on the values of ``accumulate``, ``enable_ctx``, ``enable_var``. It will raise `ValueError` if `output_model` is missing required keywords/values. + Parameters + ---------- + + output_model : dict + A dictionary representing data and meta values from a data model. + + accumulate : bool + Indicates whether resampled models should be added to the + provided ``output_model`` data or if new arrays should be + created. + + enable_ctx : bool + Indicates whether to create a context image. If ``disable_ctx`` + is set to `True`, parameters ``out_ctx``, ``begin_ctx_id``, and + ``max_ctx_id`` will be ignored. + + enable_var : bool + Indicates whether to resample variance arrays. + + compute_err : {"from_var", "driz_err"}, None + A string indicating how error array for the resampled image should + be computed. See `Resample.__init__` for more details. + """ if output_model is None: if accumulate: @@ -526,6 +623,13 @@ def validate_output_model(self, output_model, accumulate, def create_output_model(self): """ Create a new "output model": a dictionary of data and meta fields. + + Returns + ------- + + output_model : dict + A dictionary of data model attributes and values. 
+ """ assert self._output_wcs is not None assert np.array_equiv( @@ -576,12 +680,6 @@ def create_output_model(self): "var_rnoise": None, "var_flat": None, "var_poisson": None, - # TODO: if we want to support adding more data to - # existing output models, we need to also store weights - # for variance arrays: - # var_rnoise_weight - # var_flat_weight - # var_poisson_weight } ) @@ -592,26 +690,35 @@ def create_output_model(self): @property def output_model(self): + """ Output (resampled) model. """ return self._output_model @property def output_array_shape(self): + """ Shape of the output model arrays. """ return self._output_array_shape @property def output_wcs(self): + """ WCS of the output (resampled) model. """ return self._output_wcs @property def pixel_scale_ratio(self): + """ Get the ratio of the output pixel scale to the input pixel scale. + """ return self._pixel_scale_ratio @property def output_pixel_scale(self): + """ Get pixel scale of the output model in arcsec. """ return self._output_pixel_scale # in arcsec @property def group_ids(self): + """ Get a list of all group IDs of models resampled and added to the + output model. + """ return self._group_ids @property @@ -626,12 +733,15 @@ def enable_var(self): @property def compute_err(self): - """ Indicates whether error array is computed and how it is computed. """ + """ Indicates whether error array is computed and how it is computed. + """ return self._compute_err @property def is_in_accumulate_mode(self): - """ Indicates whether resample is continuing adding to previous co-adds. """ + """ Indicates whether resample is continuing adding to previous + co-adds. + """ return self._accumulate def _get_intensity_scale(self, model): @@ -657,13 +767,13 @@ def _get_intensity_scale(self, model): The scale to apply to the input data before drizzling. 
""" - input_pixflux_area = model["pixelarea_steradians"] + photom_pixel_area = model["pixelarea_steradians"] wcs = model["wcs"] - if input_pixflux_area: + if photom_pixel_area: if 'SPECTRAL' in wcs.output_frame.axes_type: # Use the nominal area as is - input_pixel_area = input_pixflux_area + input_pixel_area = photom_pixel_area # If input image is in flux density units, correct the # flux for the user-specified change to the spatial dimension @@ -672,10 +782,8 @@ def _get_intensity_scale(self, model): else: iscale = 1.0 else: - input_pixel_area = compute_wcs_pixel_area( - wcs, - shape=model["data"].shape - ) + input_pixel_area = self.get_input_model_pixel_area(model) + if input_pixel_area is None: model_name = model["filename"] if not model_name: @@ -700,7 +808,7 @@ def _get_intensity_scale(self, model): self._output_model["pixel_scale_ratio"] is None): self._output_model["pixel_scale_ratio"] = self._pixel_scale_ratio - iscale = math.sqrt(input_pixflux_area / input_pixel_area) + iscale = math.sqrt(photom_pixel_area / input_pixel_area) else: iscale = 1.0 @@ -709,6 +817,7 @@ def _get_intensity_scale(self, model): @property def finalized(self): + """ Indicates whether the output model was "finalized". """ return self._finalized def reset_arrays(self, reset_output=True, n_input_models=None): @@ -848,7 +957,7 @@ def add_model(self, model): before, the "pointings" value of the output model is incremented and the "group_id" attribute is updated. Also, time counters are updated with new values from the input ``model`` by calling - :py:meth:`~Resample.update_time`. + :py:meth:`~Resample.update_time` . 
Parameters ---------- @@ -914,9 +1023,9 @@ def add_model(self, model): 'pixmap': pixmap, 'scale': iscale, 'weight_map': weight, - 'wht_scale': 1.0, # hard-coded for JWST count-rate data + 'wht_scale': 1.0, 'pixfrac': self.pixfrac, - 'in_units': 'cps', # TODO: get units from data model + 'in_units': 'cps', 'xmin': xmin, 'xmax': xmax, 'ymin': ymin, @@ -1183,6 +1292,21 @@ def finalize_resample_variance(self, output_model, free_memory=True): """ Compute variance for the resampled image from running sums and weights. Free memory (when ``free_memory=True``) that holds these running sums and weights arrays. + + output_model : dict, None + A dictionary containing data arrays and other attributes that + will be used to add new models to. Use + :py:meth:`Resample.output_model_attributes` to get the list of + keywords that must be present. When ``accumulate`` is `False`, + only the WCS object of the model will be used. When ``accumulate`` + is `True`, new models will be added to the existing data in the + ``output_model``. + + free_memory : bool, optional + Indicates whether to free temporary arrays (i.e., weight arrays) + that are no longer needed. If this is `True` it will not be + possible to continue adding new models to the output model. + """ # Divide by the total weights, squared, and set in the output model. # Zero weight and missing values are NaN in the output.
@@ -1191,24 +1315,24 @@ def finalize_resample_variance(self, output_model, free_memory=True): warnings.filterwarnings("ignore", "divide by zero*", RuntimeWarning) output_variance = ( - self._var_rnoise_wsum / self._var_rnoise_weight / - self._var_rnoise_weight + self._var_rnoise_wsum / (self._var_rnoise_weight * + self._var_rnoise_weight) ).astype( dtype=self.output_array_types["var_rnoise"] ) output_model["var_rnoise"] = output_variance output_variance = ( - self._var_poisson_wsum / self._var_poisson_weight / - self._var_poisson_weight + self._var_poisson_wsum / (self._var_poisson_weight * + self._var_poisson_weight) ).astype( dtype=self.output_array_types["var_poisson"] ) output_model["var_poisson"] = output_variance output_variance = ( - self._var_flat_wsum / self._var_flat_weight / - self._var_flat_weight + self._var_flat_wsum / (self._var_flat_weight * + self._var_flat_weight) ).astype( dtype=self.output_array_types["var_flat"] ) @@ -1231,10 +1355,11 @@ def _resample_one_variance_array(self, name, model, iscale, ymax=None): """Resample one variance image from an input model. - The error image is passed to drizzle instead of the variance in order to - better match kernel overlap and user weights to the data during the + The error image is passed to drizzle instead of the variance in order + to better match kernel overlap and user weights to the data during the pixel averaging process. The drizzled error image is squared before returning. 
+ """ variance = model.get(name) if variance is None or variance.size == 0: @@ -1270,9 +1395,9 @@ def _resample_one_variance_array(self, name, model, iscale, pixmap=pixmap, scale=iscale, weight_map=weight_map, - wht_scale=1.0, # hard-coded for JWST count-rate data + wht_scale=1.0, pixfrac=self.pixfrac, - in_units="cps", # TODO: get units from data model + in_units="cps", xmin=xmin, xmax=xmax, ymin=ymin, @@ -1282,15 +1407,20 @@ def _resample_one_variance_array(self, name, model, iscale, return driz.out_img ** 2 def build_driz_weight(self, model, weight_type=None, good_bits=None): - """ Create a weight map for use by drizzle. + """ Create a weight map that is used for weighting input images when + they are co-added to the output model. Parameters ---------- + model : dict + Input model: a dictionary of relevant keywords and values. + weight_type : {"exptime", "ivm"}, optional - The weighting type for adding models' data. For ``weight_type="ivm"`` - (the default), the weighting will be determined per-pixel using - the inverse of the read noise (VAR_RNOISE) array stored in each - input image. If the ``VAR_RNOISE`` array does not exist, + The weighting type for adding models' data. For + ``weight_type="ivm"`` (the default), the weighting will be + determined per-pixel using the inverse of the read noise + (VAR_RNOISE) array stored in each input image. If the + ``VAR_RNOISE`` array does not exist, the variance is set to 1 for all pixels (i.e., equal weighting). If ``weight_type="exptime"``, the weight will be set equal to the measurement time (``TMEASURE``) when available and to @@ -1302,7 +1432,7 @@ def build_driz_weight(self, model, weight_type=None, good_bits=None): bit flags or mnemonic flag names that indicate what bits in models' DQ bitfield array should be *ignored* (i.e., zeroed). - See `Resample` for more information + See `Resample` for more information. 
""" data = model["data"] @@ -1429,8 +1559,10 @@ def init_time_counters(self): self._measurement_time_success = [] def update_time(self, model): - """ A method called by the `~Resample.add_model` method to process each - image's time attributes *only when ``model`` has a new group ID. + """ + A method called by the :py:meth:`~Resample.add_model` method to + process each image's time attributes *only* when ``model`` has a new + group ID. """ if model["group_id"] in self._group_ids: @@ -1497,6 +1629,10 @@ def _check_var_array(self, model, array_name): def _get_model_name(model): + """ Return the value of ``"filename"`` from the model dictionary or + ``"Unknown"`` when ``"filename"`` is either not present or it is `None`. + + """ model_name = model.get("filename") if model_name is None or not model_name.strip(): model_name = "Unknown" diff --git a/src/stcal/resample/utils.py b/src/stcal/resample/utils.py index 6968a817..35498c23 100644 --- a/src/stcal/resample/utils.py +++ b/src/stcal/resample/utils.py @@ -10,7 +10,7 @@ __all__ = [ "build_mask", "bytes2human", - "compute_wcs_pixel_area", + "compute_mean_pixel_area", "get_tmeasure", "is_imaging_wcs", "load_custom_wcs", @@ -52,7 +52,7 @@ def load_custom_wcs(asdf_wcs_file, output_shape=None): Returns ------- - wcs : WCS + wcs : ~gwcs.wcs.WCS The output WCS to resample into. """ @@ -121,7 +121,7 @@ def get_tmeasure(model): def bytes2human(n): """Convert bytes to human-readable format - Taken from the `psutil` library which references + Taken from the ``psutil`` library which references http://code.activestate.com/recipes/578019 Parameters @@ -161,8 +161,36 @@ def is_imaging_wcs(wcs): return imaging -def compute_wcs_pixel_area(wcs, shape=None): - """ Computes pixel area in steradians. 
+def compute_mean_pixel_area(wcs, shape=None): + """ Computes the average pixel area (in steradians) based on input WCS + using pixels within either the bounding box (if available) or the entire + data array as defined either by ``wcs.array_shape`` or the ``shape`` + argument. + + Parameters + ---------- + shape : tuple, optional + Shape of the region over which average pixel area will be computed. + When not provided, pixel average will be estimated over a region + defined by ``wcs.array_shape``. + + Returns + ------- + pix_area : float + Pixel area in steradians. + + Notes + ----- + + This function takes the outline of the region in which the average is + computed (a rectangle defined by either the bounding box or + ``wcs.array_shape`` or the ``shape``) and projects it to world coordinates. + It then uses ``spherical_geometry`` to compute the area of the polygon + defined by this outline on the sky. In order to minimize errors due to + distortions in the ``wcs``, the code defines the outline using pixels + spaced no more than 15 pixels apart along the border of the rectangle + in which the average is computed. 
+ """ if (shape := (shape or wcs.array_shape)) is None: raise ValueError( @@ -182,15 +210,16 @@ def compute_wcs_pixel_area(wcs, shape=None): else: ((xmin, xmax), (ymin, ymax)) = wcs.bounding_box - xmin = max(0, int(xmin + 0.5)) - xmax = min(nx - 1, int(xmax - 0.5)) - ymin = max(0, int(ymin + 0.5)) - ymax = min(ny - 1, int(ymax - 0.5)) if xmin > xmax: (xmin, xmax) = (xmax, xmin) if ymin > ymax: (ymin, ymax) = (ymax, ymin) + xmin = max(0, int(xmin + 0.5)) + xmax = min(nx - 1, int(xmax - 0.5)) + ymin = max(0, int(ymin + 0.5)) + ymax = min(ny - 1, int(ymax - 0.5)) + k = 0 dxy = [1, -1, -1, 1] @@ -249,11 +278,74 @@ def compute_wcs_pixel_area(wcs, shape=None): def _get_boundary_points(xmin, xmax, ymin, ymax, dx=None, dy=None, shrink=0): # noqa: E741 """ - xmin, xmax, ymin, ymax - integer coordinates of pixel boundaries - step - distance between points along an edge - shrink - number of pixels by which to reduce `shape` + Creates a list of ``x`` and ``y`` coordinates of points along the perimeter + of the rectangle defined by ``xmin``, ``xmax``, ``ymin``, ``ymax``, and + ``shrink`` in counter-clockwise order. + + Parameters + ---------- + + xmin : int + X-coordinate of the left edge of a rectangle. + + xmax : int + X-coordinate of the right edge of a rectangle. + + ymin : int + Y-coordinate of the bottom edge of a rectangle. + + ymax : int + Y-coordinate of the top edge of a rectangle. + + dx : int, float, None, optional + Desired spacing between adjacent points along horizontal edges of + the rectangle. + + dy : int, float, None, optional + Desired spacing between adjacent points along vertical edges of + the rectangle. + + shrink : int, optional + Amount to be applied to input ``xmin``, ``xmax``, ``ymin``, ``ymax`` + to reduce the rectangle size. + + Returns + ------- + + x : numpy.ndarray + An array of X-coordinates of points along the perimeter + of the rectangle defined by ``xmin``, ``xmax``, ``ymin``, ``ymax``, and + ``shrink`` in counter-clockwise order. 
+ + y : numpy.ndarray + An array of Y-coordinates of points along the perimeter + of the rectangle defined by ``xmin``, ``xmax``, ``ymin``, ``ymax``, and + ``shrink`` in counter-clockwise order. + + area : float + Area in units of pixels of the region defined by ``xmin``, ``xmax``, + ``ymin``, ``ymax``, and ``shrink``. + + center : tuple + A tuple of pixel coordinates at the center of the rectangle defined + by ``xmin``, ``xmax``, ``ymin``, ``ymax``. + + bottom : slice + A `slice` object that allows selection of pixels from ``x`` and ``y`` + arrays along the bottom edge of the rectangle. + + right : slice + A `slice` object that allows selection of pixels from ``x`` and ``y`` + arrays along the right edge of the rectangle. + + top : slice + A `slice` object that allows selection of pixels from ``x`` and ``y`` + arrays along the top edge of the rectangle. + + left : slice + A `slice` object that allows selection of pixels from ``x`` and ``y`` + arrays along the left edge of the rectangle. 
- Returns a list of points and the area of the rectangle """ nx = xmax - xmin + 1 ny = ymax - ymin + 1 @@ -278,21 +370,21 @@ def _get_boundary_points(xmin, xmax, ymin, ymax, dx=None, dy=None, x = np.empty(size) y = np.empty(size) - b = np.s_[0:sx] # bottom edge - r = np.s_[sx:sx + sy] # right edge - t = np.s_[sx + sy:2 * sx + sy] # top edge - l = np.s_[2 * sx + sy:2 * sx + 2 * sy] # noqa: E741 left edge + bottom = np.s_[0:sx] # bottom edge + right = np.s_[sx:sx + sy] # right edge + top = np.s_[sx + sy:2 * sx + sy] # top edge + left = np.s_[2 * sx + sy:2 * sx + 2 * sy] # noqa: E741 left edge - x[b] = np.linspace(xmin, xmax, sx, False) - y[b] = ymin - x[r] = xmax - y[r] = np.linspace(ymin, ymax, sy, False) - x[t] = np.linspace(xmax, xmin, sx, False) - y[t] = ymax - x[l] = xmin - y[l] = np.linspace(ymax, ymin, sy, False) + x[bottom] = np.linspace(xmin, xmax, sx, False) + y[bottom] = ymin + x[right] = xmax + y[right] = np.linspace(ymin, ymax, sy, False) + x[top] = np.linspace(xmax, xmin, sx, False) + y[top] = ymax + x[left] = xmin + y[left] = np.linspace(ymax, ymin, sy, False) area = (xmax - xmin) * (ymax - ymin) center = (0.5 * (xmin + xmax), 0.5 * (ymin + ymax)) - return x, y, area, center, b, r, t, l + return x, y, area, center, bottom, right, top, left From fd714d2b196596e0225505b9c28ae4442c989c24 Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Sun, 15 Dec 2024 15:51:20 -0500 Subject: [PATCH 12/13] Fix type warning --- src/stcal/resample/utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/stcal/resample/utils.py b/src/stcal/resample/utils.py index 35498c23..6a13d505 100644 --- a/src/stcal/resample/utils.py +++ b/src/stcal/resample/utils.py @@ -4,7 +4,7 @@ import asdf import numpy as np from astropy.nddata.bitmask import interpret_bit_flags -from spherical_geometry.polygon import SphericalPolygon +from spherical_geometry.polygon import SphericalPolygon # type: ignore[import-untyped] __all__ = [ From 6743256fea70a6737079cddd3d5885c495d33ae0 
Mon Sep 17 00:00:00 2001 From: Mihai Cara Date: Mon, 16 Dec 2024 01:54:50 -0500 Subject: [PATCH 13/13] Use updated drizzle to deal with gwcs bbox --- pyproject.toml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/pyproject.toml b/pyproject.toml index 42d00d37..1cd2273d 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -14,7 +14,8 @@ classifiers = [ ] dependencies = [ "astropy >=5.0.4", - "drizzle>=2.0.0", + # "drizzle>=2.0.0", + "drizzle @ git+https://github.com/mcara/drizzle.git@disable-bbox", "scipy >=1.7.2", "scikit-image>=0.19", "numpy >=1.21.2",