Source code for PyFHD.gridding.visibility_degrid

import numpy as np
from numpy.typing import NDArray
import warnings
import h5py
from PyFHD.gridding.gridding_utils import (
    baseline_grid_locations,
    interpolate_kernel,
    grid_beam_per_baseline,
)
from PyFHD.pyfhd_tools.pyfhd_utils import (
    l_m_n,
    rebin,
    weight_invert,
    histogram,
    deriv_coefficients,
)



[docs]
def visibility_degrid(
    image_uv: NDArray[np.complex128],
    vis_weights: NDArray[np.float64],
    obs: dict,
    psf: dict | h5py.File,
    params: dict,
    polarization: int = 0,
    fill_model_visibilities: bool = False,
    vis_input: NDArray[np.complex128] | None = None,
    spectral_model_uv_arr: NDArray[np.float64] | None = None,
    beam_per_baseline: bool = False,
    uv_grid_phase_only: bool = True,
    conserve_memory: bool = False,
    memory_threshold: float | int = 1e8,
):
    """
    Generate visibilities from a 2D hyperresolved {u,v} plane using the Fourier transform of the beam sensitivity as the
    kernel (or integration function). The input {u,v} plane is the slant-orthographic projection of the sky when Fourier
    transformed with no instrumental effects. The integration kernel adds the instrumental effects to the visiblities.

    Degridding is performed only on simulated model {u,v} planes. Simulated sources towards the edge of the sky image will be
    distorted (smeared) due to the projection of the 2D {u,v} plane.

    The kernel is a extremely hyperresolved look-up table, which is (optionally) interpolated even further.
    Since the {u,v} pixels are discrete and the baseline locations are not, the kernel will integrate the pixels
    in a unique way for each individual baseline. This code is optimized to provide the best estimate for each
    baseline whilst maintaining speed.

    Parameters
    ----------
    image_uv : NDArray[np.complex128]
        A simulated {u,v} plane with no instrumental effects
    vis_weight : NDArray[np.float64]
        Weights (flags) of the visibilities
    obs : dict
        Observation metadata dictionary
    psf : dict | h5py.File
        Beam metadata dictionary
    params : dict
        Visibility metadata dictionary
    polarization : int
        Index of the current polarization, by default 0
    fill_model_visibilities : bool, optional
        Create all model visibilities disregarding flags, by default False
    vis_input : NDArray[np.complex128] | None, optional
        Extra model visibilities to add to the degridded products, by default None
    spectral_model_uv_arr : NDArray[np.float64] | None, optional
        Additional {u,v} planes to degrid for complicated source spectral dependencies, by default None
    beam_per_baseline : bool, optional
        Generate beams with corrective phases given the baseline location, by default False
    uv_grid_phase_only : bool, optional
        Generate beams with only {u,v} corrective phases, disregarding w phases, by default True
    conserve_memory : bool, optional
        Reduce memory load by running loops, by default False

    Returns
    -------
    visibility_array : NDArray[np.complex128]
        A simulated visibility array from degridding the input {u,v} plane with the instrumental kernel
    obs : dict
        Updated observation metadata dictionary
    """

    complex_flag = psf["complex_flag"][0]
    n_spectral = obs["degrid_spectral_terms"][0]
    interp_flag = psf["interpolate_kernel"][0]
    if conserve_memory:
        # memory threshold is in bytes
        if memory_threshold < 1e6:
            memory_threshold = 1e8

    # If both beam and interp_flag leave a warning, prioritise beam_per_baseline
    if beam_per_baseline and interp_flag:
        warnings.warn(
            "Cannot have beam per baseline and interpolation at the same time, turning off interpolation"
        )
        interp_flag = False

    # For each unflagged baseline, get the minimum contributing pixel number for gridding
    # and the 2D derivatives for bilinear interpolation
    baselines_dict = baseline_grid_locations(
        obs,
        psf,
        params,
        vis_weights,
        fill_model_visibilities=fill_model_visibilities,
        interp_flag=interp_flag,
    )

    # Extract data from the data structures
    bin_n = baselines_dict["bin_n"]
    bin_i = baselines_dict["bin_i"]
    n_bin_use = baselines_dict["n_bin_use"]
    ri = baselines_dict["ri"]
    xmin = baselines_dict["xmin"]
    ymin = baselines_dict["ymin"]
    x_offset = baselines_dict["x_offset"]
    y_offset = baselines_dict["y_offset"]
    if interp_flag:
        dx0dy0_arr = baselines_dict["dx0dy0_arr"]
        dx0dy1_arr = baselines_dict["dx0dy1_arr"]
        dx1dy0_arr = baselines_dict["dx1dy0_arr"]
        dx1dy1_arr = baselines_dict["dx1dy1_arr"]
    dimension = obs["dimension"][0]
    kbinsize = obs["kpix"][0]
    freq_bin_i = obs["baseline_info"][0]["fbin_i"][0]
    frequency_array = obs["baseline_info"][0]["freq"][0]
    freq_delta = (frequency_array - obs["freq_center"][0]) / obs["freq_center"][0]
    psf_dim = psf["dim"][0]
    psf_resolution = psf["resolution"][0]
    psf_dim3 = int(psf_dim**2)
    n_baselines = obs["n_baselines"][0]
    n_samples = obs["n_time"][0]
    n_freq_use = frequency_array.size
    n_freq = obs["n_freq"][0]
    group_arr = np.squeeze(psf["id"][0][:, freq_bin_i, polarization])
    beam_arr = psf["beam_ptr"][0]

    if beam_per_baseline:
        uu = params["uu"][0]
        vv = params["vv"][0]
        ww = params["ww"][0]
        psf_image_dim = psf["image_info"][0]["psf_image_dim"][0]
        psf_intermediate_res = np.min(
            np.ceil(np.sqrt(psf_resolution) / 2) * 2, psf_resolution
        )
        image_bot = -(psf_dim / 2) * psf_intermediate_res + psf_image_dim / 2
        image_top = (
            (psf_dim * psf_resolution - 1)
            - (psf_dim / 2) * psf_intermediate_res
            + psf_image_dim / 2
        )

        l_mode, m_mode, n_tracked = l_m_n(obs, psf)

        # w-terms have not been tested, thus they've been turned off for now
        if uv_grid_phase_only:
            n_tracked = np.zeros_like(n_tracked)

        beam_int = np.zeros(n_freq)
        beam2_int = np.zeros(n_freq)
        n_grp_use = np.zeros(n_freq)
        primary_beam_area = np.zeros(n_freq)
        primary_beam_sq_area = np.zeros(n_freq)

        x = (np.arange(dimension) - dimension / 2) * kbinsize
        y = x.copy()

    conj_i = np.where(params["vv"][0] > 0)
    if conj_i[0].size > 0:
        if beam_per_baseline:
            uu[conj_i] = -uu[conj_i]
            vv[conj_i] = -vv[conj_i]
            ww[conj_i] = -ww[conj_i]

    # Create the correct size visibility array
    vis_dimension = n_baselines * n_samples
    visibility_array = np.zeros((vis_dimension, n_freq), dtype=np.cdouble)

    ind_ref = np.arange(max(bin_n))

    if complex_flag:
        arr_type = np.cdouble
    else:
        arr_type = np.double

    if n_spectral:
        prefactor = np.empty(n_spectral, dtype=object)
        for s_i in range(n_spectral):
            prefactor[s_i] = deriv_coefficients(s_i + 1, divide_factorial=True)
        box_arr_ptr = np.empty(n_spectral, dtype=object)

    for bi in range(n_bin_use):
        vis_n = bin_n[bin_i[bi]]
        """
            Python is not inclusive of end of loop 
            while IDL is, as such n_bin_use - 1 does not do
            the last index properly on Python, as such when we
            have reached the last index we need to change the 
            indexation of ri to include from that point to the end.
        """
        if bi == n_bin_use - 1:
            inds = ri[ri[bin_i[bi]] :]
        else:
            inds = ri[ri[bin_i[bi]] : ri[bin_i[bi + 1]]]

        # if constraining memory usage, then est number of loops needed
        if conserve_memory:
            required_bytes = 8 * vis_n * psf_dim3
            mem_iter = int(np.ceil(required_bytes / memory_threshold))
            if mem_iter > 1:
                vis_n_full = vis_n
                inds_full = inds
                vis_n_per_iter = int(np.ceil(vis_n_full / mem_iter))
        else:
            mem_iter = 1
        # loop over chunks of visibilities to grid to conserve memory
        for mem_i in range(mem_iter):
            if mem_iter > 1:
                # calculate the indices of this visibility chunk if split into multiple chunks
                if vis_n_per_iter * (mem_i + 1) > vis_n_full:
                    max_ind = vis_n_full
                else:
                    max_ind = vis_n_per_iter * (mem_i + 1)
                inds = inds_full[vis_n_per_iter * mem_i : max_ind]
                vis_n = max_ind - vis_n_per_iter * mem_i

            x_off = x_offset.flat[inds].astype(np.int64)
            y_off = y_offset.flat[inds].astype(np.int64)
            # xmin and ymin should be all the same
            xmin_use = xmin.flat[inds[0]]
            ymin_use = ymin.flat[inds[0]]
            freq_i = inds % n_freq_use
            fbin = freq_bin_i[freq_i]
            baseline_inds = (inds / n_freq_use).astype(int) % n_baselines

            box_matrix = np.zeros((vis_n, psf_dim3), dtype=arr_type)
            box_arr = image_uv[
                ymin_use : ymin_use + psf_dim, xmin_use : xmin_use + psf_dim
            ].flatten()

            if interp_flag:
                dx0dy0 = dx0dy0_arr.flat[inds]
                dx0dy1 = dx0dy1_arr.flat[inds]
                dx1dy0 = dx1dy0_arr.flat[inds]
                dx1dy1 = dx1dy1_arr.flat[inds]
                ind_remap_flag = False
                bt_index = inds / n_freq_use
                for ii in range(vis_n):
                    kernel = interpolate_kernel(
                        beam_arr[baseline_inds[ii], fbin[ii], polarization],
                        x_off[ii],
                        y_off[ii],
                        dx0dy0[ii],
                        dx1dy0[ii],
                        dx0dy1[ii],
                        dx1dy1[ii],
                    )
                    box_matrix.flat[psf_dim3 * ii : psf_dim3 * ii + kernel.size] = (
                        kernel
                    )
            else:
                group_id = group_arr[inds]
                group_max = np.max(group_id) + 1
                xyf_i = (
                    x_off + y_off * psf_resolution + fbin * psf_resolution**2
                ) * group_max + group_id
                xyf_si = np.sort(xyf_i)
                xyf_i = xyf_i[xyf_si]
                xyf_ui = np.unique(xyf_i)
                n_xyf_bin = xyf_ui.size

                # There might be a better selection criteria to determine which is more efficient
                if vis_n > np.ceil(1.1 * n_xyf_bin) and not beam_per_baseline:
                    ind_remap_flag = True
                    inds = inds[xyf_si]
                    inds_use = xyf_si[xyf_ui]
                    freq_i = freq_i[inds_use]
                    x_off = x_off[inds_use]
                    y_off = y_off[inds_use]
                    fbin = fbin[inds_use]
                    baseline_inds = baseline_inds[inds]

                    if n_xyf_bin == 1:
                        ind_remap = np.arange(vis_n, dtype=int)
                    else:
                        hist_inds_u, _, ri_xyf = histogram(xyf_ui, bin_size=1, min=0)
                        ind_remap = ind_ref[ri_xyf[0 : hist_inds_u.size] - ri_xyf[0]]

                    vis_n = n_xyf_bin
                else:
                    ind_remap_flag = False
                    bt_index = inds / n_freq_use

                if beam_per_baseline:
                    box_matrix = grid_beam_per_baseline(
                        psf,
                        uu,
                        vv,
                        ww,
                        l_mode,
                        m_mode,
                        n_tracked,
                        frequency_array,
                        x,
                        y,
                        xmin_use,
                        ymin_use,
                        freq_i,
                        bt_index,
                        polarization,
                        fbin,
                        image_bot,
                        image_top,
                        psf_dim3,
                        box_matrix,
                        vis_n,
                        beam_int=beam_int,
                        beam2_int=beam2_int,
                        n_grp_use=n_grp_use,
                        degrid_flag=True,
                        obs=obs,
                        params=params,
                        weights=vis_weights,
                    )
                else:
                    for ii in range(vis_n):
                        # more efficient array subscript notation
                        box_matrix[psf_dim3 * ii] = beam_arr[
                            baseline_inds[ii], fbin[ii], polarization
                        ][y_off[ii], x_off[ii]]

            if n_spectral:
                vis_box = np.dot(box_arr, np.transpose(box_matrix))
                freq_term_arr = rebin(
                    np.transpose(freq_delta[freq_i]), (vis_n, psf_dim3), sample=True
                )
                for s_i in range(n_spectral):
                    # s_i loop is over terms of the Taylor expansion, starting from the lowest-order term
                    prefactor_use = prefactor[s_i]
                    box_matrix *= freq_term_arr
                    box_arr_ptr[s_i] = spectral_model_uv_arr[s_i][
                        ymin_use : ymin_use + psf_dim - 1,
                        xmin_use : xmin_use + psf_dim - 1,
                    ].flatten()

                    for s_i_i in range(s_i):
                        # s_i_i loop is over powers of the model x alpha^n, n=s_i_i+1
                        box_arr = prefactor_use[s_i_i] * box_arr_ptr[s_i_i]
                        vis_box += np.dot(box_arr, np.transpose(box_matrix))
                del box_arr_ptr
            else:
                vis_box = np.dot(box_arr, np.transpose(box_matrix))
            if ind_remap_flag:
                vis_box = vis_box[ind_remap]
            visibility_array.flat[inds] = vis_box

    if beam_per_baseline:
        # factor of kbinsize^2 is FFT units normalization
        beam2_int *= weight_invert(n_grp_use) / kbinsize**2
        beam_int *= weight_invert(n_grp_use) / kbinsize**2
        primary_beam_area = beam2_int
        primary_beam_area = beam_int
        # Returning obs in this case?
        obs["primary_beam_area"][polarization] = primary_beam_area
        obs["primary_beam_sq_area"][polarization] = primary_beam_sq_area

    del (x_offset, y_offset, xmin, ymin, bin_n)
    if conj_i[0].size > 0:
        visibility_array[conj_i, :] = np.conj(visibility_array[conj_i, :])

    if vis_input is not None:
        visibility_array += vis_input

    if beam_per_baseline:
        return visibility_array, obs
    else:
        return visibility_array