Source code for psfsim.aberration_models

"""Aberration models."""

from importlib.resources import files

import numpy as np
from astropy.io import fits

from .romantrace import RomanRayBundle
from .wfi_data import remove_tiptilt
from .zernike import noll_to_zernike, zernike

# parameters

[docs]
# Scale factor shared by the routines below: exit-pupil coordinates are normalized as
# ``2 * fratio * (u - center)`` and position offsets are converted to tip/tilt terms as
# ``dpos / (4 * fratio)``.
# NOTE(review): presumably the focal ratio (f-number) of the beam -- confirm.
fratio = 8.0




[docs]
def aberration_gradients(use_filter="W", nn=128, subtract_offset=False, mask=False):
    """
    Tabulate the wavefront sensitivity to every surface mode at every field point.

    One ray bundle is traced per row of the packaged ``fpos.dat`` table, and its
    per-mode gradient maps are copied (with a sign flip) into the output table.

    Parameters
    ----------
    use_filter : str, optional
        Which filter to use.
    nn : int, optional
        What size pupil array to use.
    subtract_offset : bool, optional
        Whether to subtract the Z1 mode (which has no effect on the PSF). The offset
        of each mode is its sum over pixels where the pupil map is nonzero, divided by
        the number of such pixels.
    mask : bool, optional
        Whether to null out masked regions (pixels where the pupil map is not above 0.5).

    Returns
    -------
    np.ndarray
        A table of sensitivities of OPD to each surface error mode. The shape is
        (number of field points, `nn`, `nn`, number of basis modes).

        Reminder that this can be huge!

    """

    field_points = np.loadtxt(files("psfsim.data").joinpath("fpos.dat"))
    n_points = np.shape(field_points)[0]

    for ipt in range(n_points):
        bundle = RomanRayBundle(
            field_points[ipt, 0], field_points[ipt, 1], nn, use_filter, hasE=False, errs={"grad": True}
        )

        # The number of basis modes is only known once the first bundle has been traced.
        if ipt == 0:
            n_modes = np.shape(bundle.grad)[-1]
            table = np.zeros((n_points, nn, nn, n_modes))

        if subtract_offset:
            lit = bundle.open != 0
            n_lit = np.sum(lit)
            for imode in range(n_modes):
                offset = np.sum(bundle.grad[:, :, imode] * lit) / n_lit
                bundle.grad[:, :, imode] -= offset

        if mask:
            keep = bundle.open > 0.5
            for imode in range(n_modes):
                bundle.grad[:, :, imode] *= keep

        # Sign flip: we want OPD in the Poppy convention, not path length.
        table[ipt] = -bundle.grad

    return table




[docs]
def aberration_transfer_matrix(use_filter="W", nn=128, n_zernike=22, outdiagnostic=None):
    """
    Computes the transfer matrix from surface distortion modes to Zernikes.

    For every field point in the packaged ``fpos.dat`` table, a ray bundle is traced,
    the pupil-weighted mean is removed from each gradient map and from the design
    wavefront, and both are projected onto the first `n_zernike` Zernike modes by
    solving the normal equations on the (possibly obstructed) pupil.

    Parameters
    ----------
    use_filter : str, optional
        Which filter to use.
    nn : int, optional
        What size pupil array to use. Must be even.
    n_zernike : int, optional
        How many Zernikes to use?
    outdiagnostic : str, optional
        Output FITS file for diagnostics (for debugging only). If given, the masked
        Zernike maps of the first field point are written there.

    Returns
    -------
    transfer : np.ndarray
        The transfer matrix, shape (number of field points, `n_zernike`, number of basis modes).
    s_decomp : np.ndarray
        The decomposition of the ray-traced design wavefront, shape (number of field points, `n_zernike`).
        The return value is in Poppy OPD sign convention (*negative* of the path length difference).

    Raises
    ------
    ValueError
        If `nn` is odd.

    """

    if nn % 2 != 0:
        raise ValueError("nn must be even")

    # first get the field positions
    fpos = np.loadtxt(files("psfsim.data").joinpath("fpos.dat"))
    npos = np.shape(fpos)[0]

    for j in range(npos):
        RB = RomanRayBundle(fpos[j, 0], fpos[j, 1], nn, use_filter, hasE=False, errs={"grad": True})
        if j == 0:
            n = np.shape(RB.grad)[-1]  # get number of basis modes
            transfer = np.zeros((npos, n_zernike, n))
            s_decomp = np.zeros((npos, n_zernike))

        # remove the pupil-weighted mean from every gradient map
        for k in range(n):
            mean = np.sum(RB.grad[:, :, k] * RB.open) / np.sum(RB.open)
            RB.grad[:, :, k] -= mean

        # Design wavefront with its pupil-weighted mean removed. This does not depend on
        # the mode index, so it is computed once per field point rather than inside the
        # loop above (which also left it undefined when there were no modes).
        # The sign flip makes the OPD consistent with the Poppy convention
        # (we're not using Poppy here but it is in such common use across the Roman
        # community that I want to be consistent!!)
        opd = -RB.s + np.sum(RB.s * RB.open) / np.sum(RB.open)

        # now get the center
        # note that there is a sign flip between (x,y) in the entrance pupil plane
        # and (u, v) at the exit
        ctr = np.mean(RB.u[nn // 2 - 1 : nn // 2 + 1, nn // 2 - 1 : nn // 2 + 1, :], axis=(0, 1))
        rho12 = 2.0 * fratio * (RB.u - ctr[None, None, :])
        rho = np.hypot(rho12[:, :, 0], rho12[:, :, 1])
        theta = np.arctan2(-rho12[:, :, 1], -rho12[:, :, 0])
        del rho12

        # and the aberrations
        zmode = np.zeros((nn, nn, n_zernike))
        for q in range(n_zernike):
            _n, _m = noll_to_zernike(q + 1)
            zmode[:, :, q] = zernike(_n, _m, rho, theta, normalized=True)

        # diagnostics, if desired (first field point only)
        if outdiagnostic is not None and j == 0:
            z2 = np.transpose(zmode, axes=(2, 0, 1)) * (RB.open >= 0.5)[None, :, :]
            fits.PrimaryHDU(z2).writeto(outdiagnostic, overwrite=True)
            del z2

        # overlap matrix of the Zernikes --- not zero on an obstructed pupil!
        A = np.zeros((n_zernike, n_zernike))
        B = np.zeros((n_zernike, n))
        c = np.zeros((n_zernike,))
        for za in range(n_zernike):
            # A is symmetric, so only the lower triangle is evaluated and then mirrored
            for zb in range(za + 1):
                A[za, zb] = A[zb, za] = np.sum(zmode[:, :, za] * zmode[:, :, zb] * RB.open)
            for k in range(n):
                # the - sign is to flip from path length to OPD
                B[za, k] = -np.sum(zmode[:, :, za] * RB.grad[:, :, k] * RB.open)
            c[za] = np.sum(opd * zmode[:, :, za] * RB.open)

        # least-squares projection onto the Zernikes via the normal equations
        s_decomp[j, :] = np.linalg.solve(A, c)
        transfer[j, :, :] = np.linalg.solve(A, B)

    return transfer, s_decomp




[docs]
def aberration_transfer_matrix_svd(use_filter="W", nn=128, n_zernike=22):
    """
    Computes the SVD of the transfer matrix from surface distortion modes to Zernikes.

    The per-field-point transfer matrices are stacked along the first axis (field
    point and Zernike index are flattened together) before the decomposition.

    Parameters
    ----------
    use_filter : str, optional
        Which filter to use.
    nn : int, optional
        What size pupil array to use.
    n_zernike : int, optional
        How many Zernikes to use?

    Returns
    -------
    U, S, Vh: np.ndarray
        The SVD of the transfer matrix:

        - `U` has dimension (number of field points * `n_zernike`, nbasis)
        - `S` has length nbasis
        - `Vh` has dimension (nbasis, nbasis)

        The transfer matrix is ``U @ diag(S) @ Vh``.

    Raises
    ------
    ValueError
        If there are more surface modes than stacked Zernike coefficients, so the
        modes cannot all be constrained.

    """

    T, _ = aberration_transfer_matrix(use_filter=use_filter, nn=nn, n_zernike=n_zernike)
    T = T.reshape((-1, np.shape(T)[-1]))
    (m, n) = np.shape(T)
    if m < n:
        # This used to be `assert ValueError(...)`, which is always truthy and never fired.
        raise ValueError("Too many surface modes to constrain with these Zernikes.")
    U, S, Vh = np.linalg.svd(T, full_matrices=False, compute_uv=True)
    return U, S, Vh




[docs]
def extract_basis_coefs(
    infile,
    use_filter,
    nn=128,
    smin=0.01,
    pars_input=None,
    flip_y=True,
    nmin=None,
    nmax=None,
    c=3,
    verbose=True,
    return_coefs=False,
):
    """
    Computes basis coefficients from a Zernike file.

    The input table is compared with the ray-traced design wavefront, and the
    difference is fitted with the surface-mode basis through a truncated
    pseudo-inverse (SVD) of the transfer matrix.

    Parameters
    ----------
    infile : str
        The input Zernike file to read. This should be a ``.csv`` file with one header
        row containing at least the columns ``wavelength``, ``global_x``, ``global_y``
        and ``Z1``, ``Z2``, ... Only rows whose wavelength is within 0.01 of the median
        wavelength are used.
    use_filter : str
        The filter to use (1-character string).
    nn : int, optional
        Grid size to use for the Zernikes.
    smin : float, optional
        The minimum singular value to invert.
    pars_input : np.ndarray, optional
        If provided, take this set of instrument parameters as an initial condition; default is all 0's.
    flip_y : bool, optional
        Whether to flip the Y-axis of the input Zernikes (useful for WFI-local vs FPA coordinates).
    nmin, nmax : int, optional
        Minimum and maximum coefficient indices to fit (otherwise starts from `pars_input`).
    c : int, optional
        Number of Zernike modes to exclude from the fit. This is usually either 3 (default, skip piston
        and tip+tilt) or 1 (skip piston but include tip+tilt).
    verbose : bool, optional
        Whether to talk a lot to the output. The final residual table prints Zernike
        columns up to index 15, so it needs at least 16 Zernike columns in `infile`.
    return_coefs : bool, optional
        If set to True, returns the matrix of coefficients for the difference between the
        astrometric model computed by PSFSim and the table provided by the Project.

    Returns
    -------
    np.ndarray
        If `return_coefs` is False (default), this is
        a 1D array of the inferred basis coefficients.

        If `return_coefs` is True, this is a 2D array of shape (3, 3) for the residual of the FPA
        positions::

            [tabulated - predicted] = coefs[:2, :] @ [predicted] + coefs[-1, :]

        where the 2nd axis has order x, y, focus.

    Raises
    ------
    ValueError
        If more surface modes are requested in the fit than there are Zernike
        coefficients available to constrain them.

    """

    fpos = np.loadtxt(files("psfsim.data").joinpath("fpos.dat"))
    npos = np.shape(fpos)[0]

    # Extract input file and columns
    indata = np.loadtxt(infile, delimiter=",", skiprows=1)
    with open(infile, "r") as f:
        header = f.readline().strip().split(",")
    idx_wl = header.index("wavelength")
    w = indata[:, idx_wl]
    # keep only the rows at the median wavelength; one row per field point is expected
    indata = indata[np.where(np.abs(w - np.median(w)) < 0.01), :].reshape((npos, -1))
    w = np.median(w)  # in microns

    # Get offsets
    # positions of rays in FPA in mm from input spreadsheet
    pos_table = np.zeros((npos, 2))
    pos_table[:, 0] = indata[:, header.index("global_x")]
    pos_table[:, 1] = indata[:, header.index("global_y")]
    pos_ref = np.zeros((npos, 2))
    for j in range(npos):
        RB = RomanRayBundle(fpos[j, 0], fpos[j, 1], nn, use_filter, hasE=False)
        pos_ref[j, :] = RB.x_out
    dpos = pos_table - pos_ref
    if verbose:
        for ipos in range(npos):
            print(
                f"{ipos:3d}   {pos_ref[ipos, 0]:7.2f} {pos_ref[ipos, 1]:7.2f}"
                f"     {100 * dpos[ipos, 0]:8.3f} {100 * dpos[ipos, 1]:8.3f}"
            )
    # Linear regression of the offsets
    A = np.ones((npos, 3))
    A[:, :2] = pos_ref
    if verbose:
        print("shape of A=", np.shape(A), "shape of dpos=", np.shape(dpos))
    # rcond=None selects the documented machine-precision cutoff explicitly, which
    # avoids the FutureWarning (and version-dependent default) of older NumPy releases.
    coefs, resids = np.linalg.lstsq(A, dpos, rcond=None)[:2]

    # the fit is:
    # [tabulated - predicted] = coefs[:2, :] @ [predicted] + coefs[-1, :]
    if verbose:
        print("matrix", coefs[:2, :])
        print("intercept", coefs[-1, :])
        print("resids", resids)
        print("rms", np.sqrt(resids / npos))

    # count the consecutive Z1, Z2, ... columns present in the header
    nz = 1
    while f"Z{nz + 1:d}" in header:
        nz += 1
    input_zernikes = np.zeros((npos, nz))
    for iz in range(nz):
        input_zernikes[:, iz] = indata[:, header.index(f"Z{iz + 1:d}")]
    input_zernikes *= 0.001 * w  # convert input wavefront to millimeters

    if flip_y:
        # Z3, 5, etc. need to be flipped, so in Python indexing, start with 2
        input_zernikes[:, 2::2] *= -1.0

    # insert tip-tilt
    # check signs!
    input_zernikes[:, 1] += dpos[:, 0] / (4.0 * fratio)
    input_zernikes[:, 2] += dpos[:, 1] / (4.0 * fratio)

    # get transfer matrix
    T, s_decomp = aberration_transfer_matrix(use_filter=use_filter, nn=nn, n_zernike=nz)
    # and null out data we won't use
    # (the membership test and the lookup must use the same key; they used to differ)
    filter_key = use_filter[0]
    if filter_key in remove_tiptilt:
        for ipos in remove_tiptilt[filter_key]:
            input_zernikes[ipos, 1:3] = 0.0
            s_decomp[ipos, 1:3] = 0.0
            T[ipos, 1:3, :] = 0.0
    # reshape for SVD
    shape_orig = np.shape(T)
    T = T.reshape((-1, np.shape(T)[-1]))

    # Get the input parameters
    pars = np.zeros(np.shape(T)[-1]) if pars_input is None else np.copy(pars_input)
    if verbose:
        print(np.shape(s_decomp), np.shape(T), np.shape(pars))
    s_decomp += (T @ pars).reshape(np.shape(s_decomp))

    # and now the target change in Zernikes
    delta_zernike = input_zernikes - s_decomp

    if return_coefs:
        dpos2 = np.zeros((npos, 3))
        dpos2[:, :2] = dpos
        dpos2[:, 2] = delta_zernike[:, 3]  # focus
        return np.linalg.lstsq(A, dpos2, rcond=None)[0]

    # SVD of the free parameters
    Tfit = T.reshape(shape_orig)[:, c:, :].reshape((-1, shape_orig[-1]))
    m_, n_ = np.shape(T)
    nmin = 0 if nmin is None else nmin
    nmax = n_ if nmax is None else nmax
    Tfit = Tfit[:, nmin:nmax]  # shape of the parameters to fit
    m_ -= npos * c
    if m_ < nmax - nmin:
        # This used to be `assert ValueError(...)`, which is always truthy and never fired.
        raise ValueError("Too many surface modes to constrain with these Zernikes.")
    U, S, Vh = np.linalg.svd(Tfit, full_matrices=False, compute_uv=True)

    # Truncated pseudo-inverse: only singular values above smin are inverted. The
    # reciprocal is taken only where it is kept, so discarded zeros are never divided by.
    usable = smin < S
    S_pseudoinv = np.zeros_like(S)
    S_pseudoinv[usable] = 1.0 / S[usable]
    delta_pars = Vh.T @ np.diag(S_pseudoinv) @ U.T @ delta_zernike[:, c:].ravel()
    if verbose:
        print(f"number of Zernikes used in fit = {m_:d}")
        print(f"number of instrument modes constrained = {nmax - nmin:d}")
        print(f"number of singular values used = {np.count_nonzero(usable):d}")
        print("S >>", S)

    pars[nmin:nmax] += delta_pars

    # get new OPDs
    s_decomp += (T[:, nmin:nmax] @ delta_pars).reshape(np.shape(s_decomp))
    delta_zernike = input_zernikes - s_decomp

    if verbose:
        # root-sum-square of the residual in all modes from index 15 upward
        err_residual15 = np.sum(delta_zernike[:, 15:] ** 2, axis=1) ** 0.5
        for ipos in range(npos):
            print(
                f"{ipos:3d} {pos_ref[ipos, 0]:7.2f} {pos_ref[ipos, 1]:7.2f}"
                f" {1.0e6 * delta_zernike[ipos, 1]:7.1f}"
                f" {1.0e6 * delta_zernike[ipos, 2]:7.1f}"
                f"  {1.0e6 * delta_zernike[ipos, 3]:6.1f}"
                f" {1.0e6 * delta_zernike[ipos, 4]:6.1f}"
                f" {1.0e6 * delta_zernike[ipos, 5]:6.1f}"
                f"  {1.0e6 * delta_zernike[ipos, 6]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 7]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 8]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 9]:5.1f}"
                f"  {1.0e6 * delta_zernike[ipos, 10]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 11]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 12]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 13]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 14]:5.1f}"
                f" {1.0e6 * delta_zernike[ipos, 15]:5.1f}"
                f"   {1.0e6 * err_residual15[ipos]:5.1f}"
            )
        print(
            "rms residual =", (np.sum(delta_zernike[:, 1:] ** 2) / npos) ** 0.5 * 1.0e6, "nm (incl tip+tilt)"
        )
        print("rms residual =", (np.sum(delta_zernike[:, 3:] ** 2) / npos) ** 0.5 * 1.0e6, "nm")
        for j in range(1, len(delta_zernike[0, :])):
            print(f"{j+1} {np.mean(delta_zernike[:, j])} {np.std(delta_zernike[:, j])}")

    return pars




[docs]
def display_aberration_gradients(outfile):
    """
    Save aberration gradients as a FITS file.

    Every fifth field point of the gradient table is used (18 tiles in total). Each
    tile is pasted into a mosaic of 6 columns by 3 rows, with a per-column vertical
    shift in units of a quarter tile. The mosaic has one image plane per basis mode.

    Parameters
    ----------
    outfile : str
        Where to write.

    """

    side = 100  # must be a multiple of 4
    quarter = side // 4

    grads = aberration_gradients(nn=side, subtract_offset=True, mask=True)[::5, :, :, :].astype(np.float32)
    n_modes = np.shape(grads)[-1]
    mosaic = np.zeros((n_modes, 15 * side // 4, 6 * side), dtype=np.float32)

    # Mosaic column and row of each tile, and the vertical shift of each column
    # (in quarter tiles).
    tile_col = [2, 2, 2, 1, 1, 1, 0, 0, 0, 3, 3, 3, 4, 4, 4, 5, 5, 5]
    tile_row = [2, 1, 0] * 6
    col_shift = [3, 1, 0, 0, 1, 3]

    for itile, (col, row) in enumerate(zip(tile_col, tile_row)):
        y0 = row * side + quarter * col_shift[col]
        x0 = col * side
        # move the mode axis to the front so it matches the mosaic's plane axis
        mosaic[:, y0 : y0 + side, x0 : x0 + side] = np.transpose(grads[itile], axes=(2, 0, 1))

    fits.PrimaryHDU(mosaic).writeto(outfile, overwrite=True)