Source code for vip_hci.psfsub.nmf_fullfr

#! /usr/bin/env python
"""
Module with PSF reference approximation using Non-negative matrix factorization
for ADI and RDI data, in full frames.

.. [LEE99]
   | Lee & Seung 1999
   | **Learning the parts of objects by non-negative matrix factorization**
   | *Nature, Volume 401, Issue 6755, pp. 788-791*
   | `https://ui.adsabs.harvard.edu/abs/1999Natur.401..788L
     <https://ui.adsabs.harvard.edu/abs/1999Natur.401..788L>`_

"""

__author__ = "Thomas Bédrine, Carlos Alberto Gomez Gonzalez, Valentin Christiaens"
__all__ = ["nmf", "NMF_Params"]

import numpy as np
from sklearn.decomposition import NMF
from dataclasses import dataclass, field
from enum import Enum
from typing import Tuple, List
from ..config.utils_param import setup_parameters, separate_kwargs_dict
from ..config.paramenum import Collapse, HandleNeg, Initsvd, ALGO_KEY
from ..config import timing, time_ini
from ..preproc import cube_derotate, cube_collapse
from ..preproc.derotation import _compute_pa_thresh, _find_indices_adi
from ..var import (prepare_matrix, reshape_matrix, frame_center, dist,
                   matrix_scaling, mask_circle)



[docs]
@dataclass
class NMF_Params:
    """
    Set of parameters for the NMF full-frame algorithm.

    See function `nmf` below for the documentation.
    """

    cube: np.ndarray = None
    angle_list: np.ndarray = None
    cube_ref: np.ndarray = None
    ncomp: int = 1
    scaling: Enum = None
    max_iter: int = 10000
    random_state: int = None
    mask_center_px: int = None
    source_xy: Tuple[int] = None
    delta_rot: float = 1
    fwhm: float = 4
    init_svd: Enum = Initsvd.NNDSVD
    collapse: Enum = Collapse.MEDIAN
    full_output: bool = False
    verbose: bool = True
    cube_sig: np.ndarray = None
    handle_neg: Enum = HandleNeg.MASK
    nmf_args: dict = field(default_factory=lambda: {})




[docs]
def nmf(*all_args: List, **all_kwargs: dict):
    """Non Negative Matrix Factorization [LEE99]_ for ADI sequences [GOM17]_.
    Alternative to the full-frame ADI-PCA processing that does not rely on SVD
    or ED for obtaining a low-rank approximation of the datacube. This function
    embeds the scikit-learn NMF algorithm solved through either the coordinate
    descent or the multiplicative update method.

    Parameters
    ----------
    all_args: list, optional
        Positionnal arguments for the NMF algorithm. Full list of parameters
        below.
    all_kwargs: dictionary, optional
        Mix of keyword arguments that can initialize a NMFParams and the optional
        'rot_options' dictionnary, with keyword values for "border_mode", "mask_val",
        "edge_blend", "interp_zeros", "ker" (see documentation of
        ``vip_hci.preproc.frame_rotate``). Can also contain a NMFParams named as
        `algo_params`.

    NMF parameters
    ----------
    cube : numpy ndarray, 3d
        Input cube.
    angle_list : numpy ndarray, 1d
        Corresponding parallactic angle for each frame.
    cube_ref : numpy ndarray, 3d, optional
        Reference library cube. For Reference Star Differential Imaging.
    ncomp : int, optional
        How many components are used as for low-rank approximation of the
        datacube.
    scaling : Enum, see `vip_hci.config.paramenum.Scaling`
        With None, no scaling is performed on the input data before SVD. With
        "temp-mean" then temporal px-wise mean subtraction is done, with
        "spat-mean" then the spatial mean is subtracted, with "temp-standard"
        temporal mean centering plus scaling to unit variance is done and with
        "spat-standard" spatial mean centering plus scaling to unit variance is
        performed.
    max_iter : int optional
        The number of iterations for the coordinate descent solver.
    random_state : int or None, optional
        Controls the seed for the Pseudo Random Number generator.
    mask_center_px : None or int
        If None, no masking is done. If an integer > 1 then this value is the
        radius of the circular mask.
    source_xy : tuple of int, optional
        For ADI-PCA, this triggers a frame rejection in the PCA library, with
        ``source_xy`` as the coordinates X,Y of the center of the annulus where
        the PA criterion is estimated. When ``ncomp`` is a tuple, a PCA grid is
        computed and the S/Ns (mean value in a 1xFWHM circular aperture) of the
        given (X,Y) coordinates are computed.
    delta_rot : float, optional
        Factor for tunning the parallactic angle threshold, expressed in FWHM.
        Default is 1 (excludes 1xFWHM on each side of the considered frame).
    fwhm : float, optional
        Known size of the FWHM in pixels to be used. Default value is 4.
    init_svd: Enum, see `vip_hci.config.paramenum.Initsvd`
        Method used to initialize the iterative procedure to find H and W.
        'nndsvd': non-negative double SVD recommended for sparseness
        'nndsvda': NNDSVD where zeros are filled with the average of cube;
        recommended when sparsity is not desired
        'random': random initial non-negative matrix
    collapse : Enum, see `vip_hci.config.paramenum.Collapse`
        Sets the way of collapsing the frames for producing a final image.
    full_output: boolean, optional
        Whether to return the final median combined image only or with other
        intermediate arrays.
    verbose : {True, False}, bool optional
        If True prints intermediate info and timing.
    handle_neg: Enum, see `vip_hci.config.paramenum.HandleNeg`
        Determines how to handle negative values: mask them, set them to zero,
        or subtract the minimum value in the arrays. Note: 'mask' or 'null'
        may leave significant artefacts after derotation of residual cube
        => those options should be used carefully (e.g. with proper treatment
        of masked values in non-derotated cube of residuals).
    nmf_args : dictionary, optional
        Additional arguments for scikit-learn NMF algorithm. See:
        https://scikit-learn.org/stable/modules/generated/sklearn.decomposition.NMF.html

    Returns
    -------
    If full_output is False the final frame is returned. If True the algorithm
    returns the reshaped NMF components, the reconstructed cube, the residuals,
    the residuals derotated and the final frame.

    """
    # Separating the parameters of the ParamsObject from the optionnal rot_options
    class_params, rot_options = separate_kwargs_dict(
        initial_kwargs=all_kwargs, parent_class=NMF_Params
    )

    # Extracting the object of parameters (if any)
    algo_params = None
    if ALGO_KEY in rot_options.keys():
        algo_params = rot_options[ALGO_KEY]
        del rot_options[ALGO_KEY]

    if algo_params is None:
        algo_params = NMF_Params(*all_args, **class_params)

    array = algo_params.cube.copy()
    if algo_params.verbose:
        start_time = time_ini()
    n, y, x = array.shape

    matrix_ref = None
    matrix_sig = None

    # how to handle negative values
    if algo_params.handle_neg == HandleNeg.MASK:
        if algo_params.mask_center_px:
            array = mask_circle(array, algo_params.mask_center_px)
        if algo_params.cube_sig is not None:
            yy, xx = np.where(
                np.amin(array - np.abs(algo_params.cube_sig), axis=0) > 0)
        else:
            yy, xx = np.where(np.amin(array, axis=0) > 0)
        H_tmp = np.zeros([algo_params.ncomp, y, x])
        if len(yy) > 0:
            matrix = array[:, yy, xx]
            matrix = matrix_scaling(matrix, algo_params.scaling)
            if algo_params.cube_ref is not None:
                matrix_ref = algo_params.cube_ref[:, yy, xx]
                matrix_ref = matrix_scaling(matrix_ref, algo_params.scaling)
            if algo_params.cube_sig is not None:
                matrix_sig = algo_params.cube_sig[:, yy, xx]
        else:
            raise ValueError("Remove frame(s) with negative values")
    else:
        if algo_params.handle_neg == HandleNeg.NULL:
            if algo_params.cube_sig is not None:
                array[np.where(array - algo_params.cube_sig < 0)] = 0
                algo_params.cube_sig[np.where(
                    array - algo_params.cube_sig < 0)] = 0
            else:
                array[np.where(array < 0)] = 0

        elif algo_params.handle_neg == HandleNeg.SUBTR_MIN:
            if algo_params.cube_sig is not None:
                array -= np.amin(array - algo_params.cube_sig)
            else:
                array -= np.amin(array)
        else:
            raise ValueError("Mode to handle neg. pixels not recognized")

        matrix = prepare_matrix(
            array,
            algo_params.scaling,
            algo_params.mask_center_px,
            mode="fullfr",
            verbose=algo_params.verbose,
        )
        if algo_params.cube_ref is not None:
            matrix_ref = prepare_matrix(
                algo_params.cube_ref,
                algo_params.scaling,
                algo_params.mask_center_px,
                mode="fullfr",
                verbose=algo_params.verbose,
            )
        if algo_params.cube_sig is not None:
            matrix_sig = prepare_matrix(
                algo_params.cube_sig,
                algo_params.scaling,
                algo_params.mask_center_px,
                mode="fullfr",
                verbose=algo_params.verbose,
            )

    if algo_params.cube_sig is not None:
        # derotate
        residuals_cube = algo_params.cube_sig.copy()
    else:
        residuals_cube = np.zeros_like(array)

    if algo_params.source_xy is None:
        add_params = {
            "matrix": matrix,
            "matrix_ref": matrix_ref,
            "matrix_sig": matrix_sig,
        }
        func_params = setup_parameters(
            params_obj=algo_params, fkt=_project_subtract, **add_params
        )
        residuals = _project_subtract(**func_params, **algo_params.nmf_args)
        if algo_params.verbose:
            timing(start_time)
        if algo_params.full_output:
            # reconstructed = residuals[1]
            H = residuals[2]
            reconstructed = residuals[1]
            residuals = residuals[0]
        recon_cube = residuals_cube.copy()
        if algo_params.handle_neg == "mask":
            for fr in range(n):
                residuals_cube[fr][yy, xx] = residuals[fr]
            if algo_params.full_output:
                for fr in range(n):
                    recon_cube[fr][yy, xx] = reconstructed[fr]
                for pp in range(algo_params.ncomp):
                    H_tmp[pp][yy, xx] = H[pp]
                H = H_tmp
        else:
            for fr in range(n):
                residuals_cube[fr] = residuals[fr].reshape((y, x))
            if algo_params.full_output:
                recon_cube = reshape_matrix(reconstructed, y, x)
                H = H.reshape(algo_params.ncomp, y, x)
    else:
        if algo_params.delta_rot is None or algo_params.fwhm is None:
            msg = "Delta_rot or fwhm parameters missing. Needed for the"
            msg += "PA-based rejection of frames from the library"
            raise TypeError(msg)
        recon_cube = np.zeros_like(algo_params.cube)
        yc, xc = frame_center(algo_params.cube[0], False)
        x1, y1 = algo_params.source_xy
        ann_center = dist(yc, xc, y1, x1)
        pa_thr = _compute_pa_thresh(
            ann_center, algo_params.fwhm, algo_params.delta_rot)
        mid_range = (
            np.abs(np.amax(algo_params.angle_list) -
                   np.amin(algo_params.angle_list))
            / 2
        )
        if pa_thr >= mid_range - mid_range * 0.1:
            new_pa_th = float(mid_range - mid_range * 0.1)
            if algo_params.verbose:
                msg = "PA threshold {:.2f} is too big, will be set to "
                msg += "{:.2f}"
                print(msg.format(pa_thr, new_pa_th))
            pa_thr = new_pa_th

        for fr in range(n):
            ind = _find_indices_adi(algo_params.angle_list, fr, pa_thr)
            add_params = {
                "matrix": matrix,
                "matrix_ref": matrix_ref,
                "matrix_sig": matrix_sig,
                "indices": ind,
                "frame": fr,
            }
            func_params = setup_parameters(
                params_obj=algo_params, fkt=_project_subtract, **add_params
            )
            res_result = _project_subtract(
                **func_params, **algo_params.nmf_args)
            # ! Instead of reshaping, fill frame using get_annulus?
            if algo_params.full_output:
                residuals = res_result[0]
                recon_frame = res_result[1]
                H = res_result[2]
                if algo_params.handle_neg == "mask":
                    recon_cube[fr][yy, xx] = recon_frame
                else:
                    recon_cube[fr] = recon_frame.reshape((y, x))
            else:
                residuals = res_result
            if algo_params.handle_neg == "mask":
                residuals_cube[fr][yy, xx] = residuals
                if fr == n - 1 and algo_params.full_output:
                    for pp in range(algo_params.ncomp):
                        H_tmp[pp][yy, xx] = H[pp]
                    H = H_tmp
            else:
                residuals_cube[fr] = residuals.reshape((y, x))
                if fr == n - 1 and algo_params.full_output:
                    H = H.reshape(algo_params.ncomp, y, x)

    if algo_params.verbose:
        print("Done NMF with sklearn.NMF.")
        timing(start_time)

    residuals_cube_ = cube_derotate(
        residuals_cube, algo_params.angle_list, **rot_options
    )
    frame = cube_collapse(residuals_cube_, mode=algo_params.collapse)

    if algo_params.verbose:
        print("Done derotating and combining.")
        timing(start_time)
    if algo_params.full_output:
        return (H, recon_cube, residuals_cube, residuals_cube_, frame)
    else:
        return frame



def _project_subtract(
    matrix,
    matrix_ref,
    ncomp,
    scaling,
    mask_center_px,
    verbose,
    full_output,
    indices=None,
    frame=None,
    matrix_sig=None,
    max_iter=100,
    random_state=None,
    init_svd="nndsvda",
    **kwargs
):
    """
    PCA projection and model PSF subtraction. Used as a helping function by
    each of the PCA modes (ADI, ADI+RDI, ADI+mSDI).

    Parameters
    ----------
    cube : numpy ndarray
        Input cube.
    cube_ref : numpy ndarray
        Reference cube.
    ncomp : int
        Number of principal components.
    scaling : str
        Scaling of pixel values. See ``pca`` docstrings.
    mask_center_px : int
        Masking out a centered circular aperture.
    verbose : bool
        Verbosity.
    full_output : bool
        Whether to return intermediate arrays or not.
    indices : list
        Indices to be used to discard frames (a rotation threshold is used).
    frame : int
        Index of the current frame (when indices is a list and a rotation
        threshold was applied).
    cube_sig: numpy ndarray, opt
        Cube with estimate of significant authentic signals. If provided, this
        will be subtracted from both the cube and the PCA library, before
        projecting the cube onto the principal components.

    Returns
    -------
    ref_lib_shape : int
        [indices is not None, frame is not None] Number of
        rows in the reference library for the given frame.
    residuals: numpy ndarray
        Residuals, returned in every case.
    reconstructed : numpy ndarray
        [full_output=True] The reconstructed array.
    V : numpy ndarray
        [full_output=True, indices is None, frame is None] The right singular
        vectors of the input matrix, as returned by ``svd/svd_wrapper()``
    """
    if matrix_sig is None:
        matrix_emp = matrix.copy()
    else:
        matrix_emp = matrix - matrix_sig

    if matrix_ref is not None:
        ref_lib = matrix_ref
    elif indices is not None and frame is not None:
        ref_lib = matrix_emp[indices].copy()
    else:
        ref_lib = matrix_emp.copy()

    # to avoid bug, just consider positive values
    if np.median(ref_lib) < 0:
        raise ValueError("Mostly negative values in the cube")
    else:
        ref_lib[np.where(ref_lib < 0)] = 0

    solver = "mu"
    # if init_svd != 'nndsvd':
    #     solver = 'mu'
    # else:
    #     solver = 'cd'
    mod = NMF(
        n_components=ncomp,
        solver=solver,
        init=init_svd,
        max_iter=max_iter,
        random_state=random_state,
        **kwargs
    )
    # a rotation threshold is used (frames are processed one by one)
    if indices is not None and frame is not None:
        if ref_lib.shape[0] <= 10:
            raise RuntimeError(
                "Less than 10 frames left in the PCA library"
                ", Try decreasing the parameter delta_rot"
            )
        curr_frame = matrix[frame]  # current frame
        curr_frame_emp = matrix_emp[frame]
        # H [ncomp, n_pixels]
        H = mod.fit(ref_lib).components_
        # W: coefficients [1, ncomp]
        W = mod.transform(curr_frame_emp[np.newaxis, ...])
        # V = svd_wrapper(ref_lib, svd_mode, ncomp, False)
        # transformed = np.dot(curr_frame_emp, V.T)
        # reconstructed = np.dot(transformed.T, V)
        reconstructed = np.dot(W, H)
        residuals = curr_frame - reconstructed
        if full_output:
            return residuals, reconstructed, H
        else:
            return residuals

    # the whole matrix is processed at once
    else:
        # H [ncomp, n_pixels]: Non-negative components of the data
        # if cube_ref is not None:
        H = mod.fit(ref_lib).components_
        # else:
        #    H = mod.fit(matrix).components_

        # W: coefficients [n_frames, ncomp]
        W = mod.transform(matrix_emp)

        reconstructed = np.dot(W, H)
        residuals = matrix - reconstructed

        # V = svd_wrapper(ref_lib, svd_mode, ncomp, verbose)
        # transformed = np.dot(V, matrix_emp.T)
        # reconstructed = np.dot(transformed.T, V)
        # residuals = matrix - reconstructed
        # residuals_res = reshape_matrix(residuals, y, x)
        if full_output:
            return residuals, reconstructed, H
        else:
            return residuals