# dfdri.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Differential-Fourier-Domain-Regularized-Inversion.

Created on 27 Jul 2021, updated Aug 5 2021, style corrections Oct. 2022


This D-FDRI code in Python generates a measurement
matrix with sampling patterns and a reconstruction matrix
for single pixel imaging (SPI). The description of D-FDRI
is included in the following paper and at
https://github.com/rkotynski/D_FDRI.
This file defines the dfdri module. See example.py for usage instructions.
Citation: [1] A. Pastuszczak, R. Stojek, P. Wróbel,
and R. Kotyński, "Differential real-time single-pixel imaging with
Fourier domain regularization: applications to VIS-IR imaging and
polarization imaging," Opt. Express 29, 26685-26700 (2021).
https://doi.org/10.1364/OE.433199 (open access)
Download: https://github.com/rkotynski/D_FDRI/
Contact (authors): anna.pastuszczak@fuw.edu.pl,
rafal.stojek@fuw.edu.pl, piotr.wrobel@fuw.edu.pl, rafal.kotynski@fuw.edu.pl
Acknowledgement: National Science Center (Poland),
UMO-2017/27/B/ST7/00885 (RS,PW,RK), UMO-2019/35/D/ST7/03781 (AP).


  GPL LICENSE INFORMATION

 This program is free software: you can redistribute it and/or modify
 it under the terms of the GNU General Public License as published by
 the Free Software Foundation, either version 3 of the License, or
 (at your option) any later version.

 This program is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.

 You should have received a copy of the GNU General Public License
 along with this program.  If not, see <http://www.gnu.org/licenses/>.
"""


import numpy as np
from scipy import fft, linalg


class DFDRI:
    """Differential-Fourier-Domain-Regularized-Inversion class."""

    def __init__(self, μ=0.5, ϵ=1e-7, p=1, m=7, dim=(256, 256), CR=0.03,
                 verbose=True):
        """Initialize the object and set the defauld values of parameters.

        Parameters
        ----------
        μ,ϵ,p, m : D-FDRI parameters (See sect. 2.2 of ref. [1]).
                p=1,2 is the order of finite difference operator D
                m is an odd intteger defining the number of pixel areas
                used to evaluate the zeroth spatial frequency of the image
                μ,ϵ describe the properties of generalized inversion
        dim : dimension of images (tuple). The default is (256,256)
        CR : Compression ratio. The default is 3%.
        verbose : bool. The default is True. Determins whether to print
        comments during program execution
        """
        self.μ = μ
        self.ϵ = ϵ
        self.p = p
        self.m = m
        self.CR = CR
        self.dim = dim
        self.verbose = verbose
        self.M_dct = None
        self.Mbin = None
        self.Pg = None
        if self.verbose:
            print('Differential Fourier Domain Regularized Inversion (D-FDRI)')
            print('This is a python module for')
            print('compressive differential Single Pixel Imaging (SPI).')
            print('It calculates the measurement matrix with binarized DCT')
            print('sampling patterns and reconstructs images from ')
            print('compressive measurements at a high speed.')
            print('For details please see')
            print(' https://doi.org/10.1364/OE.433199 (open access)')
            print('If you find this code useful, please cite our work.\n')

            print('Default parameters:')
            print(f'dim={dim}\t-image resolution')
            print(f'p={p}\t\t\t\t-order of the finite difference operator')
            print(f'm={m}\t\t\t\t- (p+m) is the number of binary patterns used')
            print('to measure the 0th spatial freq.')
            print(f'μ={μ}, ϵ={ϵ}\t-FDRI parameters')
            print(f'CR={CR}\t\t\t-compression ratio')

    def differential_operator(self, p=None):
        """
        Return a function which is a differential operator of order p.

        (p=1 or p=2)
        The operator takes a matrix as its first argument.
        If the second argument ax=1, then it operates on the matrix from
        the right side.
        """
        def D2(Y, right=False):
            if right:
                return np.hstack((
                    np.zeros((Y.shape[0], 1)),
                    Y,
                    np.zeros((Y.shape[0], 1)))) - 0.5*np.hstack((
                        np.zeros((Y.shape[0], 2)), Y)) - 0.5 * np.hstack((
                            Y, np.zeros((Y.shape[0], 2))))
            else:
                return Y[1:-1, :]-0.5*Y[:-2, :]-0.5*Y[2:, :]

        def D1(Y, right=False):
            if right:
                return np.hstack((
                    np.zeros((Y.shape[0], 1)), Y)) - np.hstack(
                        (Y, np.zeros((Y.shape[0], 1))))
            else:
                return np.diff(Y, axis=0)

        if p is None:
            p = self.p

        return D1 if p == 1 else D2

    def auxiliary_matrix_a(self, p=None, m=None, use_precalculated=True,
                           maxiter=5000):
        """
        Calculate and return an auxilliary matrix A (See sect. 2.1 of Ref [1]).

        Parameters
        ----------
        p : =1 or 2, order of the differential operator
            The default is None (the class default).
        m : an odd int, the returned matrix is of size [p+m,m]
            The default is None (the class default).
        use_precalculated : bool, check if a precalculated matrix is available
            DESCRIPTION. The default is True.
        maxiter : number of iterations in evaluation of A
            The default is 5000.

        Returns
        -------
        A : auxiliary binary matrix which columns represent subsets of
        pixels (See sect. 2.1 of Ref [1]).

        """
        if p is None:
            p = p = self.p
        if m is None:
            m = m = self.m
        assert((m & 1) and (m > 1))   # m must be odd
        if use_precalculated:
            A_precalculated = {
                (2, 7): [[0, 0, 0, 0, 1, 1, 1], [1, 0, 0, 1, 1, 0, 0],
                         [1, 1, 0, 0, 1, 0, 0], [1, 1, 1, 1, 0, 0, 0],
                         [1, 0, 0, 1, 0, 1, 0], [0, 1, 0, 1, 1, 0, 1],
                         [0, 0, 1, 0, 1, 1, 1], [0, 0, 1, 0, 0, 1, 1],
                         [0, 1, 1, 1, 0, 0, 0]],
                (2, 5): [[1, 0, 1, 1, 0], [1, 1, 0, 1, 0], [1, 0, 0, 1, 0],
                         [0, 0, 1, 1, 0], [1, 1, 1, 0, 0], [0, 1, 0, 0, 1],
                         [1, 0, 0, 1, 1]],
                (2, 3): [[0, 1, 1], [0, 0, 1], [0, 1, 0], [1, 0, 0],
                         [1, 1, 0]],
                (1, 7): [[0, 1, 0, 0, 1, 1, 1], [1, 1, 0, 0, 0, 0, 1],
                         [0, 0, 1, 1, 1, 0, 0], [1, 0, 1, 1, 0, 0, 1],
                         [0, 1, 1, 0, 0, 1, 0], [0, 1, 0, 0, 1, 1, 0],
                         [1, 1, 1, 0, 0, 0, 1], [0, 0, 1, 0, 1, 1, 1]],
                (1, 5): [[1, 1, 0, 1, 0], [1, 0, 1, 1, 0], [1, 1, 0, 0, 0],
                         [0, 1, 0, 1, 1], [1, 1, 1, 0, 0], [1, 0, 1, 0, 1]],
                (1, 3): [[0, 1, 1], [1, 1, 0], [1, 0, 0], [0, 1, 0]]}
            if (p, m) in A_precalculated.keys():
                A = np.array(A_precalculated[p, m])
                if self.verbose:
                    print(
                        f'Using the precalculated auxiliary differential\
                            DC-decomposition matrix A\n{A}')
                return A
        if self.verbose:
            print(
                f'Preparing the auxiliary differential DC-decomposition\
                    matrix A (m={m},p={p})')
        DIFF = self.differential_operator(p)

        A = []
        for i in range(2**m):
            b = np.binary_repr(i, m)
            v = np.array([int(b[j]) for j in range(m)])
            if v.sum() == m//2 or v.sum() == (m//2)+1:
                A.append(v)
        A0 = np.array(A)
        ntst = maxiter
        Abest = None
        stdbest = np.inf
        while(True):
            prm = np.random.permutation(A0.shape[0])[:m+p]
            M = DIFF(A0[prm, :])
            r = np.linalg.matrix_rank(M)
            if r == m:
                A = A0[prm, :]
                ntst -= 1
                coef = np.linalg.inv(DIFF(A).T).sum(axis=1)
                stdnew = (DIFF(coef.reshape((1, -1)), right=1)**2).sum()
                if stdnew < stdbest:
                    # select the matrix giving the most uniform distribution
                    stdbest = stdnew
                    Abest = np.array(A)
                    if self.verbose:
                        print(f'iter={maxiter-ntst}, crit={stdbest}')
                if ntst <= 0:
                    A = Abest
                    if self.verbose:
                        print(
                            f'Finished calculating the auxiliary matrix\n\
                                A={A}')
                    return A

    def dct_sampling_functions(self, dim=None, rows=None, CR=0.03):
        """Create a measuremnt matrix with DCT functions.

        Create a matrix M with rows containg low-frequency continuous-valued
        2d DCT functions.The DCT functions are stored in rows of matrix M,
        and their locations in the 2D DCT basis are indicated by the logical
        matrix SM. The returned matrix does not contain the zeroth frequency
        pattern. The compression ratio CR may be passed to the function
        instead of the number of rows. If binarize is True then a binarization
        with a randomly varied threshold is applied to M. The range of
        threshold values is governed by the value of m

        Parameters
        ----------
        dim : size of DCT basis
        rows : number of patterns to create
        CR : compression ratio (may override rows)

        Returns
        -------
        M :a real valued matrix M with rows containg low-frequency
        continuous-valued 2d DCT functions
        SM:a binary selection matrix pointing to the positions of the returned
        functions in the DCT basis
        """
        if self.verbose:
            print('Calculating the real-valued DCT patterns')
        if dim is None:
            dim = self.dim
        cols = np.prod(dim)
        if rows is None:
            rows = int(round(cols*CR))

        def InvTransform(x): return fft.idctn(x, norm='ortho')
        (x, y) = np.meshgrid(range(dim[1]), range(dim[0]))
        Avg = 1/(x+y+1e-7)  # selection function for the 2d DCT basis
        Avg[0, 0] = 0  # the 0th spatial frequency is excluded
        ind = np.argsort(-Avg.reshape(-1))[:rows]
        SM = np.zeros(Avg.size, dtype=bool)  # selection matrix
        SM[ind] = True
        P = np.flatnonzero(SM)
        M = np.zeros((rows, cols))
        ind = np.zeros(dim)
        for r in range(rows):
            ind.reshape(-1)[P[r]] = 1
            it = InvTransform(ind).reshape((1, -1))
            ind.reshape(-1)[P[r]] = 0
            M[r, :] = it
        self.M_dct = M
        return M, SM.reshape(dim)

    def binary_measurement_matrix(self, M_dct=None, A=None):
        """
        Calculate the binary measurement matrix.

        Calculate the final binary measurement matrix M consisting of
        (p+m) binary patterns that encode differentialy the zeroth spatial
        frequency of the measurement followed by the binarized rows of
        matrix M_dct
        Note: other kinds of patterns than the DCT basis could be also
        passed to this function

        Parameters
        ----------
        M_dct : the real-valued matrix with DCT patterns
        A : the auxiliary matrix encoding the measurement of the zeroth
        spatial frequency

        Returns
        -------
        M : the final binary measurement matrix with all of the patterns
        that will be displayed on the DMD stored in rows.
        """
        if A is None:
            A = self.auxiliary_matrix_a()
        if M_dct is None:
            if self.M_dct is None:
                self.dct_sampling_functions()
            M_dct = self.M_dct
        if self.verbose:
            print('Calculating the final binary measurement matrix')
        m = A.shape[1]
        p = A.shape[0]-m
        k_dct = M_dct.shape[0]
        k = m+p+k_dct
        n = M_dct.shape[1]
        M = np.zeros((k, n), dtype=np.single, order='F')
        ind = np.random.randint(0, m, n)
        for i in range(m):
            M[:m+p, ind == i] = A[:, i].reshape((-1, 1))
        for r in range(k_dct):
            argsrt = np.argsort(M_dct[r, :].ravel()+1e-7*np.random.rand(n))
            M[m+p+r, argsrt[round(n/2 * (2*np.random.rand()+m-1)/m):]] = 1
        self.Mbin = M
        return M

    def d_fdri(self, Mbin=None, p=None, dim=None, μ=None, ϵ=None, tol=1e-7):
        """
        Calculate the reconstruction matrix Pg (See Eq. (6) of Ref. [1]).

        Parameters
        ----------
        Mbin : the measurement matrix (M in Eq. (6))
        p : =1,2 order of the finite difference operator

        dim : Tpattern dimensions

        μ : parameter of FDRI controlling the shape of the spatial spectrum
        ϵ : parameter of FDRI controlling noise robustness
        tol : tolerance in the calculation of the pseudoinverse
        (defaults to 1e-7).

        Returns
        -------
        Pg: the reconstruction matrix (See Eq. (6))

        """
        if Mbin is None:
            if self.Mbin is None:
                self.binary_measurement_matrix()
            Mbin = self.Mbin
        if p is None:
            p = self.p
        if dim is None:
            dim = self.dim
        if μ is None:
            μ = self.μ
        if ϵ is None:
            ϵ = self.ϵ
        if self.verbose:
            print('Calculating the reconstruction matrix\
                  (may take a lot of time)')
        DIFF = self.differential_operator(p)
        M = DIFF(Mbin.reshape(-1, np.prod(dim)))
        Ny, Nx = dim

        def w(N): return (2*np.pi/N) * \
            np.hstack((np.arange(N//2), np.arange(-N//2, 0)))
        (wx, wy) = np.meshgrid(w(Nx), w(Ny))
        D = 1/np.sqrt((1-μ)**2 * (np.sin(wx)**2+np.sin(wy)**2) +
                      ϵ + μ**2*(wx**2+wy**2)/(2*np.pi**2))

        def row_fft2(X): return fft.fftn(X.reshape((-1, Ny, Nx)),
                                         axes=(-2, -1)).reshape((-1, Ny*Nx))

        def row_ifft2(X): return fft.ifftn(
            X.reshape((-1, Ny, Nx)), axes=(-2, -1)).reshape((-1, Ny*Nx))

        def col_fft2(X): return fft.fftn(X.T.reshape(
            (-1, Ny, Nx)), axes=(-2, -1)).reshape((-1, Ny*Nx)).T

        def col_ifft2(X): return fft.ifftn(X.T.reshape(
            (-1, Ny, Nx)), axes=(-2, -1)).reshape((-1, Ny*Nx)).T

        def FILT_R(X): return row_fft2(row_ifft2(X)*D.reshape(-1))  # F*D*F'*X
        def FILT_L(X): return col_fft2(
            D.reshape(-1, 1)*col_ifft2(X))  # F*D*F'*X
        a = FILT_R(M.reshape((-1, Nx*Ny))).real
        # use svd to calculate the pseudoinverse
        U, S, V = linalg.svd(a, full_matrices=False)  # a = U*S*V'
        inv_S = 1/S
        ind = np.abs(S) < tol*np.abs(S).max()
        if np.any(ind):
            print('Warning: zero svd values: ', ind.sum())
        inv_S[ind] = 0
        P = np.array(FILT_L((V.T.conj()*inv_S.reshape(-1))@U.T.conj()).real)
        self.Pg = np.array(DIFF(P, right=True), dtype=np.single, order='F')
        if self.verbose:
            print('Done')
        return self.Pg

    def reconstruct(self, P=None, channel=1):
        """
        Calculate a function responsible for image reconstruction.

        The returned function calculates a matrix-vector product with
        negative values replaced by zeros.

        Parameters
        ----------
        P : the reconstruction matrix (Pg in Eq. (11))
        channel : 1 or 2, the direct channel (1) or the complementary
        channel (2) (denoted as l in Eq. (11))

        Returns
        -------
        a function that evaluates Eq. (11) in [1] responsible for image
        reconstruction

        """
        if P is None:
            P = self.Pg

        def relu(x):
            x[x < 0] = 0
            return x
        if channel == 1:
            P0 = np.array(P, dtype=np.single, order='F')
        else:
            P0 = np.array(-P, dtype=np.single, order='F')
        return lambda y: relu(P0@y.reshape((-1, 1)))

    def psnr(self, orig, tstimg):
        """Find the PSNR of tstimg."""
        MSE = np.mean((orig - tstimg) ** 2)
        vmax = orig.max()
        PSNR = 10 * np.log10(vmax**2 / MSE)
        return PSNR


def main():
    """Create a DFDRI object with verbose output and print a usage hint."""
    usage_hint = 'See example.py for usage instructions.'
    DFDRI(verbose=True)  # with verbose=True the constructor prints a banner
    print(usage_hint)


# When the module is run as a script, main() is called; it is not called
# when the module is imported.
if __name__ == "__main__":
    main()