BatchPoisson.cpp

//
// Created by eliezer on 28.10.16.
//

#include "BatchPoisson.h"
/*************************************
 An ANSI-C implementation of the digamma-function for real arguments based
 on the Chebyshev expansion proposed in appendix E of
 http://arXiv.org/abs/math.CA/0403344 . This is identical to the implementation
 by Jet Wimp, Math. Comp. vol 15 no 74 (1961) pp 174 (see Table 1).
 For other implementations see
 the GSL implementation for Psi(Digamma) in
 http://www.gnu.org/software/gsl/manual/html_node/Psi-_0028Digamma_0029-Function.html

Richard J. Mathar, 2005-11-24
**************************************/
#include <math.h>

#ifndef M_PIl
/** The constant Pi in high precision */
#define M_PIl 3.1415926535897932384626433832795029L
#endif
#ifndef M_GAMMAl
/** Euler's constant in high precision */
#define M_GAMMAl 0.5772156649015328606065120900824024L
#endif
#ifndef M_LN2l
/** the natural logarithm of 2 in high precision */
#define M_LN2l 0.6931471805599453094172321214581766L
#endif

/** The digamma function in long double precision.
* @param x the real value of the argument
* @return the value of the digamma (psi) function at that point
* @author Richard J. Mathar
* @since 2005-11-24
*/
long double digammal(long double x)
{
    /* force into the interval 1..3 */
    if( x < 0.0L )
        return digammal(1.0L-x)+M_PIl/tanl(M_PIl*(1.0L-x)) ;	/* reflection formula */
    else if( x < 1.0L )
        return digammal(1.0L+x)-1.0L/x ;
    else if ( x == 1.0L)
        return -M_GAMMAl ;
    else if ( x == 2.0L)
        return 1.0L-M_GAMMAl ;
    else if ( x == 3.0L)
        return 1.5L-M_GAMMAl ;
    else if ( x > 3.0L)
        /* duplication formula */
        return 0.5L*(digammal(x/2.0L)+digammal((x+1.0L)/2.0L))+M_LN2l ;
    else
    {
        /* Just for your information, the following lines contain
        * the Maple source code to re-generate the table that is
        * eventually becoming the Kncoe[] array below
        * interface(prettyprint=0) :
        * Digits := 63 :
        * r := 0 :
        *
        * for l from 1 to 60 do
        * 	d := binomial(-1/2,l) :
        * 	r := r+d*(-1)^l*(Zeta(2*l+1) -1) ;
        * 	evalf(r) ;
        * 	print(%,evalf(1+Psi(1)-r)) ;
        *o d :
        *
        * for N from 1 to 28 do
        * 	r := 0 :
        * 	n := N-1 :
        *
         *	for l from iquo(n+3,2) to 70 do
        *		d := 0 :
         *		for s from 0 to n+1 do
         *		 d := d+(-1)^s*binomial(n+1,s)*binomial((s-1)/2,l) :
         *		od :
         *		if 2*l-n > 1 then
         *		r := r+d*(-1)^l*(Zeta(2*l-n) -1) :
         *		fi :
         *	od :
         *	print(evalf((-1)^n*2*r)) ;
         *od :
         *quit :
        */
        static long double Kncoe[] = { .30459198558715155634315638246624251L,
                                       .72037977439182833573548891941219706L, -.12454959243861367729528855995001087L,
                                       .27769457331927827002810119567456810e-1L, -.67762371439822456447373550186163070e-2L,
                                       .17238755142247705209823876688592170e-2L, -.44817699064252933515310345718960928e-3L,
                                       .11793660000155572716272710617753373e-3L, -.31253894280980134452125172274246963e-4L,
                                       .83173997012173283398932708991137488e-5L, -.22191427643780045431149221890172210e-5L,
                                       .59302266729329346291029599913617915e-6L, -.15863051191470655433559920279603632e-6L,
                                       .42459203983193603241777510648681429e-7L, -.11369129616951114238848106591780146e-7L,
                                       .304502217295931698401459168423403510e-8L, -.81568455080753152802915013641723686e-9L,
                                       .21852324749975455125936715817306383e-9L, -.58546491441689515680751900276454407e-10L,
                                       .15686348450871204869813586459513648e-10L, -.42029496273143231373796179302482033e-11L,
                                       .11261435719264907097227520956710754e-11L, -.30174353636860279765375177200637590e-12L,
                                       .80850955256389526647406571868193768e-13L, -.21663779809421233144009565199997351e-13L,
                                       .58047634271339391495076374966835526e-14L, -.15553767189204733561108869588173845e-14L,
                                       .41676108598040807753707828039353330e-15L, -.11167065064221317094734023242188463e-15L } ;

        register long double Tn_1 = 1.0L ;	/* T_{n-1}(x), started at n=1 */
        register long double Tn = x-2.0L ;	/* T_{n}(x) , started at n=1 */
        register long double resul = Kncoe[0] + Kncoe[1]*Tn ;

        x -= 2.0L ;

        for(int n = 2 ; n < sizeof(Kncoe)/sizeof(long double) ;n++)
        {
            const long double Tn1 = 2.0L * x * Tn - Tn_1 ;	/* Chebyshev recursion, Eq. 22.7.4 Abramowitz-Stegun */
            resul += Kncoe[n]*Tn1 ;
            Tn_1 = Tn ;
            Tn = Tn1 ;
        }
        return resul ;
    }
}

/** The optional interface to CREASO's IDL is added if someone has defined
* the cpp macro export_IDL_REF, which typically has been done by including the
* files stdio.h and idl_export.h before this one here.
*/
#ifdef export_IDL_REF
/** CALL_EXTERNAL interface.
* A template of calling this C function from IDL  is
* @verbatim
* dg = CALL_EXTERNAL('digamma.so',X)
* @endverbatim
* @param argc the number of arguments. This is supposed to be 1 and not
*    checked further because that might have negative impact on performance.
* @param argv the parameter list. The first element is the parameter x
*    supposed to be of type DOUBLE in IDL
* @return the return value, again of IDL-type DOUBLE
* @since 2007-01-16
* @author Richard J. Mathar
*/
double digamma_idl(int argc, void *argv[])
{
	long double x = *(double*)argv[0] ;
	return (double)digammal(x) ;
}
#endif /* export_IDL_REF */

#ifdef TEST

/* an alternate implementation for test purposes, using formula 6.3.16 of Abramowitz/Stegun with the
   first n terms */
#include <stdio.h>

long double digammalAlt(long double x, int n)
{
	/* force into the interval 1..3 */
	if( x < 0.0L )
		return digammalAlt(1.0L-x,n)+M_PIl/tanl(M_PIl*(1.0L-x)) ;	/* reflection formula */
	else if( x < 1.0L )
		return digammalAlt(1.0L+x,n)-1.0L/x ;
	else if ( x == 1.0L)
		return -M_GAMMAl ;
	else if ( x == 2.0L)
		return 1.0L-M_GAMMAl ;
	else if ( x == 3.0L)
		return 1.5L-M_GAMMAl ;
	else if ( x > 3.0L)
		return digammalAlt(x-1.0L,n)+1.0L/(x-1.0L) ;
	else
	{
		x -= 1.0L ;
		register long double resul = -M_GAMMAl ;

		for( ; n >= 1 ;n--)
			resul += x/(n*(n+x)) ;
		return resul ;
	}
}
int main(int argc, char *argv[])
{
	for( long double x=0.01 ; x < 5. ; x += 0.02)
		printf("%.2Lf %.30Lf %.30Lf %.30Lf\n",x, digammal(x), digammalAlt(x,100), digammalAlt(x,200) ) ;
}

#endif /* TEST */


void compute_gama_expected(ArrayXXf& a_x, ArrayXf& b_x, ArrayXXf& e_x,
                           ArrayXXf& elog_x) {
    for ( long i=0; i< a_x.cols();i++ ){
        for( long k=0; k< a_x.rows();k++){
            e_x(k,i) = a_x(k,i)/b_x(k);
            elog_x(k,i) = (float)(digammal(a_x(k,i))-log(b_x(k)));
        }
    }
}


BatchPoisson::BatchPoisson(uint64_t n_users,uint64_t n_wd_entries, uint64_t n_items, uint64_t k_feat, uint64_t n_words, uint64_t n_ratings,
                           uint64_t n_max_neighbors, float a, float b, float c, float d, float e, float f, float g,
                           float h, float k, float l)
: n_users(n_users), n_items(n_items), k_feat(k_feat),
n_words(n_words), n_ratings(n_ratings),
n_wd_entries(n_wd_entries),
n_max_neighbors(n_max_neighbors), a(a), b(b), c(c), d(d), e(e),
f(f), g(g), h(h), k(k), l(l) , a_beta(ArrayXXf::Constant(k_feat,n_words,a)),
b_beta(ArrayXf::Constant(k_feat,b)), e_beta(ArrayXXf::Constant(k_feat,n_words,0)),
elog_beta(ArrayXXf::Constant(k_feat,n_words,0)), a_theta(ArrayXXf::Constant(k_feat,n_items,c)),
b_theta(ArrayXf::Constant(k_feat,d)), e_theta(ArrayXXf::Constant(k_feat,n_items,0)),
elog_theta(ArrayXXf::Constant(k_feat,n_items,0)),a_epsilon(ArrayXXf::Constant(k_feat,n_items,g)),
b_epsilon(ArrayXf::Constant(k_feat,h)), e_epsilon(ArrayXXf::Constant(k_feat,n_items,0)),
elog_epsilon(ArrayXXf::Constant(k_feat,n_items,0)), a_eta(ArrayXXf::Constant(k_feat,n_users,e)),
b_eta(ArrayXf::Constant(k_feat,f)),e_eta(ArrayXXf::Constant(k_feat,n_users,0)),
elog_eta(ArrayXXf::Constant(k_feat,n_users,0)),a_tau(ArrayXXf::Constant(n_max_neighbors,n_users,k)),
b_tau(ArrayXf::Constant(n_max_neighbors,l)),e_tau(ArrayXXf::Constant(n_max_neighbors,n_users,0)),
elog_tau(ArrayXXf::Constant(n_max_neighbors,n_users,0)),
phi(ArrayXXf::Constant(k_feat,n_wd_entries,0)),xi_M(ArrayXXf::Constant(k_feat,n_ratings,0)),
xi_N(ArrayXXf::Constant(k_feat,n_ratings,0)),xi_S(ArrayXXf::Constant(n_max_neighbors,n_ratings,0))
{}

void BatchPoisson::train(vector<tuple<uint64_t, uint64_t, uint64_t>> r_entries,
                         vector<tuple<uint64_t, uint64_t, uint64_t>> w_entries,
                         vector<list<pair<uint64_t, uint64_t>>> user_items_neighboors,
                         uint64_t n_iter, double tol) {
    this->r_entries = r_entries;
    this->w_entries = w_entries;
    this->user_items_neighboors = user_items_neighboors;
    double old_elbo=-std::numeric_limits<double>::infinity();
    double elbo;
    for(auto i=0;i<n_iter;i++){
        update_aux_latent();
        update_latent();
        elbo = compute_elbo();
        elbo_lst.push_back(elbo);
        if(abs(elbo-old_elbo)/old_elbo < tol)
            break;
        else{
            old_elbo=elbo;
        }

    }
}

double BatchPoisson::compute_elbo() {
    return 0;
}


void BatchPoisson::init() {

}

void BatchPoisson::update_aux_latent(){
    float sum_k=0;
    for(auto ud=0; ud< n_ratings;ud++){
        auto user_u = std::get<0>(r_entries[ud]);
        auto item_i = std::get<1>(r_entries[ud]);
        for(auto k=0; k<k_feat;k++){
            // self.xi_M = np.exp(self.Elogeta[:, np.newaxis, :] + self.Elogtheta[:, :, np.newaxis])
            xi_M(k,ud)=exp(elog_eta(k,user_u)+elog_theta(k,item_i));

            // self.xi_N = np.exp(self.Elogeta[:, np.newaxis, :] + self.Elogepsilon[:, :, np.newaxis])
            xi_N(k,ud)=exp(elog_eta(k,user_u)+elog_epsilon(k,item_i));
            sum_k += xi_M(k,ud)+xi_N(k,ud);
        }
        xi_S.col(ud)=0;
        for(auto neighb : user_items_neighboors[ud]){
            xi_S(neighb.first,ud) = std::get<2>(r_entries[neighb.second])
                                    *exp(elog_tau(neighb.first,user_u));
            sum_k += xi_S(neighb.first,ud);
        }
        xi_M.col(ud)/=sum_k;
        xi_N.col(ud)/=sum_k;
        xi_S.col(ud)/=sum_k;
    }

    for(auto dv=0; dv< n_wd_entries;dv++){
        sum_k=0;
        auto word_w = std::get<0>(w_entries[dv]);
        auto item_i = std::get<1>(w_entries[dv]);
        for(auto k=0; k<k_feat;k++){
            // self.phi = np.exp(self.Elogbeta[:, np.newaxis, :] + self.Elogtheta[:, :, np.newaxis])
            phi(k,dv)=exp(elog_beta(k,word_w)+elog_theta(k,item_i));
            sum_k += phi(k,dv);
        }
        {
            phi.col(dv)/=sum_k;
        }

    }

}

void BatchPoisson::update_latent() {
    a_beta=a;
    a_theta=c;
    a_epsilon=g;
    a_eta=e;
    a_tau=k;

    for(auto ud=0; ud< n_ratings;ud++){
        auto user_u = std::get<0>(r_entries[ud]);
        auto item_i = std::get<1>(r_entries[ud]);
        auto r_ud= std::get<2>(w_entries[ud]);
        /** auto rudk_M=r_ud*xi_M.col(ud);
        auto rudk_N=r_ud*xi_N.col(ud);
        a_epsilon.col(item_i)+=rudk_N;
        a_theta.col(item_i)+=rudk_M;
        a_eta.col(user_u)+=rudk_M+rudk_N; **/
        for(auto k=0; k<k_feat;k++){
            auto rudk_M=r_ud*xi_M(k,ud);
            auto rudk_N=r_ud*xi_N(k,ud);
            a_epsilon(k,item_i)+=rudk_N;
            a_theta(k,item_i)+=rudk_M;
            a_eta(k,user_u)+=rudk_M+rudk_N;

        }
        /** a_tau.col(user_u)+=xi_S.col(ud); **/
        for(auto neighb : user_items_neighboors[ud]) {
            a_tau(neighb.first,user_u)+=xi_S(neighb.first, ud);
        }
    }
    double temp_w;
    for(auto dv=0; dv< n_wd_entries;dv++){

        auto word_w = std::get<0>(w_entries[dv]);
        auto item_i = std::get<1>(w_entries[dv]);
        auto wdv= std::get<2>(w_entries[dv]);
        for(auto k=0; k<k_feat;k++) {
            temp_w=wdv*phi(k,dv);
            a_beta(k,word_w)+=temp_w;
            a_theta(k,item_i)+=temp_w;

        }
    }

    b_beta=b;
    b_theta=d;
    b_epsilon=h;
    b_eta=f;

    for(auto k=0; k<k_feat;k++) {


    }

    update_expected();

}

void BatchPoisson::update_expected() {
    compute_gama_expected(a_beta, b_beta, e_beta, elog_beta);
    compute_gama_expected(a_theta, b_theta,e_theta,elog_theta);
    compute_gama_expected(a_epsilon, b_epsilon,e_epsilon,elog_epsilon);
    compute_gama_expected(a_eta, b_eta,e_eta,elog_eta);
    compute_gama_expected(a_tau, b_tau,e_tau,elog_tau);
}