// t3_hopm.hpp — vmmlib 1.7.0
/*
 * Copyright (c) 2006-2014, Visualization and Multimedia Lab,
 * University of Zurich <http://vmml.ifi.uzh.ch>,
 * Eyescale Software GmbH,
 * Blue Brain Project, EPFL
 *
 * This file is part of VMMLib <https://github.com/VMML/vmmlib/>
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * Redistributions of source code must retain the above copyright notice, this
 * list of conditions and the following disclaimer. Redistributions in binary
 * form must reproduce the above copyright notice, this list of conditions and
 * the following disclaimer in the documentation and/or other materials provided
 * with the distribution. Neither the name of the Visualization and Multimedia
 * Lab, University of Zurich nor the names of its contributors may be used to
 * endorse or promote products derived from this software without specific prior
 * written permission.
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

/* @author Susanne Suter
 * @author Rafa Ballester
 *
 * The higher-order power method (HOPM) is also known as CP-ALS (ALS: alternating least squares).
 * CP stands for Candecomp/Parafac (1970).
 * References:
 * - Carroll & Chang, 1970: Analysis of Individual Differences in Multidimensional Scaling via an N-way generalization of "Eckart--Young" decompositions, Psychometrika.
 * - Harshman, 1970: Foundations of the PARAFAC procedure: Models and conditions for an 'explanatory' multi-modal factor analysis, UCLA Working Papers in Phonetics.
 * - De Lathauwer, De Moor, Vandewalle, 2000: A multilinear singular value decomposition, SIAM J. Matrix Anal. Appl.
 * - Kolda & Bader, 2009: Tensor Decompositions and Applications, SIAM Review.
 * - Bader & Kolda, 2006: Algorithm 862: Matlab tensor classes for fast algorithm prototyping. ACM Transactions on Mathematical Software.
 */

#ifndef __VMML__T3_HOPM__HPP__
#define __VMML__T3_HOPM__HPP__

#include <vmmlib/t3_hosvd.hpp>
#include <vmmlib/matrix_pseudoinverse.hpp>
#include <vmmlib/blas_dgemm.hpp>
#include <vmmlib/blas_dot.hpp>
#include <vmmlib/validator.hpp>
#include <vmmlib/t3_ttv.hpp>
#include <vmmlib/tensor_stats.hpp>

#include <algorithm>  // std::sort
#include <cassert>
#include <cmath>      // sqrt, fabs
#include <cstdlib>    // srand
#include <ctime>      // time
#include <utility>    // std::pair
#include <vector>

namespace vmml {

60  template< size_t R, size_t I1, size_t I2, size_t I3, typename T = float >
61  class t3_hopm {
62  public:
64 
66 
70 
74 
78 
80 
81  typedef typename lambda_type::iterator lvalue_iterator;
82  typedef typename lambda_type::const_iterator lvalue_const_iterator;
83  typedef std::pair< T, size_t > lambda_pair_type;
84 
85  //higher-order power method (lathauwer et al., 2000b)
86 
87  template< typename T_init >
88  static tensor_stats als(const t3_type& data_, u1_type& u1_, u2_type& u2_, u3_type& u3_, lambda_type& lambdas_, T_init init, const size_t max_iterations_ = 50, const float tolerance = 1e-04);
89  static void reconstruct(t3_type& data_, const u1_type& u1_, const u2_type& u2_, const u3_type& u3_, const lambda_type& lambdas_);
90 
91  //ktensor = kruskal tensor, i.e., lambda, U1, U2, U3
92  static double norm_ktensor(const u1_type& u1_, const u2_type& u2_, const u3_type& u3_, const lambda_type& lambdas_);
93 
94  // init functors
95 
96  struct init_hosvd {
97 
98  inline void operator()(const t3_type& data_, u2_type& u2_, u3_type & u3_) {
101  }
102  };
103 
104  struct init_random {
105 
106  inline void operator()(const t3_type&, u2_type& u2_, u3_type & u3_) {
107  srand(time(NULL));
108  u2_.set_random();
109  u3_.set_random();
110  }
111  };
112 
113  //FIXME: check test on linux
114 #if 1
115 
116  struct init_dct {
117 
118  inline void operator()(const t3_type&, u2_type& u2_, u3_type & u3_) {
119  u2_.set_dct();
120  u3_.set_dct();
121  }
122  };
123 #endif
124 
125 
126  protected:
127 
128  static void optimize_mode1(const t3_type& data_, u1_type& u1, const u2_type& u2_, const u3_type& u3_, lambda_type& lambdas_);
129  static void optimize_mode2(const t3_type& data_, const u1_type& u1_, u2_type& u2_, const u3_type& u3_, lambda_type& lambdas_);
130  static void optimize_mode3(const t3_type& data_, const u1_type& u1_, const u2_type& u2_, u3_type& u3_, lambda_type& lambdas_);
131 
132  template< size_t J, size_t K, size_t L >
133  static void optimize(const matrix< J, K*L, T >& unfolding_,
134  matrix< J, R, T >& uj_,
135  const matrix< K, R, T >& uk_, const matrix< L, R, T >& ul_,
136  vector< R, T>& lambdas_
137  );
138 
139  static void sort_dec(u1_type& u1_, u2_type& u2_, u3_type& u3_, lambda_type& lambdas_);
140 
141  // comparison functor
142 
143  struct lambda_compare {
144 
145  inline bool operator()(const lambda_pair_type& a, const lambda_pair_type & b) {
146  return fabs(a.first) > fabs(b.first);
147  }
148  };
149 
150  };


#define VMML_TEMPLATE_STRING template< size_t R, size_t I1, size_t I2, size_t I3, typename T >
#define VMML_TEMPLATE_CLASSNAME t3_hopm< R, I1, I2, I3, T >

157  VMML_TEMPLATE_STRING
158  template< typename T_init>
160  VMML_TEMPLATE_CLASSNAME::als(const t3_type& data_,
161  u1_type& u1_, u2_type& u2_, u3_type& u3_,
162  lambda_type& lambdas_,
163  T_init init,
164  const size_t max_iterations_, const float tolerance_) {
165 
166  tensor_stats result;
167  t3_type* approximated_data = new t3_type;
168  t3_type* residual_data = new t3_type;
169  residual_data->zero();
170 
171  T max_f_norm = 0.0;
172  T fit = 0.;
173  T fitchange, norm2, innerprod, fitold, normresidual;
174  if (tolerance_ > 0) {
175  max_f_norm = data_.frobenius_norm();
176  fit = 0;
177  if (max_f_norm == 0)
178  fit = 1;
179  fitchange = 1;
180  norm2 = innerprod = 0;
181  fitold = fit;
182  normresidual = 0;
183  }
184 
185  //intialize u1-u3
186  //inital guess not needed for u1 since it will be computed in the first optimization step
187  init(data_, u2_, u3_);
188 
189  assert(validator::is_valid(u2_) && validator::is_valid(u3_));
190  assert(validator::is_valid(lambdas_));
191 
192 #if CP_LOG
193  std::ostringstream convert;
194  convert << R;
195  std::cout << convert.str() + "-R rank CP ALS: HOPM (for tensor3) " << std::endl;
196 #endif
197 
198  size_t i = 0;
199  while (i < max_iterations_ && (tolerance_ < 0 || fitchange >= tolerance_)) //do until converges
200  {
201  fitold = fit;
202 
203  // timer myTimer;
204  // myTimer.start();
205 
206  optimize_mode1(data_, u1_, u2_, u3_, lambdas_);
207  //#if CP_LOG
208  // std::cerr << myTimer.get_seconds() << " ";
209  // myTimer.start();
210  //#endif
211  optimize_mode2(data_, u1_, u2_, u3_, lambdas_);
212 #if CP_LOG
213  // std::cerr << myTimer.get_seconds() << " ";
214  // myTimer.start();
215 #endif
216  optimize_mode3(data_, u1_, u2_, u3_, lambdas_);
217  //#if CP_LOG
218  // std::cerr << myTimer.get_seconds() << " ";
219  //#endif
220 
221  if (tolerance_ > 0) {
222  norm2 = norm_ktensor(u1_, u2_, u3_, lambdas_);
223 
224  T val2 = 0;
225  for( size_t j = 0; j < lambdas_.size(); ++j)
226  {
227  matrix<I2, I3, T> res1;
228  t3_ttv::multiply_first_mode(data_, u1_.get_column(j), res1);
229  vector<I2, T> res2 = res1 * u3_.get_column(j);
230  val2 += lambdas_.at(j) * (res2.dot(u2_.get_column(j)));
231  }
232  innerprod = 2 * val2;
233  // ||X-P|| = sqrt( ||X||^2 + ||P||^2 - 2 * X.P );
234  normresidual = sqrt(max_f_norm * max_f_norm + norm2 * norm2 - innerprod);
235  fit = 1 - (normresidual / max_f_norm);
236  fitchange = fabs(fitold - fit);
237 #if CP_LOG
238  // std::cerr << myTimer.get_seconds() << " ";
239  std::cout << "iteration '" << i
240  << "', fit: " << fit
241  << ", fitdelta: " << fit - fitold
242  << ", normresidual: " << normresidual;
243  if (fit - fitold < 0) std::cout << " *fit is worsening*";
244  std::cout << std::endl;
245 #endif
246  }
247 #if 0
248  myTimer.start();
249 
250  //Reconstruct tensor and measure norm of approximation
251  //slower version since cp reconstruction is slow
252  reconstruct(*approximated_data, u1_, u2_, u3_, lambdas_);
253  // approx_norm = approximated_data->frobenius_norm();
254  *residual_data = data_ - *approximated_data;
255  normresidual = residual_data->frobenius_norm();
256  std::cerr << myTimer.get_seconds() << " ";
257 #endif
258 
259  ++i;
260  } // end ALS
261  result.set_n_iterations(i);
262 
263  //sort lambdas by decreasing magnitude
264  sort_dec(u1_, u2_, u3_, lambdas_);
265 
266  delete residual_data;
267  delete approximated_data;
268  return result;
269  }
270 
271  VMML_TEMPLATE_STRING
272  void
273  VMML_TEMPLATE_CLASSNAME::optimize_mode1(const t3_type& data_, u1_type& u1_, const u2_type& u2_, const u3_type& u3_, lambda_type& lambdas_) {
274  u1_unfolded_type* unfolding = new u1_unfolded_type; // -> u1
275  //data_.horizontal_unfolding_bwd( *unfolding ); //lathauwer
276  data_.frontal_unfolding_fwd(*unfolding);
277 
278  assert(validator::is_valid(u2_) && validator::is_valid(u3_));
279 
280  optimize(*unfolding, u1_, u2_, u3_, lambdas_);
281 
282  delete unfolding;
283  }
284 
285  VMML_TEMPLATE_STRING
286  void
287  VMML_TEMPLATE_CLASSNAME::optimize_mode2(const t3_type& data_, const u1_type& u1_, u2_type& u2_, const u3_type& u3_, lambda_type& lambdas_) {
288  u2_unfolded_type* unfolding = new u2_unfolded_type; // -> u2
289  data_.frontal_unfolding_bwd(*unfolding); //lathauwer
290  //data_.horizontal_unfolding_fwd( *unfolding );
291 
292  assert(validator::is_valid(u1_) && validator::is_valid(u3_));
293 
294  optimize(*unfolding, u2_, u1_, u3_, lambdas_);
295 
296  delete unfolding;
297  }
298 
299  VMML_TEMPLATE_STRING
300  void
301  VMML_TEMPLATE_CLASSNAME::optimize_mode3(const t3_type& data_, const u1_type& u1_, const u2_type& u2_, u3_type& u3_, lambda_type& lambdas_) {
302  u3_unfolded_type* unfolding = new u3_unfolded_type; //-> u3
303  //data_.horizontal_unfolding_bwd( *unfolding );//lathauwer
304  data_.lateral_unfolding_fwd(*unfolding);
305 
306  assert(validator::is_valid(u1_) && validator::is_valid(u2_));
307 
308  optimize(*unfolding, u3_, u1_, u2_, lambdas_);
309 
310  delete unfolding;
311  }
312 
313  VMML_TEMPLATE_STRING
314  template< size_t J, size_t K, size_t L >
315  void
316  VMML_TEMPLATE_CLASSNAME::optimize(
317  const matrix< J, K*L, T >& unfolding_,
318  matrix< J, R, T >& uj_,
319  const matrix< K, R, T >& uk_, const matrix< L, R, T >& ul_,
320  vector< R, T>& lambdas_
321  ) {
322 
323  typedef matrix< K*L, R, T > krp_matrix_type;
324  krp_matrix_type* krp_prod = new krp_matrix_type;
325  assert(validator::is_valid(uk_) && validator::is_valid(ul_));
326 
327  ul_.khatri_rao_product(uk_, *krp_prod);
328 
329  matrix< J, R, T >* u_new = new matrix< J, R, T >;
330 
331  blas_dgemm< J, K*L, R, T> blas_dgemm1;
332  blas_dgemm1.compute(unfolding_, *krp_prod, *u_new);
333 
334  //square matrix of U_l and U_k
335  m_r2_type* uk_r = new m_r2_type;
336  m_r2_type* ul_r = new m_r2_type;
337 
338  blas_dgemm< R, K, R, T> blas_dgemm2;
339  blas_dgemm2.compute_t(uk_, *uk_r);
340  assert(validator::is_valid(*uk_r));
341 
342  blas_dgemm< R, L, R, T> blas_dgemm3;
343  blas_dgemm3.compute_t(ul_, *ul_r);
344  assert(validator::is_valid(*ul_r));
345 
346  uk_r->multiply_piecewise(*ul_r);
347  assert(validator::is_valid(*uk_r));
348 
349  m_r2_type* pinv_t = new m_r2_type;
350  compute_pseudoinverse< m_r2_type > compute_pinv;
351 
352  compute_pinv(*uk_r, *pinv_t);
353 
354  blas_dgemm< J, R, R, T> blas_dgemm4;
355  blas_dgemm4.compute_bt(*u_new, *pinv_t, uj_);
356  assert(validator::is_valid(uj_));
357 
358  *u_new = uj_;
359  u_new->multiply_piecewise(*u_new); //2 norm
360  u_new->columnwise_sum(lambdas_);
361 
362  assert(validator::is_valid(lambdas_));
363 
364  lambdas_.sqrt_elementwise();
365  lambda_type* tmp = new lambda_type;
366  *tmp = lambdas_;
367  tmp->reciprocal_safe();
368 
369  assert(validator::is_valid(*tmp));
370 
371  m_r2_type* diag_lambdas = new m_r2_type;
372  diag_lambdas->diag(*tmp);
373 
374  matrix< J, R, T >* tmp_uj = new matrix< J, R, T > (uj_);
375  blas_dgemm4.compute(*tmp_uj, *diag_lambdas, uj_);
376 
377  assert(validator::is_valid(uj_));
378 
379  delete krp_prod;
380  delete uk_r;
381  delete ul_r;
382  delete pinv_t;
383  delete u_new;
384  delete diag_lambdas;
385  delete tmp;
386  delete tmp_uj;
387 
388  }
389 
390  VMML_TEMPLATE_STRING
391  void
392  VMML_TEMPLATE_CLASSNAME::reconstruct(t3_type& data_, const u1_type& u1_, const u2_type& u2_, const u3_type& u3_, const lambda_type& lambdas_) {
393  u1_inv_type* u1_t = new u1_inv_type;
394  u2_inv_type* u2_t = new u2_inv_type;
395  u3_inv_type* u3_t = new u3_inv_type;
396  typedef matrix< R, I2 * I3, T > m_temp_type;
397  m_temp_type* temp = new m_temp_type;
398 
399  u1_.transpose_to(*u1_t);
400  u2_.transpose_to(*u2_t);
401  u3_.transpose_to(*u3_t);
402 
403  data_.reconstruct_CP(lambdas_, *u1_t, *u2_t, *u3_t, *temp);
404 
405  delete temp;
406  delete u1_t;
407  delete u2_t;
408  delete u3_t;
409  }
410 
411  VMML_TEMPLATE_STRING
412  double
413  VMML_TEMPLATE_CLASSNAME::norm_ktensor(const u1_type& u1_, const u2_type& u2_, const u3_type& u3_, const lambda_type& lambdas_) {
414  m_r2_type* coeff2_matrix = new m_r2_type;
415  m_r2_type* cov_u1 = new m_r2_type;
416  m_r2_type* cov_u2 = new m_r2_type;
417  m_r2_type* cov_u3 = new m_r2_type;
418 
419  blas_dgemm< R, 1, R, T >* blas_l2 = new blas_dgemm< R, 1, R, T>;
420  blas_l2->compute_vv_outer(lambdas_, lambdas_, *coeff2_matrix);
421  delete blas_l2;
422 
423  blas_dgemm< R, I1, R, T >* blas_u1cov = new blas_dgemm< R, I1, R, T>;
424  blas_u1cov->compute_t(u1_, *cov_u1);
425  delete blas_u1cov;
426 
427  blas_dgemm< R, I2, R, T >* blas_u2cov = new blas_dgemm< R, I2, R, T>;
428  blas_u2cov->compute_t(u2_, *cov_u2);
429  delete blas_u2cov;
430 
431  blas_dgemm< R, I3, R, T >* blas_u3cov = new blas_dgemm< R, I3, R, T>;
432  blas_u3cov->compute_t(u3_, *cov_u3);
433  delete blas_u3cov;
434 
435  coeff2_matrix->multiply_piecewise(*cov_u1);
436  coeff2_matrix->multiply_piecewise(*cov_u2);
437  coeff2_matrix->multiply_piecewise(*cov_u3);
438 
439  double nrm = coeff2_matrix->sum_elements();
440 
441  delete coeff2_matrix;
442  delete cov_u1;
443  delete cov_u2;
444  delete cov_u3;
445 
446  return sqrt(nrm);
447  }
448 
449  VMML_TEMPLATE_STRING
450  void
451  VMML_TEMPLATE_CLASSNAME::sort_dec(u1_type& u1_, u2_type& u2_, u3_type& u3_, lambda_type& lambdas_) {
452  //keep copy of original matrices
453  u1_type *orig_u1 = new u1_type(u1_);
454  u2_type *orig_u2 = new u2_type(u2_);
455  u3_type *orig_u3 = new u3_type(u3_);
456  lambda_type sorted_lvalues;
457 
458  //(1) store permutations of the lambdas (According to larges magnitude
459  std::vector< lambda_pair_type > lambda_permut;
460 
461  lvalue_const_iterator it = lambdas_.begin(), it_end = lambdas_.end();
462  size_t counter = 0;
463  for (; it != it_end; ++it, ++counter) {
464  lambda_permut.push_back(lambda_pair_type(*it, counter));
465  }
466 
467  std::sort(
468  lambda_permut.begin(),
469  lambda_permut.end(),
470  lambda_compare()
471  );
472 
473  //(2) sort the matrix vectors according to lambda permutations and set sorted lambdas
474  typename std::vector< lambda_pair_type >::const_iterator it2 = lambda_permut.begin(), it2_end = lambda_permut.end();
475  lvalue_iterator lvalues_it = lambdas_.begin();
476  for (counter = 0; it2 != it2_end; ++it2, ++counter, ++lvalues_it) {
477  *lvalues_it = it2->first;
478  u1_.set_column(counter, orig_u1->get_column(it2->second));
479  u2_.set_column(counter, orig_u2->get_column(it2->second));
480  u3_.set_column(counter, orig_u3->get_column(it2->second));
481  }
482 
483  delete orig_u1;
484  delete orig_u2;
485  delete orig_u3;
486  }




#undef VMML_TEMPLATE_STRING
#undef VMML_TEMPLATE_CLASSNAME

} //end vmml namespace

#endif