d8/dc0/bppnmf_8hpp_source.html

 /* Copyright 2016 Ramakrishnan Kannan */

 #ifndef NMF_BPPNMF_HPP_
 #define NMF_BPPNMF_HPP_

 #include <omp.h>
 #include "common/nmf.hpp"
 #include "nnls/bppnnls.hpp"

 // needed for precondition with hals
 #ifdef BUILD_SPARSE
 #include "hals.hpp"
 #endif

 // Number of right-hand-side columns grouped into one NNLS subproblem by
 // BPPNMF::updateOtherGivenOneMultipleRHS. The number of parallel loop
 // iterations there is (n_cols / ONE_THREAD_MATRIX_SIZE) + 1.
 #define ONE_THREAD_MATRIX_SIZE 2000

 namespace planc {

 /*
  * NMF driver that alternates non-negative least squares solves for the two
  * low rank factors, using BPPNNLS as the subproblem solver.
  *
  * As used below, this->H is indexed with one row per column of A
  * (this->n rows) and this->W with one row per row of A (this->m rows).
  *
  * T is the type of the input matrix (for example a dense or sparse
  * Armadillo matrix).
  */
 template <class T>
 class BPPNMF : public NMF<T> {
  private:
   // Transpose of the input matrix, computed once in the constructors.
   T At;
   // Gram matrix (given^T * given) of the factor currently held fixed.
   // Rebuilt on every call of updateOtherGivenOneMultipleRHS.
   MAT giventGiven;

   /*
    * Solves the NNLS problem for one factor while the other is fixed.
    * Designed as if W is given and H is found; the transpose is the other
    * problem.
    *
    * The columns of given^T * input are split into chunks of
    * ONE_THREAD_MATRIX_SIZE columns. Each chunk is solved independently
    * inside an OpenMP parallel loop, and the transposed solution is stored
    * in the rows of *othermat that carry the same indices as the chunk's
    * columns.
    *
    * input    - matrix to fit (A when solving for H, At when solving for W).
    * given    - factor that is held fixed.
    * worh     - 'W' or 'H'; only used to label log output.
    * othermat - factor being solved for; rows 0..input.n_cols-1 are
    *            overwritten.
    */
   void updateOtherGivenOneMultipleRHS(const T &input, const MAT &given,
                                       char worh, MAT *othermat) {
     double t2;
     // Number of column chunks, i.e. iterations of the parallel loop below.
     UINT numThreads = (input.n_cols / ONE_THREAD_MATRIX_SIZE) + 1;
     tic();
     MAT giventInput(this->k, input.n_cols);
     // This is WtW
     giventGiven = given.t() * given;
     // This is WtA
     giventInput = given.t() * input;
     t2 = toc();
     INFO << "starting " << worh << ". Prereq for " << worh << " took=" << t2
          << " NumThreads=" << numThreads << PRINTMATINFO(giventGiven)
          << PRINTMATINFO(giventInput) << std::endl;
     tic();
 #pragma omp parallel for schedule(dynamic)
     for (UINT i = 0; i < numThreads; i++) {
       UINT spanStart = i * ONE_THREAD_MATRIX_SIZE;
       // No columns left for this chunk. This happens for the last chunk
       // when n_cols is exactly divisible by the chunk size, and for the
       // only chunk when the input has no columns at all. Testing the start
       // index avoids the unsigned wrap-around of "n_cols - 1" at n_cols == 0.
       if (spanStart >= input.n_cols) {
         continue;
       }
       UINT spanEnd = spanStart + ONE_THREAD_MATRIX_SIZE - 1;
       if (spanEnd >= input.n_cols) {
         spanEnd = input.n_cols - 1;
       }
       // A chunk holding a single column goes through the vector interface
       // of BPPNNLS; everything else uses the matrix interface.
       const bool singleColumn = (spanStart == spanEnd);
       BPPNNLS<MAT, VEC> *subProblem;
       if (singleColumn) {
         subProblem = new BPPNNLS<MAT, VEC>(
             giventGiven, (VEC)giventInput.col(spanStart), true);
       } else {
         subProblem = new BPPNNLS<MAT, VEC>(
             giventGiven, (MAT)giventInput.cols(spanStart, spanEnd), true);
       }
 #ifdef _VERBOSE
       INFO << "Scheduling " << worh << " start=" << spanStart
            << ", end=" << spanEnd << ", tid=" << omp_get_thread_num()
            << std::endl;
 #endif
       const int numIter = subProblem->solveNNLS();
 #ifdef _VERBOSE
       // NOTE(review): t2 still holds the prerequisite time measured above;
       // per-chunk timing is not taken inside the parallel region.
       INFO << "completed " << worh << " start=" << spanStart
            << ", end=" << spanEnd << ", tid=" << omp_get_thread_num()
            << " cpu=" << sched_getcpu() << " time taken=" << t2
            << " num_iterations()=" << numIter << std::endl;
 #else
       (void)numIter;  // only reported in verbose builds
 #endif
       if (singleColumn) {
         // The solution belongs to column spanStart of the input, so it is
         // stored in row spanStart (not in the row of the chunk index i).
         ROWVEC solVec = subProblem->getSolutionVector().t();
         (*othermat).row(spanStart) = solVec;
       } else {
         (*othermat).rows(spanStart, spanEnd) =
             subProblem->getSolutionMatrix().t();
       }
       subProblem->clear();
       delete subProblem;
     }
     double totalH2 = toc();
     INFO << worh << " total time taken :" << totalH2 << std::endl;
     giventGiven.clear();
     giventInput.clear();
   }

  public:
   /*
    * Builds the solver for input A and target rank lowrank; the factors are
    * set up by the NMF<T> base constructor. The transpose of A is cached.
    */
   BPPNMF(const T &A, int lowrank) : NMF<T>(A, lowrank) {
     giventGiven = arma::zeros<MAT>(lowrank, lowrank);
     this->At = A.t();
   }

   /*
    * Builds the solver for input A with caller supplied factors llf and rlf,
    * which are forwarded to the NMF<T> base constructor. The transpose of A
    * is cached.
    */
   BPPNMF(const T &A, const MAT &llf, const MAT &rlf) : NMF<T>(A, llf, rlf) {
     this->At = A.t();
   }

   /*
    * Alternating NNLS where every row of H and every row of W is solved as
    * its own single right-hand-side BPPNNLS problem. Iterates until
    * num_iterations() sweeps are done or the objective error is no longer
    * above CONV_ERR.
    */
   void computeNMFSingleRHS() {
     unsigned int currentIteration = 0;
     this->computeObjectiveError();
     while (currentIteration < this->num_iterations() &&
            this->objective_err > CONV_ERR) {
 #ifdef COLLECTSTATS
       this->collectStats(currentIteration);
 #endif
       // solve for H given W;
       MAT Wt = this->W.t();
       MAT WtW = Wt * this->W;
       MAT WtA = Wt * this->A;
       Wt.clear();
       {
         // NOTE(review): tic()/toc() are called from inside the parallel
         // loop; whether they are safe to call concurrently is not visible
         // from this file.
 #pragma omp parallel for
         for (UINT i = 0; i < this->n; i++) {
           // Automatic storage: the solver is released at the end of every
           // loop iteration.
           BPPNNLS<MAT, VEC> subProblemforH(WtW, (VEC)WtA.col(i), true);
 #ifdef _VERBOSE
           INFO << "Initialized subproblem and calling solveNNLS for "
                << "H(" << i << "/" << this->n << ")";
 #endif
           tic();
           int numIter = subProblemforH.solveNNLS();
           double t2 = toc();
 #ifdef _VERBOSE
           INFO << subProblemforH.getSolutionVector();
 #endif
           this->H.row(i) = subProblemforH.getSolutionVector().t();
           INFO << "Comp H(" << i << "/" << this->n
                << ") of it=" << currentIteration << " time taken=" << t2
                << " num_iterations()=" << numIter << std::endl;
         }
       }
 #ifdef _VERBOSE
       INFO << "H: at it = " << currentIteration << std::endl << this->H;
 #endif
       {
         // clear previous allocations.
         WtW.clear();
         WtA.clear();
         MAT Ht = this->H.t();
         MAT HtH = Ht * this->H;
         // Uses the transpose cached by the constructors.
         MAT HtAt = Ht * this->At;
         Ht.clear();
         // solve for W given H;
 #pragma omp parallel for
         for (UINT i = 0; i < this->m; i++) {
           BPPNNLS<MAT, VEC> subProblemforW(HtH, (VEC)HtAt.col(i), true);
 #ifdef _VERBOSE
           INFO << "Initialized subproblem and calling solveNNLS for "
                << "W(" << i << "/" << this->m << ")";
 #endif
           tic();
           int numIter = subProblemforW.solveNNLS();
           double t2 = toc();
 #ifdef _VERBOSE
           INFO << subProblemforW.getSolutionVector();
 #endif

           this->W.row(i) = subProblemforW.getSolutionVector().t();
           INFO << "Comp W(" << i << "/" << this->m
                << ") of it=" << currentIteration << " time taken=" << t2
                << " num_iterations()=" << numIter << std::endl;
         }
         HtH.clear();
         HtAt.clear();
       }
 #ifdef _VERBOSE
       INFO << "W: at it = " << currentIteration << std::endl << this->W;
 #endif
       // Refresh the objective so that the convergence test of the loop
       // sees the factors computed in this sweep.
       this->computeObjectiveError();
       currentIteration++;
     }
   }

   /*
    * Main entry point: runs num_iterations() sweeps. Each sweep updates W
    * with H fixed and then H with W fixed through
    * updateOtherGivenOneMultipleRHS, recomputes the objective error and logs
    * it relative to normA. After the last sweep normalize_by_W() is called.
    */
   void computeNMF() {
     unsigned int currentIteration = 0;
 #ifdef BUILD_SPARSE
     // run hals once to get proper initializations
     // NOTE(review): no compute method is invoked on tempHals before its
     // factors are read back, so W and H may come back unchanged - confirm
     // whether a call such as tempHals.computeNMF() is missing here.
     HALSNMF<T> tempHals(this->A, this->W, this->H);
     tempHals.num_iterations(2);
     this->W = tempHals.getLeftLowRankFactor();
     this->H = tempHals.getRightLowRankFactor();
 #endif
     INFO << PRINTMATINFO(this->At);
 #ifdef BUILD_SPARSE
     INFO << " nnz = " << this->At.n_nonzero << std::endl;
 #endif
     INFO << "Starting BPP for num_iterations()=" << this->num_iterations()
          << std::endl;
     while (currentIteration < this->num_iterations()) {
 #ifdef COLLECTSTATS
       this->collectStats(currentIteration);
       this->stats(currentIteration + 1, 0) = currentIteration + 1;
 #endif
       tic();
       updateOtherGivenOneMultipleRHS(this->At, this->H, 'W', &(this->W));
       double totalW2 = toc();
       tic();
       updateOtherGivenOneMultipleRHS(this->A, this->W, 'H', &(this->H));
       double totalH2 = toc();

 #ifdef COLLECTSTATS
       // end of H and start of W are almost same.
       this->stats(currentIteration + 1, 1) = totalH2;
       this->stats(currentIteration + 1, 2) = totalW2;

       this->stats(currentIteration + 1, 3) = totalW2 + totalH2;
 #endif
       INFO << "completed it=" << currentIteration
            << " time taken = " << totalW2 + totalH2 << std::endl;
       this->computeObjectiveError();
       INFO << "error:it = " << currentIteration
            << " bpperr =" << sqrt(this->objective_err) / this->normA
            << std::endl;
       currentIteration++;
     }
     this->normalize_by_W();
 #ifdef COLLECTSTATS
     this->collectStats(currentIteration);
     INFO << "NMF Statistics:" << std::endl << this->stats << std::endl;
 #endif
   }

   // Returns the objective error stored by the last computeObjectiveError().
   double getObjectiveError() { return this->objective_err; }

   /*
    * I dont like this function here. But this seems to be the
    * easy place for having it. This function really should have been
    * in BPPNNLS.hpp. It will take some time to refactor this.
    * Given, A and W, solve for H.
    * Returns a copy of the updated H.
    */
   MAT solveScalableNNLS() {
     updateOtherGivenOneMultipleRHS(this->A, this->W, 'H', &(this->H));
     return this->H;
   }

   // Releases the cached transpose.
   ~BPPNMF() { this->At.clear(); }
 };

 }  // namespace planc

 #endif  // NMF_BPPNMF_HPP_
NNLS::getSolutionMatrix
MATTYPE getSolutionMatrix()
Definition: nnls.hpp:79

planc::BPPNMF::BPPNMF
BPPNMF(const T &A, int lowrank)
Definition: bppnmf.hpp:92

tic
void tic()
Start the timer. Easy to use: call tic(); run some code; then double t = toc();
Definition: utils.hpp:42

planc::BPPNMF::getObjectiveError
double getObjectiveError()
Definition: bppnmf.hpp:235

planc::NMF::num_iterations
const unsigned int num_iterations() const
Returns the number of iterations.
Definition: nmf.hpp:350

BPPNNLS
Definition: bppnnls.hpp:22

planc::HALSNMF
Definition: hals.hpp:11

toc
double toc()
Definition: utils.hpp:48

planc::NMF::getRightLowRankFactor
MAT getRightLowRankFactor()
Returns the right low rank factor matrix H.
Definition: nmf.hpp:169

planc::BPPNMF::computeNMF
void computeNMF()
Definition: bppnmf.hpp:181

planc::BPPNMF
Definition: bppnmf.hpp:20

planc::NMF::num_iterations
void num_iterations(const int it)
Sets number of iterations for the NMF algorithms.
Definition: nmf.hpp:340

planc::BPPNMF::computeNMFSingleRHS
void computeNMFSingleRHS()
Definition: bppnmf.hpp:99

INFO
#define INFO
Definition: utils.h:36

BPPNNLS::solveNNLS
int solveNNLS()
Definition: bppnnls.hpp:30

NNLS::getSolutionVector
VECTYPE getSolutionVector()
Definition: nnls.hpp:76

hals.hpp

UINT
unsigned int UINT
Definition: utils.h:68

MAT
#define MAT
Definition: utils.h:52

planc::BPPNMF::solveScalableNNLS
MAT solveScalableNNLS()
Definition: bppnmf.hpp:243

NNLS::clear
void clear()
Definition: nnls.hpp:82

ONE_THREAD_MATRIX_SIZE
#define ONE_THREAD_MATRIX_SIZE
Definition: bppnmf.hpp:15

planc::NMF::getLeftLowRankFactor
MAT getLeftLowRankFactor()
Returns the left low rank factor matrix W.
Definition: nmf.hpp:167

CONV_ERR
#define CONV_ERR
Definition: nmf.hpp:13

planc::BPPNMF::~BPPNMF
~BPPNMF()
Definition: bppnmf.hpp:247

ROWVEC
#define ROWVEC
Definition: utils.h:54

planc
ncp_factors contains the factors of the NCP. Every i-th factor is of size n_i * k; the number of factors is ...
Definition: ncpfactors.hpp:20

VEC
#define VEC
Definition: utils.h:61

PRINTMATINFO
#define PRINTMATINFO(A)
Definition: utils.h:63

planc::NMF::computeObjectiveError
void computeObjectiveError()
Definition: nmf.hpp:238

bppnnls.hpp

planc::NMF
Definition: nmf.hpp:24

nmf.hpp

planc::BPPNMF::BPPNMF
BPPNMF(const T &A, const MAT &llf, const MAT &rlf)
Definition: bppnmf.hpp:96