d7/dc1/distntfanlsbpp_8hpp_source.html

 /* Copyright Ramakrishnan Kannan 2018 */

 #ifndef DISTNTF_DISTNTFANLSBPP_HPP_
 #define DISTNTF_DISTNTFANLSBPP_HPP_

 #include "distntf/distauntf.hpp"
 #include "nnls/bppnnls.hpp"

 namespace planc {

 // Maximum number of columns handed to a single NNLS sub-problem; update()
 // splits the columns of the local MTTKRP matrix into spans of this width.
 #define ONE_THREAD_MATRIX_SIZE 2000

 /**
  * DistAUNTF specialisation whose per-mode factor update is computed with the
  * BPPNNLS solver, one sub-problem per span of ONE_THREAD_MATRIX_SIZE columns.
  */
 class DistNTFANLSBPP : public DistAUNTF {
  protected:
   /**
    * Computes the updated (transposed) local factor for one mode.
    *
    * The columns of ncp_local_mttkrp_t[mode] are split into consecutive spans
    * of at most ONE_THREAD_MATRIX_SIZE columns. Each span is solved as an
    * independent BPPNNLS problem against global_gram inside an OpenMP
    * parallel loop, and the solution is written to the same column span of
    * the result.
    *
    * @param mode index of the factor being updated.
    * @return a copy of m_local_ncp_factors_t.factor(mode) whose columns have
    *         been overwritten with the NNLS solutions; all zeros when
    *         m_nls_sizes[mode] is 0.
    */
   MAT update(const int mode) {
     MAT othermat(this->m_local_ncp_factors_t.factor(mode));
     if (m_nls_sizes[mode] > 0) {
       const UINT numCols =
           static_cast<UINT>(this->ncp_local_mttkrp_t[mode].n_cols);
       // Ceiling division: an exactly divisible column count no longer
       // schedules a trailing empty chunk, and zero columns schedules none.
       const UINT numChunks =
           numCols / ONE_THREAD_MATRIX_SIZE +
           ((numCols % ONE_THREAD_MATRIX_SIZE) != 0 ? 1 : 0);
       #pragma omp parallel for schedule(dynamic)
       for (UINT i = 0; i < numChunks; i++) {
         // Inclusive column range [spanStart, spanEnd] owned by this chunk.
         // numCols >= 1 here, so numCols - 1 cannot wrap around.
         const UINT spanStart = i * ONE_THREAD_MATRIX_SIZE;
         UINT spanEnd = spanStart + ONE_THREAD_MATRIX_SIZE - 1;
         if (spanEnd > numCols - 1) {
           spanEnd = numCols - 1;
         }
         const bool singleColumn = (spanStart == spanEnd);
         // A one-column span uses the vector right-hand-side constructor,
         // anything wider uses the matrix right-hand-side constructor.
         BPPNNLS<MAT, VEC> *subProblem;
         if (singleColumn) {
           subProblem = new BPPNNLS<MAT, VEC>(
               this->global_gram,
               static_cast<VEC>(this->ncp_local_mttkrp_t[mode].col(spanStart)),
               true);
         } else {
           subProblem = new BPPNNLS<MAT, VEC>(
               this->global_gram,
               static_cast<MAT>(
                   this->ncp_local_mttkrp_t[mode].cols(spanStart, spanEnd)),
               true);
         }
         // NOTE(review): the _VERBOSE blocks below use worh, t2 and numIter,
         // none of which is declared in this class body -- confirm they are
         // in scope before building with _VERBOSE defined.
 #ifdef _VERBOSE
         INFO << "Scheduling " << worh << " start=" << spanStart
              << ", end=" << spanEnd << ", tid=" << omp_get_thread_num()
              << std::endl;
 #endif
         // tic();
         subProblem->solveNNLS();
         // t2 = toc();
 #ifdef _VERBOSE
         INFO << "completed " << worh << " start=" << spanStart
              << ", end=" << spanEnd << ", tid=" << omp_get_thread_num()
              << " cpu=" << sched_getcpu() << " time taken=" << t2
              << " num_iterations()=" << numIter << std::endl;
 #endif
         if (singleColumn) {
           // The solved column is spanStart, not the chunk index i; the two
           // only coincide for the very first chunk.
           othermat.col(spanStart) = subProblem->getSolutionVector();
         } else {
           othermat.cols(spanStart, spanEnd) = subProblem->getSolutionMatrix();
         }
         subProblem->clear();
         delete subProblem;
       }
     } else {
       othermat.zeros();
     }
     return othermat;
   }

  public:
   /**
    * Forwards every argument unchanged to the DistAUNTF constructor.
    */
   DistNTFANLSBPP(const Tensor &i_tensor, const int i_k, algotype i_algo,
                  const UVEC &i_global_dims, const UVEC &i_local_dims,
                  const UVEC &i_nls_sizes, const UVEC &i_nls_idxs,
                  const NTFMPICommunicator &i_mpicomm)
       : DistAUNTF(i_tensor, i_k, i_algo, i_global_dims, i_local_dims,
                   i_nls_sizes, i_nls_idxs, i_mpicomm) {}
 };  // class DistNTFANLSBPP

 }  // namespace planc

 #endif  // DISTNTF_DISTNTFANLSBPP_HPP_
NNLS::getSolutionMatrix
MATTYPE getSolutionMatrix()
Definition: nnls.hpp:79

planc::Tensor
Data is stored such that the unfolding $Y_0$ is column major.
Definition: tensor.hpp:32

ONE_THREAD_MATRIX_SIZE
#define ONE_THREAD_MATRIX_SIZE
Definition: distntfanlsbpp.hpp:11

planc::DistAUNTF
Definition: distauntf.hpp:32

BPPNNLS
Definition: bppnnls.hpp:22

algotype
algotype
Definition: utils.h:10

UVEC
#define UVEC
Definition: utils.h:58

distauntf.hpp

planc::NTFMPICommunicator
Definition: distntfmpicomm.hpp:12

INFO
#define INFO
Definition: utils.h:36

BPPNNLS::solveNNLS
int solveNNLS()
Definition: bppnnls.hpp:30

planc::DistNTFANLSBPP
Definition: distntfanlsbpp.hpp:13

planc::DistNTFANLSBPP::DistNTFANLSBPP
DistNTFANLSBPP(const Tensor &i_tensor, const int i_k, algotype i_algo, const UVEC &i_global_dims, const UVEC &i_local_dims, const UVEC &i_nls_sizes, const UVEC &i_nls_idxs, const NTFMPICommunicator &i_mpicomm)
Definition: distntfanlsbpp.hpp:78

NNLS::getSolutionVector
VECTYPE getSolutionVector()
Definition: nnls.hpp:76

UINT
unsigned int UINT
Definition: utils.h:68

MAT
#define MAT
Definition: utils.h:52

NNLS::clear
void clear()
Definition: nnls.hpp:82

planc
ncp_factors contains the factors of the NCP; every i-th factor is of size n_i * k; the number of factors is ...
Definition: ncpfactors.hpp:20

VEC
#define VEC
Definition: utils.h:61

bppnnls.hpp