df/d93/utils_8hpp_source.html

 /* Copyright 2016 Ramakrishnan Kannan */
 // utility functions
 #ifndef COMMON_UTILS_HPP_
 #define COMMON_UTILS_HPP_
 #include <assert.h>
 #include <omp.h>
 #include <stdio.h>
 #include <chrono>
 #include <cmath>
 #include <ctime>
 #include <stack>
 #include <typeinfo>
 #include <vector>
 #include "common/utils.h"
 #ifdef MKL_FOUND
 #include <mkl.h>
 #else
 #include <cblas.h>
 #endif

 // Lookup table of powers of ten: powersof10[i] holds 10^i for i = 0..15.
 static ULONG powersof10[16] = {
     // 10^0 .. 10^3
     1, 10, 100, 1000,
     // 10^4 .. 10^7
     10000, 100000, 1000000, 10000000,
     // 10^8 .. 10^11
     100000000, 1000000000, 10000000000, 100000000000,
     // 10^12 .. 10^15
     1000000000000, 10000000000000, 100000000000000, 1000000000000000};

 // Start times recorded by tic() and consumed by toc(). The most recent
 // tic() sits on top, so tic()/toc() pairs can be nested.
 static std::stack<std::chrono::steady_clock::time_point> tictoc_stack;
 // Not used by tic()/toc() below.
 static std::stack<double> tictoc_stack_omp_clock;

 /**
  * Starts a timer by pushing the current steady_clock time on tictoc_stack.
  * Typical use: tic(); ...work...; double seconds = toc();
  */
 inline void tic() { tictoc_stack.push(std::chrono::steady_clock::now()); }

 /**
  * Stops the timer started by the most recent unmatched tic() and removes it
  * from the stack.
  * @return elapsed time in seconds, or 0.0 when no tic() is pending (reading
  *         the top of an empty stack would be undefined behaviour).
  */
 inline double toc() {
   if (tictoc_stack.empty()) return 0.0;
   const std::chrono::duration<double> elapsed =
       std::chrono::steady_clock::now() - tictoc_stack.top();
   tictoc_stack.pop();
   return elapsed.count();
 }

 /**
  * Clamps the elements of *X from below: every element smaller than prec is
  * replaced by prec; all other elements keep their value.
  * @param X    container exposing for_each() and elem_type; modified in place.
  * @param prec lower bound applied to each element.
  */
 template <class T>
 void fixNumericalError(T *X, const double prec = EPSILON_1EMINUS16) {
   typedef typename T::elem_type elem_t;
   auto clampBelow = [prec](elem_t &entry) {
     entry = (entry < prec) ? prec : entry;
   };
   X->for_each(clampBelow);
 }

 /**
  * Truncates (towards negative infinity) every element of *X to a fixed
  * number of decimal places: val = floor(val * 10^places) / 10^places.
  * @param X      container exposing for_each() and elem_type; modified in
  *               place.
  * @param places number of decimal places to keep; must index powersof10,
  *               i.e. lie in [0, 15].
  */
 template <class T>
 void fixDecimalPlaces(T *X, const int places = NUMBEROF_DECIMAL_PLACES) {
   typedef typename T::elem_type elem_t;
   const unsigned tableSize = sizeof(powersof10) / sizeof(powersof10[0]);
   // An out-of-range index would read past the end of powersof10.
   assert(places >= 0 && static_cast<unsigned>(places) < tableSize);
   (void)tableSize;  // only read by the assert; silences NDEBUG warnings
   const elem_t scale = static_cast<elem_t>(powersof10[places]);
   // std::floor picks the overload matching the element type. The previous
   // floorf() rounded double-precision data through single precision.
   X->for_each(
       [scale](elem_t &val) { val = std::floor(val * scale) / scale; });
 }

 /*
  * Returns the nth prime number, counting from zero: random_sieve(0) == 2,
  * random_sieve(1) == 3, random_sieve(2) == 5, ...
  *
  * Primes are looked up with a sieve of Eratosthenes over [2, 104000), a
  * range that holds fewer than 10000 primes.
  *
  * @param nthprime zero-based index of the requested prime.
  * @return the prime, or -1 when nthprime is negative or lies beyond the
  *         primes below 104000.
  */
 inline int random_sieve(const int nthprime) {
   constexpr int kLimit = 104000;
   if (nthprime < 0) return -1;

   // composite[i] != 0 once i is known to have a smaller prime factor.
   std::vector<char> composite(kLimit, 0);
   for (int p = 2; p * p < kLimit; ++p) {
     if (composite[p]) continue;
     // Smaller multiples of p were already struck by smaller primes.
     for (int q = p * p; q < kLimit; q += p) composite[q] = 1;
   }

   // Walk the survivors in increasing order until the requested index.
   int seen = 0;
   for (int candidate = 2; candidate < kLimit; ++candidate) {
     if (composite[candidate]) continue;
     if (seen == nthprime) return candidate;
     ++seen;
   }
   return -1;
 }

 template <class T>
 void absmat(T *X) {
   UVEC negativeIdx = find((*X) < 0);
   (*X)(negativeIdx) = (*X)(negativeIdx) * -1;
 }

 /**
  * Randomly zeroes entries of *X in place. Each entry is set to 0 whenever a
  * fresh arma::randu() draw exceeds sparsity, so sparsity acts as the
  * threshold for keeping an entry.
  * @param sparsity threshold compared against each random draw.
  * @param X        matrix exposing n_rows, n_cols and (row, col) access.
  */
 template <class T>
 void makeSparse(const double sparsity, T(*X)) {
   srand(RAND_SEED_SPARSE);
   // Columns are distributed across the OpenMP threads.
 #pragma omp parallel for
   for (int col = 0; col < X->n_cols; col++) {
     for (int row = 0; row < X->n_rows; row++) {
       const bool drop = arma::randu() > sparsity;
       if (drop) {
         (*X)(row, col) = 0;
       }
     }
   }
 }

 /**
  * Fills *A with a random m x n test matrix.
  *
  * With BUILD_SPARSE defined, *A is arma::sprandu<T>(m, n, sparsity) and k is
  * not used. Otherwise *A is ceil(W * H^T), where W (m x k) and H (n x k) are
  * random factors scaled by 10 and, when sparsity < 1, thinned by
  * makeSparse().
  *
  * @param m        number of rows of *A.
  * @param n        number of columns of *A.
  * @param k        inner dimension of the random factors (dense build only).
  * @param sparsity density passed to sprandu, or threshold passed to
  *                 makeSparse().
  * @param A        output matrix; must point to a valid object, which is
  *                 overwritten.
  */
 template <class T>
 void randNMF(const UWORD m, const UWORD n, const UWORD k, const double sparsity,
              T *A) {
   // The result has to be written through the pointer: assigning the address
   // of a local to the parameter (A = &temp) never reaches the caller.
 #ifdef BUILD_SPARSE
   *A = arma::sprandu<T>(m, n, sparsity);
 #else
   srand(RAND_SEED);
   MAT W = 10 * arma::randu<MAT>(m, k);
   MAT H = 10 * arma::randu<MAT>(n, k);
   if (sparsity < 1) {
     makeSparse<MAT>(sparsity, &W);
     makeSparse<MAT>(sparsity, &H);
   }
   *A = ceil(W * trans(H));
 #endif
 }

 /**
  * Writes the elements of x to INFO, each followed by a single space, and
  * finishes the line with std::endl.
  * @param x vector whose elements can be streamed with operator<<.
  */
 template <class T>
 void printVector(const std::vector<T> &x) {
   for (const auto &item : x) {
     INFO << item << ' ';
   }
   INFO << std::endl;
 }

 /**
  * Builds the cartesian product of the given index sets.
  *
  * Every returned tuple holds one element from each inner vector of v, in
  * the order of v. Tuples are ordered with the first set varying fastest:
  * {{1, 2}, {3, 4}} yields {1,3}, {2,3}, {1,4}, {2,4}.
  *
  * @param v list of index sets.
  * @return all combinations; a single empty tuple when v is empty, and no
  *         tuples at all when any inner vector is empty.
  *
  * Declared inline because this header-defined function may be included by
  * several translation units.
  */
 inline std::vector<std::vector<size_t>> cartesian_product(
     const std::vector<std::vector<size_t>> &v) {
   std::vector<std::vector<size_t>> s = {{}};
   for (const auto &u : v) {
     std::vector<std::vector<size_t>> r;
     // Each existing tuple is extended once per element of u.
     r.reserve(s.size() * u.size());
     for (const size_t y : u) {
       for (const auto &x : s) {
         r.push_back(x);
         r.back().push_back(y);
       }
     }
     s.swap(r);
   }
   return s;
 }

 /*
  * can be called by external people for sparse input matrix.
  */
 template <class INPUTTYPE, class LRTYPE>
 double computeObjectiveError(const INPUTTYPE &A, const LRTYPE &W,
                              const LRTYPE &H) {
   // 1. over all nnz (a_ij - w_i h_j)^2
   // 2. over all nnz (w_i h_j)^2
   // 3. Compute R of W ahd L of H through QR
   // 4. use sgemm to compute RL
   // 5. use slange to compute ||RL||_F^2
   // 6. return nnzsse+nnzwh-||RL||_F^2
   UWORD k = W.n_cols;
   UWORD m = A.n_rows;
   UWORD n = A.n_cols;
   tic();
   double nnzsse = 0;
   double nnzwh = 0;
   LRTYPE Rw(k, k);
   LRTYPE Rh(k, k);
   LRTYPE Qw(m, k);
   LRTYPE Qh(n, k);
   LRTYPE RwRh(k, k);
 #pragma omp parallel for reduction(+ : nnzsse, nnzwh)
   for (UWORD jj = 1; jj <= A.n_cols; jj++) {
     UWORD startIdx = A.col_ptrs[jj - 1];
     UWORD endIdx = A.col_ptrs[jj];
     UWORD col = jj - 1;
     double nnzssecol = 0;
     double nnzwhcol = 0;
     for (UWORD ii = startIdx; ii < endIdx; ii++) {
       UWORD row = A.row_indices[ii];
       double tempsum = 0;
       for (UWORD kk = 0; kk < k; kk++) {
         tempsum += (W(row, kk) * H(col, kk));
       }
       nnzwhcol += tempsum * tempsum;
       nnzssecol += (A.values[ii] - tempsum) * (A.values[ii] - tempsum);
     }
     nnzsse += nnzssecol;
     nnzwh += nnzwhcol;
   }
   qr_econ(Qw, Rw, W);
   qr_econ(Qh, Rh, H);
   RwRh = Rw * Rh.t();
   double normWH = arma::norm(RwRh, "fro");
   Rw.clear();
   Rh.clear();
   Qw.clear();
   Qh.clear();
   RwRh.clear();
   INFO << "error compute time " << toc() << std::endl;
   double fastErr = sqrt(nnzsse + (normWH * normWH - nnzwh));
   return (fastErr);
 }

 #if defined(MKL_FOUND) && defined(BUILD_SPARSE)
 /*
  * Sparse (CSC) times dense product through MKL's mkl_dcscmm:
  *   C = alpha * op(A) * B + beta * C   with alpha = 1 and beta = 0.
  *
  * mklMat is csc representation
  * Bt is the row major order of the arma B matrix
  * Ct is the row major order of the arma C matrix
  * Once you receive Ct, transpose again to print
  * C using arma
  *
  * @param mklMat sparse left operand; its values, row_indices and col_ptrs
  *               arrays are handed to MKL directly.
  * @param transa transpose flag forwarded to mkl_dcscmm (e.g. 'N').
  * @param Bt     dense right operand, see above.
  * @param Ct     caller-allocated output buffer, see above.
  *
  * Declared inline because this header-defined function may be included by
  * several translation units.
  */
 inline void ARMAMKLSCSCMM(const SP_MAT &mklMat, char transa, const MAT &Bt,
                           double *Ct) {
   // The index arrays are reinterpreted rather than converted, so the sparse
   // index type and MKL_INT must have the same width.
   static_assert(sizeof(MKL_INT) == sizeof(*mklMat.col_ptrs),
                 "MKL_INT and the sparse matrix index type differ in size");
   MKL_INT m = static_cast<MKL_INT>(mklMat.n_rows);
   MKL_INT k = static_cast<MKL_INT>(mklMat.n_cols);
   MKL_INT n = static_cast<MKL_INT>(Bt.n_rows);
   double alpha = 1.0;
   double beta = 0.0;
   // Matrix descriptor passed to mkl_dcscmm; the Intel MKL reference for
   // mkl_?cscmm documents the meaning of each character. Kept in a writable
   // array because a string literal cannot bind to char*.
   char matdescra[] = "GUNC";
   MKL_INT ldb = n;
   MKL_INT ldc = n;
   // Older MKL prototypes take non-const pointers, so constness is removed
   // explicitly. NOTE(review): assumes MKL does not write to these inputs.
   MKL_INT *pntrb = const_cast<MKL_INT *>(
       reinterpret_cast<const MKL_INT *>(mklMat.col_ptrs));
   MKL_INT *pntre = pntrb + 1;
   MKL_INT *indx = const_cast<MKL_INT *>(
       reinterpret_cast<const MKL_INT *>(mklMat.row_indices));
   mkl_dcscmm(&transa, &m, &n, &k, &alpha, matdescra,
              const_cast<double *>(mklMat.values), indx, pntrb, pntre,
              const_cast<double *>(Bt.memptr()), &ldb, &beta, Ct, &ldc);
 }
 #endif

 /*
  * This is an sgemm wrapper for armadillo matrices
  * Something is going crazy with armadillo
  */

 void cblas_sgemm(const MAT &A, const MAT &B, double *C) {
   UWORD m = A.n_rows;
   UWORD n = B.n_cols;
   UWORD k = A.n_cols;
   double alpha = 1.0;
   double beta = 0.0;
   cblas_dgemm(CblasColMajor, CblasNoTrans, CblasNoTrans, m, n, k, alpha,
               A.memptr(), m, B.memptr(), k, beta, C, m);
 }

 #endif  // COMMON_UTILS_HPP_
randNMF
void randNMF(const UWORD m, const UWORD n, const UWORD k, const double sparsity, T *A)
Definition: utils.hpp:134

NUMBEROF_DECIMAL_PLACES
#define NUMBEROF_DECIMAL_PLACES
Definition: utils.h:46

makeSparse
void makeSparse(const double sparsity, T(*X))
Definition: utils.hpp:122

tic
void tic()
start the timer. easy to call as tic(); some code; double t=toc();
Definition: utils.hpp:42

fixNumericalError
void fixNumericalError(T *X, const double prec=EPSILON_1EMINUS16)
Definition: utils.hpp:58

tictoc_stack_omp_clock
static std::stack< double > tictoc_stack_omp_clock
Definition: utils.hpp:38

EPSILON_1EMINUS16
#define EPSILON_1EMINUS16
Definition: utils.h:43

computeObjectiveError
double computeObjectiveError(const INPUTTYPE &A, const LRTYPE &W, const LRTYPE &H)
Definition: utils.hpp:180

utils.h

cartesian_product
std::vector< std::vector< size_t > > cartesian_product(const std::vector< std::vector< size_t >> &v)
Definition: utils.hpp:160

UVEC
#define UVEC
Definition: utils.h:58

cblas_sgemm
void cblas_sgemm(const MAT &A, const MAT &B, double *C)
Definition: utils.hpp:268

SP_MAT
#define SP_MAT
Definition: utils.h:57

tictoc_stack
static std::stack< std::chrono::steady_clock::time_point > tictoc_stack
Definition: utils.hpp:37

INFO
#define INFO
Definition: utils.h:36

printVector
void printVector(const std::vector< T > &x)
Definition: utils.hpp:153

powersof10
static ULONG powersof10[16]
Definition: utils.hpp:20

UWORD
#define UWORD
Definition: utils.h:60

MAT
#define MAT
Definition: utils.h:52

toc
double toc()
Definition: utils.hpp:48

ULONG
unsigned long ULONG
Definition: utils.h:69

absmat
void absmat(T *X)
Definition: utils.hpp:116

RAND_SEED
#define RAND_SEED
Definition: utils.h:47

RAND_SEED_SPARSE
#define RAND_SEED_SPARSE
Definition: utils.h:48

random_sieve
int random_sieve(const int nthprime)
Definition: utils.hpp:74

fixDecimalPlaces
void fixDecimalPlaces(T *X, const int places=NUMBEROF_DECIMAL_PLACES)
Definition: utils.hpp:64