bench/benchCholesky.cpp - mirror - Git at Google

 // g++ -DNDEBUG -O3 -I.. benchCholesky.cpp  -o benchCholesky && ./benchCholesky
 // options:
 //  -DBENCH_GSL -lgsl /usr/lib/libcblas.so.3
 //  -DEIGEN_DONT_VECTORIZE
 //  -msse2
 //  -DREPEAT=100
 //  -DTRIES=10
 //  -DSCALAR=double

 #include <iostream>

 #include <Eigen/Core>
 #include <Eigen/Cholesky>
 #include <bench/BenchUtil.h>
 using namespace Eigen;

 // Base iteration budget from which benchLLT derives its per-size repeat count;
 // override with -DREPEAT=<n>.
 #ifndef REPEAT
 #define REPEAT 10000
 #endif

 // Number of timing runs per factorization; override with -DTRIES=<n>.
 #ifndef TRIES
 #define TRIES 10
 #endif

 // Scalar type of the benchmarked matrices. Defaults to float and can be
 // overridden with -DSCALAR=<type> (e.g. -DSCALAR=double), as listed in the
 // build options at the top of this file.
 #ifndef SCALAR
 #define SCALAR float
 #endif
 typedef SCALAR Scalar;

 /**
  * Benchmarks Eigen's LDLT and LLT factorizations for the problem size given by \a m.
  *
  * Only the dimensions of \a m are used: a random matrix `a` of the same shape is
  * generated and the product `a * a.adjoint()` is the matrix that gets factorized.
  * Each factorization is timed over TRIES runs of `repeats` decompositions, and one
  * result line is written to std::cout with the best time per decomposition and the
  * GFLOPS figure derived from it (LDLT first, then LLT). When BENCH_GSL is defined,
  * dynamic-size matrices are additionally timed with gsl_linalg_cholesky_decomp.
  *
  * \param m matrix whose rows()/cols() select the problem size; its coefficients are
  *          never read. An empty matrix (zero rows) is skipped without any output.
  */
 template <typename MatrixType>
 __attribute__((noinline)) void benchLLT(const MatrixType& m) {
   const int rows = m.rows();
   const int cols = m.cols();

   // Nothing to factorize; this also keeps the division by rows * rows below defined.
   if (rows <= 0) return;

   // Operation-count estimate used for the GFLOPS figures.
   double cost = 0;
   for (int j = 0; j < rows; ++j) {
     // j < rows holds here, so this is never negative and needs no clamping.
     const int remaining = rows - j - 1;
     cost += 2 * (remaining * j + remaining + j);
   }

   // Scale the iteration count down with the matrix area, but always run at least
   // once: with a small REPEAT (e.g. -DREPEAT=100) the integer division reaches 0
   // for the larger sizes, which would time an empty loop and print inf/nan.
   int repeats = (REPEAT * 1000) / (rows * rows);
   if (repeats < 1) repeats = 1;

   typedef typename MatrixType::Scalar Scalar;
   typedef Matrix<Scalar, MatrixType::RowsAtCompileTime, MatrixType::RowsAtCompileTime> SquareMatrixType;

   MatrixType a = MatrixType::Random(rows, cols);
   SquareMatrixType covMat = a * a.adjoint();

   BenchTimer timerNoSqrt, timerSqrt;

   // One randomly chosen coefficient of every factor is accumulated so that the
   // decompositions have an observable result.
   Scalar acc = 0;
   int r = internal::random<int>(0, covMat.rows() - 1);
   int c = internal::random<int>(0, covMat.cols() - 1);

   // LDLT timing.
   for (int t = 0; t < TRIES; ++t) {
     timerNoSqrt.start();
     for (int k = 0; k < repeats; ++k) {
       LDLT<SquareMatrixType> cholnosqrt(covMat);
       acc += cholnosqrt.matrixL().coeff(r, c);
     }
     timerNoSqrt.stop();
   }

   // LLT timing.
   for (int t = 0; t < TRIES; ++t) {
     timerSqrt.start();
     for (int k = 0; k < repeats; ++k) {
       LLT<SquareMatrixType> chol(covMat);
       acc += chol.matrixL().coeff(r, c);
     }
     timerSqrt.stop();
   }

   if (MatrixType::RowsAtCompileTime == Dynamic)
     std::cout << "dyn   ";
   else
     std::cout << "fixed ";
   std::cout << covMat.rows() << " \t" << (timerNoSqrt.best()) / repeats << "s "
             << "(" << 1e-9 * cost * repeats / timerNoSqrt.best() << " GFLOPS)\t" << (timerSqrt.best()) / repeats << "s "
             << "(" << 1e-9 * cost * repeats / timerSqrt.best() << " GFLOPS)\n";

 #ifdef BENCH_GSL
   if (MatrixType::RowsAtCompileTime == Dynamic) {
     timerSqrt.reset();

     gsl_matrix* gslCovMat = gsl_matrix_alloc(covMat.rows(), covMat.cols());
     gsl_matrix* gslCopy = gsl_matrix_alloc(covMat.rows(), covMat.cols());

     eiToGsl(covMat, &gslCovMat);
     for (int t = 0; t < TRIES; ++t) {
       timerSqrt.start();
       for (int k = 0; k < repeats; ++k) {
         // The GSL decomposition works on gslCopy, so refresh it from the
         // untouched input on every iteration.
         gsl_matrix_memcpy(gslCopy, gslCovMat);
         gsl_linalg_cholesky_decomp(gslCopy);
         acc += gsl_matrix_get(gslCopy, r, c);
       }
       timerSqrt.stop();
     }

     // NOTE(review): this prints value() scaled by REPEAT / repeats, unlike the
     // best() / repeats figures above -- confirm the intended unit.
     std::cout << " | \t" << timerSqrt.value() * REPEAT / repeats << "s";

     // Release both GSL matrices; the scratch copy used to be leaked.
     gsl_matrix_free(gslCovMat);
     gsl_matrix_free(gslCopy);
   }
 #endif
   std::cout << "\n";
   // make sure the compiler does not optimize too much
   if (acc == 123) std::cout << acc;
 }

 int main(int argc, char* argv[]) {
   const int dynsizes[] = {4, 6, 8, 16, 24, 32, 49, 64, 128, 256, 512, 900, 1500, 0};
   std::cout << "size            LDLT                            LLT";
   //   #ifdef BENCH_GSL
   //   std::cout << "       GSL (standard + double + ATLAS)  ";
   //   #endif
   std::cout << "\n";
   for (int i = 0; dynsizes[i] > 0; ++i) benchLLT(Matrix<Scalar, Dynamic, Dynamic>(dynsizes[i], dynsizes[i]));

   benchLLT(Matrix<Scalar, 2, 2>());
   benchLLT(Matrix<Scalar, 3, 3>());
   benchLLT(Matrix<Scalar, 4, 4>());
   benchLLT(Matrix<Scalar, 5, 5>());
   benchLLT(Matrix<Scalar, 6, 6>());
   benchLLT(Matrix<Scalar, 7, 7>());
   benchLLT(Matrix<Scalar, 8, 8>());
   benchLLT(Matrix<Scalar, 12, 12>());
   benchLLT(Matrix<Scalar, 16, 16>());
   return 0;
 }
	// g++ -DNDEBUG -O3 -I.. benchCholesky.cpp -o benchCholesky && ./benchCholesky
	// options:
	// -DBENCH_GSL -lgsl /usr/lib/libcblas.so.3
	// -DEIGEN_DONT_VECTORIZE
	// -msse2
	// -DREPEAT=100
	// -DTRIES=10
	// -DSCALAR=double

	#include <iostream>

	#include <Eigen/Core>
	#include <Eigen/Cholesky>
	#include <bench/BenchUtil.h>
	using namespace Eigen;

	// Base iteration budget from which benchLLT derives its per-size repeat count;
	// override with -DREPEAT=<n>.
	#ifndef REPEAT
	#define REPEAT 10000
	#endif

	// Number of timing runs per factorization; override with -DTRIES=<n>.
	#ifndef TRIES
	#define TRIES 10
	#endif

	// Scalar type of the benchmarked matrices. Defaults to float and can be
	// overridden with -DSCALAR=<type> (e.g. -DSCALAR=double), as listed in the
	// build options at the top of this file.
	#ifndef SCALAR
	#define SCALAR float
	#endif
	typedef SCALAR Scalar;

	/**
	 * Benchmarks Eigen's LDLT and LLT factorizations for the problem size given by \a m.
	 *
	 * Only the dimensions of \a m are used: a random matrix `a` of the same shape is
	 * generated and the product `a * a.adjoint()` is the matrix that gets factorized.
	 * Each factorization is timed over TRIES runs of `repeats` decompositions, and one
	 * result line is written to std::cout with the best time per decomposition and the
	 * GFLOPS figure derived from it (LDLT first, then LLT). When BENCH_GSL is defined,
	 * dynamic-size matrices are additionally timed with gsl_linalg_cholesky_decomp.
	 *
	 * \param m matrix whose rows()/cols() select the problem size; its coefficients are
	 *          never read. An empty matrix (zero rows) is skipped without any output.
	 */
	template <typename MatrixType>
	__attribute__((noinline)) void benchLLT(const MatrixType& m) {
	  const int rows = m.rows();
	  const int cols = m.cols();

	  // Nothing to factorize; this also keeps the division by rows * rows below defined.
	  if (rows <= 0) return;

	  // Operation-count estimate used for the GFLOPS figures.
	  double cost = 0;
	  for (int j = 0; j < rows; ++j) {
	    // j < rows holds here, so this is never negative and needs no clamping.
	    const int remaining = rows - j - 1;
	    cost += 2 * (remaining * j + remaining + j);
	  }

	  // Scale the iteration count down with the matrix area, but always run at least
	  // once: with a small REPEAT (e.g. -DREPEAT=100) the integer division reaches 0
	  // for the larger sizes, which would time an empty loop and print inf/nan.
	  int repeats = (REPEAT * 1000) / (rows * rows);
	  if (repeats < 1) repeats = 1;

	  typedef typename MatrixType::Scalar Scalar;
	  typedef Matrix<Scalar, MatrixType::RowsAtCompileTime, MatrixType::RowsAtCompileTime> SquareMatrixType;

	  MatrixType a = MatrixType::Random(rows, cols);
	  SquareMatrixType covMat = a * a.adjoint();

	  BenchTimer timerNoSqrt, timerSqrt;

	  // One randomly chosen coefficient of every factor is accumulated so that the
	  // decompositions have an observable result.
	  Scalar acc = 0;
	  int r = internal::random<int>(0, covMat.rows() - 1);
	  int c = internal::random<int>(0, covMat.cols() - 1);

	  // LDLT timing.
	  for (int t = 0; t < TRIES; ++t) {
	    timerNoSqrt.start();
	    for (int k = 0; k < repeats; ++k) {
	      LDLT<SquareMatrixType> cholnosqrt(covMat);
	      acc += cholnosqrt.matrixL().coeff(r, c);
	    }
	    timerNoSqrt.stop();
	  }

	  // LLT timing.
	  for (int t = 0; t < TRIES; ++t) {
	    timerSqrt.start();
	    for (int k = 0; k < repeats; ++k) {
	      LLT<SquareMatrixType> chol(covMat);
	      acc += chol.matrixL().coeff(r, c);
	    }
	    timerSqrt.stop();
	  }

	  if (MatrixType::RowsAtCompileTime == Dynamic)
	    std::cout << "dyn ";
	  else
	    std::cout << "fixed ";
	  std::cout << covMat.rows() << " \t" << (timerNoSqrt.best()) / repeats << "s "
	            << "(" << 1e-9 * cost * repeats / timerNoSqrt.best() << " GFLOPS)\t" << (timerSqrt.best()) / repeats << "s "
	            << "(" << 1e-9 * cost * repeats / timerSqrt.best() << " GFLOPS)\n";

	#ifdef BENCH_GSL
	  if (MatrixType::RowsAtCompileTime == Dynamic) {
	    timerSqrt.reset();

	    gsl_matrix* gslCovMat = gsl_matrix_alloc(covMat.rows(), covMat.cols());
	    gsl_matrix* gslCopy = gsl_matrix_alloc(covMat.rows(), covMat.cols());

	    eiToGsl(covMat, &gslCovMat);
	    for (int t = 0; t < TRIES; ++t) {
	      timerSqrt.start();
	      for (int k = 0; k < repeats; ++k) {
	        // The GSL decomposition works on gslCopy, so refresh it from the
	        // untouched input on every iteration.
	        gsl_matrix_memcpy(gslCopy, gslCovMat);
	        gsl_linalg_cholesky_decomp(gslCopy);
	        acc += gsl_matrix_get(gslCopy, r, c);
	      }
	      timerSqrt.stop();
	    }

	    // The separator is a plain '|'; "\|" is not a valid C++ escape sequence.
	    // NOTE(review): this prints value() scaled by REPEAT / repeats, unlike the
	    // best() / repeats figures above -- confirm the intended unit.
	    std::cout << " | \t" << timerSqrt.value() * REPEAT / repeats << "s";

	    // Release both GSL matrices; the scratch copy used to be leaked.
	    gsl_matrix_free(gslCovMat);
	    gsl_matrix_free(gslCopy);
	  }
	#endif
	  std::cout << "\n";
	  // make sure the compiler does not optimize too much
	  if (acc == 123) std::cout << acc;
	}

	int main(int argc, char* argv[]) {
	const int dynsizes[] = {4, 6, 8, 16, 24, 32, 49, 64, 128, 256, 512, 900, 1500, 0};
	std::cout << "size LDLT LLT";
	// #ifdef BENCH_GSL
	// std::cout << " GSL (standard + double + ATLAS) ";
	// #endif
	std::cout << "\n";
	for (int i = 0; dynsizes[i] > 0; ++i) benchLLT(Matrix<Scalar, Dynamic, Dynamic>(dynsizes[i], dynsizes[i]));

	benchLLT(Matrix<Scalar, 2, 2>());
	benchLLT(Matrix<Scalar, 3, 3>());
	benchLLT(Matrix<Scalar, 4, 4>());
	benchLLT(Matrix<Scalar, 5, 5>());
	benchLLT(Matrix<Scalar, 6, 6>());
	benchLLT(Matrix<Scalar, 7, 7>());
	benchLLT(Matrix<Scalar, 8, 8>());
	benchLLT(Matrix<Scalar, 12, 12>());
	benchLLT(Matrix<Scalar, 16, 16>());
	return 0;
	}