|  | 
 | #include <iostream> | 
 | #include <Eigen/Core> | 
 | #include <bench/BenchTimer.h> | 
 |  | 
 | using namespace Eigen; | 
 | using namespace std; | 
 |  | 
 | #define END 9 | 
 |  | 
 | template <int S> | 
 | struct map_size { | 
 |   enum { ret = S }; | 
 | }; | 
 | template <> | 
 | struct map_size<10> { | 
 |   enum { ret = 20 }; | 
 | }; | 
 | template <> | 
 | struct map_size<11> { | 
 |   enum { ret = 50 }; | 
 | }; | 
 | template <> | 
 | struct map_size<12> { | 
 |   enum { ret = 100 }; | 
 | }; | 
 | template <> | 
 | struct map_size<13> { | 
 |   enum { ret = 300 }; | 
 | }; | 
 |  | 
 | template <int M, int N, int K> | 
 | struct alt_prod { | 
 |   enum { | 
 |     ret = M == 1 && N == 1 ? InnerProduct | 
 |           : K == 1         ? OuterProduct | 
 |           : M == 1         ? GemvProduct | 
 |           : N == 1         ? GemvProduct | 
 |                            : GemmProduct | 
 |   }; | 
 | }; | 
 |  | 
 | void print_mode(int mode) { | 
 |   if (mode == InnerProduct) std::cout << "i"; | 
 |   if (mode == OuterProduct) std::cout << "o"; | 
 |   if (mode == CoeffBasedProductMode) std::cout << "c"; | 
 |   if (mode == LazyCoeffBasedProductMode) std::cout << "l"; | 
 |   if (mode == GemvProduct) std::cout << "v"; | 
 |   if (mode == GemmProduct) std::cout << "m"; | 
 | } | 
 |  | 
 | template <int Mode, typename Lhs, typename Rhs, typename Res> | 
 | EIGEN_DONT_INLINE void prod(const Lhs& a, const Rhs& b, Res& c) { | 
 |   c.noalias() += typename ProductReturnType<Lhs, Rhs, Mode>::Type(a, b); | 
 | } | 
 |  | 
 | template <int M, int N, int K, typename Scalar, int Mode> | 
 | EIGEN_DONT_INLINE void bench_prod() { | 
 |   typedef Matrix<Scalar, M, K> Lhs; | 
 |   Lhs a; | 
 |   a.setRandom(); | 
 |   typedef Matrix<Scalar, K, N> Rhs; | 
 |   Rhs b; | 
 |   b.setRandom(); | 
 |   typedef Matrix<Scalar, M, N> Res; | 
 |   Res c; | 
 |   c.setRandom(); | 
 |  | 
 |   BenchTimer t; | 
 |   double n = 2. * double(M) * double(N) * double(K); | 
 |   int rep = 100000. / n; | 
 |   rep /= 2; | 
 |   if (rep < 1) rep = 1; | 
 |   do { | 
 |     rep *= 2; | 
 |     t.reset(); | 
 |     BENCH(t, 1, rep, prod<CoeffBasedProductMode>(a, b, c)); | 
 |   } while (t.best() < 0.1); | 
 |  | 
 |   t.reset(); | 
 |   BENCH(t, 5, rep, prod<Mode>(a, b, c)); | 
 |  | 
 |   print_mode(Mode); | 
 |   std::cout << int(1e-6 * n * rep / t.best()) << "\t"; | 
 | } | 
 |  | 
 | template <int N> | 
 | struct print_n; | 
 | template <int M, int N, int K> | 
 | struct loop_on_m; | 
 | template <int M, int N, int K, typename Scalar, int Mode> | 
 | struct loop_on_n; | 
 |  | 
 | template <int M, int N, int K> | 
 | struct loop_on_k { | 
 |   static void run() { | 
 |     std::cout << "K=" << K << "\t"; | 
 |     print_n<N>::run(); | 
 |     std::cout << "\n"; | 
 |  | 
 |     loop_on_m<M, N, K>::run(); | 
 |     std::cout << "\n\n"; | 
 |  | 
 |     loop_on_k<M, N, K + 1>::run(); | 
 |   } | 
 | }; | 
 |  | 
 | template <int M, int N> | 
 | struct loop_on_k<M, N, END> { | 
 |   static void run() {} | 
 | }; | 
 |  | 
 | template <int M, int N, int K> | 
 | struct loop_on_m { | 
 |   static void run() { | 
 |     std::cout << M << "f\t"; | 
 |     loop_on_n<M, N, K, float, CoeffBasedProductMode>::run(); | 
 |     std::cout << "\n"; | 
 |  | 
 |     std::cout << M << "f\t"; | 
 |     loop_on_n<M, N, K, float, -1>::run(); | 
 |     std::cout << "\n"; | 
 |  | 
 |     loop_on_m<M + 1, N, K>::run(); | 
 |   } | 
 | }; | 
 |  | 
 | template <int N, int K> | 
 | struct loop_on_m<END, N, K> { | 
 |   static void run() {} | 
 | }; | 
 |  | 
 | template <int M, int N, int K, typename Scalar, int Mode> | 
 | struct loop_on_n { | 
 |   static void run() { | 
 |     bench_prod<M, N, K, Scalar, Mode == -1 ? alt_prod<M, N, K>::ret : Mode>(); | 
 |  | 
 |     loop_on_n<M, N + 1, K, Scalar, Mode>::run(); | 
 |   } | 
 | }; | 
 |  | 
 | template <int M, int K, typename Scalar, int Mode> | 
 | struct loop_on_n<M, END, K, Scalar, Mode> { | 
 |   static void run() {} | 
 | }; | 
 |  | 
 | template <int N> | 
 | struct print_n { | 
 |   static void run() { | 
 |     std::cout << map_size<N>::ret << "\t"; | 
 |     print_n<N + 1>::run(); | 
 |   } | 
 | }; | 
 |  | 
 | template <> | 
 | struct print_n<END> { | 
 |   static void run() {} | 
 | }; | 
 |  | 
 | int main() { | 
 |   loop_on_k<1, 1, 1>::run(); | 
 |  | 
 |   return 0; | 
 | } |