You cannot select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							143 lines
						
					
					
						
							3.2 KiB
						
					
					
				
			
		
		
		
			
			
			
				
					
				
				
					
				
			
		
		
	
	
							143 lines
						
					
					
						
							3.2 KiB
						
					
					
				
								
							 | 
						|
								#include <iostream>
							 | 
						|
								#include <StormEigen/Core>
							 | 
						|
								#include <bench/BenchTimer.h>
							 | 
						|
								
							 | 
						|
								using namespace StormEigen;
							 | 
						|
								using namespace std;
							 | 
						|
								
							 | 
						|
								// Exclusive upper bound of the compile-time loops over M, N and K: the
								// loop_on_k / loop_on_m / loop_on_n / print_n specializations on END
								// have an empty run() and thereby stop the template recursion.
								#define END 9
							 | 
						|
								
							 | 
						|
								/// Compile-time map from a loop index S to the size printed for it.
								/// By default an index stands for itself (ret == S); the specializations
								/// below remap indices 10..13 to the larger sizes 20, 50, 100 and 300.
								template<int S> struct map_size { enum { ret = S }; };
								template<>  struct map_size<10> { enum { ret = 20 }; };
								template<>  struct map_size<11> { enum { ret = 50 }; };
								template<>  struct map_size<12> { enum { ret = 100 }; };
								template<>  struct map_size<13> { enum { ret = 300 }; };
							 | 
						|
								
							 | 
						|
								template<int M, int N,int K> struct alt_prod
							 | 
						|
								{
							 | 
						|
								  enum {
							 | 
						|
								    ret = M==1 && N==1 ? InnerProduct
							 | 
						|
								        : K==1 ? OuterProduct
							 | 
						|
								        : M==1 ? GemvProduct
							 | 
						|
								        : N==1 ? GemvProduct
							 | 
						|
								        : GemmProduct
							 | 
						|
								  };
							 | 
						|
								};
							 | 
						|
								        
							 | 
						|
								void print_mode(int mode)
							 | 
						|
								{
							 | 
						|
								  if(mode==InnerProduct) std::cout << "i";
							 | 
						|
								  if(mode==OuterProduct) std::cout << "o";
							 | 
						|
								  if(mode==CoeffBasedProductMode) std::cout << "c";
							 | 
						|
								  if(mode==LazyCoeffBasedProductMode) std::cout << "l";
							 | 
						|
								  if(mode==GemvProduct) std::cout << "v";
							 | 
						|
								  if(mode==GemmProduct) std::cout << "m";
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								template<int Mode, typename Lhs, typename Rhs, typename Res>
							 | 
						|
								STORMEIGEN_DONT_INLINE void prod(const Lhs& a, const Rhs& b, Res& c)
							 | 
						|
								{
							 | 
						|
								  c.noalias() += typename ProductReturnType<Lhs,Rhs,Mode>::Type(a,b);
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								template<int M, int N, int K, typename Scalar, int Mode>
							 | 
						|
								STORMEIGEN_DONT_INLINE void bench_prod()
							 | 
						|
								{
							 | 
						|
								  typedef Matrix<Scalar,M,K> Lhs; Lhs a; a.setRandom();
							 | 
						|
								  typedef Matrix<Scalar,K,N> Rhs; Rhs b; b.setRandom();
							 | 
						|
								  typedef Matrix<Scalar,M,N> Res; Res c; c.setRandom();
							 | 
						|
								
							 | 
						|
								  BenchTimer t;
							 | 
						|
								  double n = 2.*double(M)*double(N)*double(K);
							 | 
						|
								  int rep = 100000./n;
							 | 
						|
								  rep /= 2;
							 | 
						|
								  if(rep<1) rep = 1;
							 | 
						|
								  do {
							 | 
						|
								    rep *= 2;
							 | 
						|
								    t.reset();
							 | 
						|
								    BENCH(t,1,rep,prod<CoeffBasedProductMode>(a,b,c));
							 | 
						|
								  } while(t.best()<0.1);
							 | 
						|
								  
							 | 
						|
								  t.reset();
							 | 
						|
								  BENCH(t,5,rep,prod<Mode>(a,b,c));
							 | 
						|
								
							 | 
						|
								  print_mode(Mode);
							 | 
						|
								  std::cout << int(1e-6*n*rep/t.best()) << "\t";
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								template<int N> struct print_n;
							 | 
						|
								template<int M, int N, int K> struct loop_on_m;
							 | 
						|
								template<int M, int N, int K, typename Scalar, int Mode> struct loop_on_n;
							 | 
						|
								
							 | 
						|
								template<int M, int N, int K>
							 | 
						|
								struct loop_on_k
							 | 
						|
								{
							 | 
						|
								  static void run()
							 | 
						|
								  {
							 | 
						|
								    std::cout << "K=" << K << "\t";
							 | 
						|
								    print_n<N>::run();
							 | 
						|
								    std::cout << "\n";
							 | 
						|
								
							 | 
						|
								    loop_on_m<M,N,K>::run();
							 | 
						|
								    std::cout << "\n\n";
							 | 
						|
								
							 | 
						|
								    loop_on_k<M,N,K+1>::run();
							 | 
						|
								  }
							 | 
						|
								};
							 | 
						|
								
							 | 
						|
								template<int M, int N>
							 | 
						|
								struct loop_on_k<M,N,END> { static void run(){} };
							 | 
						|
								
							 | 
						|
								
							 | 
						|
								template<int M, int N, int K>
							 | 
						|
								struct loop_on_m
							 | 
						|
								{
							 | 
						|
								  static void run()
							 | 
						|
								  {
							 | 
						|
								    std::cout << M << "f\t";
							 | 
						|
								    loop_on_n<M,N,K,float,CoeffBasedProductMode>::run();
							 | 
						|
								    std::cout << "\n";
							 | 
						|
								    
							 | 
						|
								    std::cout << M << "f\t";
							 | 
						|
								    loop_on_n<M,N,K,float,-1>::run();
							 | 
						|
								    std::cout << "\n";
							 | 
						|
								
							 | 
						|
								    loop_on_m<M+1,N,K>::run();
							 | 
						|
								  }
							 | 
						|
								};
							 | 
						|
								
							 | 
						|
								template<int N, int K>
							 | 
						|
								struct loop_on_m<END,N,K> { static void run(){} };
							 | 
						|
								
							 | 
						|
								template<int M, int N, int K, typename Scalar, int Mode>
							 | 
						|
								struct loop_on_n
							 | 
						|
								{
							 | 
						|
								  static void run()
							 | 
						|
								  {
							 | 
						|
								    bench_prod<M,N,K,Scalar,Mode==-1? alt_prod<M,N,K>::ret : Mode>();
							 | 
						|
								    
							 | 
						|
								    loop_on_n<M,N+1,K,Scalar,Mode>::run();
							 | 
						|
								  }
							 | 
						|
								};
							 | 
						|
								
							 | 
						|
								template<int M, int K, typename Scalar, int Mode>
							 | 
						|
								struct loop_on_n<M,END,K,Scalar,Mode> { static void run(){} };
							 | 
						|
								
							 | 
						|
								template<int N> struct print_n
							 | 
						|
								{
							 | 
						|
								  static void run()
							 | 
						|
								  {
							 | 
						|
								    std::cout << map_size<N>::ret << "\t";
							 | 
						|
								    print_n<N+1>::run();
							 | 
						|
								  }
							 | 
						|
								};
							 | 
						|
								
							 | 
						|
								template<> struct print_n<END> { static void run(){} };
							 | 
						|
								
							 | 
						|
								int main()
							 | 
						|
								{
							 | 
						|
								  loop_on_k<1,1,1>::run();
							 | 
						|
								  
							 | 
						|
								  return 0; 
							 | 
						|
								}
							 |