You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							143 lines
						
					
					
						
							3.2 KiB
						
					
					
				
			
		
		
		
			
			
			
				
					
				
				
					
				
			
		
		
	
	
							143 lines
						
					
					
						
							3.2 KiB
						
					
					
				| 
 | |
| #include <iostream> | |
| #include <Eigen/Core> | |
| #include <bench/BenchTimer.h> | |
|  | |
| using namespace Eigen; | |
| using namespace std; | |
| 
 | |
| #define END 9 | |
|  | |
| template<int S> struct map_size { enum { ret = S }; }; | |
| template<>  struct map_size<10> { enum { ret = 20 }; }; | |
| template<>  struct map_size<11> { enum { ret = 50 }; }; | |
| template<>  struct map_size<12> { enum { ret = 100 }; }; | |
| template<>  struct map_size<13> { enum { ret = 300 }; }; | |
| 
 | |
| template<int M, int N,int K> struct alt_prod | |
| { | |
|   enum { | |
|     ret = M==1 && N==1 ? InnerProduct | |
|         : K==1 ? OuterProduct | |
|         : M==1 ? GemvProduct | |
|         : N==1 ? GemvProduct | |
|         : GemmProduct | |
|   }; | |
| }; | |
|          | |
| void print_mode(int mode) | |
| { | |
|   if(mode==InnerProduct) std::cout << "i"; | |
|   if(mode==OuterProduct) std::cout << "o"; | |
|   if(mode==CoeffBasedProductMode) std::cout << "c"; | |
|   if(mode==LazyCoeffBasedProductMode) std::cout << "l"; | |
|   if(mode==GemvProduct) std::cout << "v"; | |
|   if(mode==GemmProduct) std::cout << "m"; | |
| } | |
| 
 | |
| template<int Mode, typename Lhs, typename Rhs, typename Res> | |
| EIGEN_DONT_INLINE void prod(const Lhs& a, const Rhs& b, Res& c) | |
| { | |
|   c.noalias() += typename ProductReturnType<Lhs,Rhs,Mode>::Type(a,b); | |
| } | |
| 
 | |
| template<int M, int N, int K, typename Scalar, int Mode> | |
| EIGEN_DONT_INLINE void bench_prod() | |
| { | |
|   typedef Matrix<Scalar,M,K> Lhs; Lhs a; a.setRandom(); | |
|   typedef Matrix<Scalar,K,N> Rhs; Rhs b; b.setRandom(); | |
|   typedef Matrix<Scalar,M,N> Res; Res c; c.setRandom(); | |
| 
 | |
|   BenchTimer t; | |
|   double n = 2.*double(M)*double(N)*double(K); | |
|   int rep = 100000./n; | |
|   rep /= 2; | |
|   if(rep<1) rep = 1; | |
|   do { | |
|     rep *= 2; | |
|     t.reset(); | |
|     BENCH(t,1,rep,prod<CoeffBasedProductMode>(a,b,c)); | |
|   } while(t.best()<0.1); | |
|    | |
|   t.reset(); | |
|   BENCH(t,5,rep,prod<Mode>(a,b,c)); | |
| 
 | |
|   print_mode(Mode); | |
|   std::cout << int(1e-6*n*rep/t.best()) << "\t"; | |
| } | |
| 
 | |
| template<int N> struct print_n; | |
| template<int M, int N, int K> struct loop_on_m; | |
| template<int M, int N, int K, typename Scalar, int Mode> struct loop_on_n; | |
| 
 | |
| template<int M, int N, int K> | |
| struct loop_on_k | |
| { | |
|   static void run() | |
|   { | |
|     std::cout << "K=" << K << "\t"; | |
|     print_n<N>::run(); | |
|     std::cout << "\n"; | |
| 
 | |
|     loop_on_m<M,N,K>::run(); | |
|     std::cout << "\n\n"; | |
| 
 | |
|     loop_on_k<M,N,K+1>::run(); | |
|   } | |
| }; | |
| 
 | |
| template<int M, int N> | |
| struct loop_on_k<M,N,END> { static void run(){} }; | |
| 
 | |
| 
 | |
| template<int M, int N, int K> | |
| struct loop_on_m | |
| { | |
|   static void run() | |
|   { | |
|     std::cout << M << "f\t"; | |
|     loop_on_n<M,N,K,float,CoeffBasedProductMode>::run(); | |
|     std::cout << "\n"; | |
|      | |
|     std::cout << M << "f\t"; | |
|     loop_on_n<M,N,K,float,-1>::run(); | |
|     std::cout << "\n"; | |
| 
 | |
|     loop_on_m<M+1,N,K>::run(); | |
|   } | |
| }; | |
| 
 | |
| template<int N, int K> | |
| struct loop_on_m<END,N,K> { static void run(){} }; | |
| 
 | |
| template<int M, int N, int K, typename Scalar, int Mode> | |
| struct loop_on_n | |
| { | |
|   static void run() | |
|   { | |
|     bench_prod<M,N,K,Scalar,Mode==-1? alt_prod<M,N,K>::ret : Mode>(); | |
|      | |
|     loop_on_n<M,N+1,K,Scalar,Mode>::run(); | |
|   } | |
| }; | |
| 
 | |
| template<int M, int K, typename Scalar, int Mode> | |
| struct loop_on_n<M,END,K,Scalar,Mode> { static void run(){} }; | |
| 
 | |
| template<int N> struct print_n | |
| { | |
|   static void run() | |
|   { | |
|     std::cout << map_size<N>::ret << "\t"; | |
|     print_n<N+1>::run(); | |
|   } | |
| }; | |
| 
 | |
| template<> struct print_n<END> { static void run(){} }; | |
| 
 | |
| int main() | |
| { | |
|   loop_on_k<1,1,1>::run(); | |
|    | |
|   return 0;  | |
| }
 |