1*bf2c3715SXin Li #include <iostream>
2*bf2c3715SXin Li #include <iomanip>
3*bf2c3715SXin Li #include <Eigen/Core>
4*bf2c3715SXin Li #include <Eigen/Geometry>
5*bf2c3715SXin Li #include <bench/BenchTimer.h>
6*bf2c3715SXin Li
7*bf2c3715SXin Li using namespace Eigen;
8*bf2c3715SXin Li using namespace std;
9*bf2c3715SXin Li
// Iteration count of the inner timed loop in test_transform::run().
// The #ifndef guard lets an earlier definition (e.g. -DREPEAT=<n> on the
// compiler command line) take precedence over this default.
#ifndef REPEAT
#define REPEAT 1000000
#endif
13*bf2c3715SXin Li
// Selects which product expression a func<> specialization evaluates.
// Kept as a plain (unscoped) enum because the values are passed as the
// `int opt` template argument of func<>.
enum func_opt
{
  TV,       // a1 * a2
  TMATV,    // a1.matrix() * a2
  TMATVMAT  // a1.matrix() * a2.matrix()
};
20*bf2c3715SXin Li
21*bf2c3715SXin Li
// Primary template, declared but never defined: only the partial
// specializations on `opt` (one per func_opt value) provide a body.
//   res   - type returned by run()
//   arg1  - type of the left operand
//   arg2  - type of the right operand
//   opt   - func_opt value choosing the expression to evaluate
template <class res, class arg1, class arg2, int opt>
struct func;
24*bf2c3715SXin Li
25*bf2c3715SXin Li template <class res, class arg1, class arg2>
26*bf2c3715SXin Li struct func<res, arg1, arg2, TV>
27*bf2c3715SXin Li {
runfunc28*bf2c3715SXin Li static EIGEN_DONT_INLINE res run( arg1& a1, arg2& a2 )
29*bf2c3715SXin Li {
30*bf2c3715SXin Li asm ("");
31*bf2c3715SXin Li return a1 * a2;
32*bf2c3715SXin Li }
33*bf2c3715SXin Li };
34*bf2c3715SXin Li
35*bf2c3715SXin Li template <class res, class arg1, class arg2>
36*bf2c3715SXin Li struct func<res, arg1, arg2, TMATV>
37*bf2c3715SXin Li {
runfunc38*bf2c3715SXin Li static EIGEN_DONT_INLINE res run( arg1& a1, arg2& a2 )
39*bf2c3715SXin Li {
40*bf2c3715SXin Li asm ("");
41*bf2c3715SXin Li return a1.matrix() * a2;
42*bf2c3715SXin Li }
43*bf2c3715SXin Li };
44*bf2c3715SXin Li
45*bf2c3715SXin Li template <class res, class arg1, class arg2>
46*bf2c3715SXin Li struct func<res, arg1, arg2, TMATVMAT>
47*bf2c3715SXin Li {
runfunc48*bf2c3715SXin Li static EIGEN_DONT_INLINE res run( arg1& a1, arg2& a2 )
49*bf2c3715SXin Li {
50*bf2c3715SXin Li asm ("");
51*bf2c3715SXin Li return res(a1.matrix() * a2.matrix());
52*bf2c3715SXin Li }
53*bf2c3715SXin Li };
54*bf2c3715SXin Li
55*bf2c3715SXin Li template <class func, class arg1, class arg2>
56*bf2c3715SXin Li struct test_transform
57*bf2c3715SXin Li {
runtest_transform58*bf2c3715SXin Li static void run()
59*bf2c3715SXin Li {
60*bf2c3715SXin Li arg1 a1;
61*bf2c3715SXin Li a1.setIdentity();
62*bf2c3715SXin Li arg2 a2;
63*bf2c3715SXin Li a2.setIdentity();
64*bf2c3715SXin Li
65*bf2c3715SXin Li BenchTimer timer;
66*bf2c3715SXin Li timer.reset();
67*bf2c3715SXin Li for (int k=0; k<10; ++k)
68*bf2c3715SXin Li {
69*bf2c3715SXin Li timer.start();
70*bf2c3715SXin Li for (int k=0; k<REPEAT; ++k)
71*bf2c3715SXin Li a2 = func::run( a1, a2 );
72*bf2c3715SXin Li timer.stop();
73*bf2c3715SXin Li }
74*bf2c3715SXin Li cout << setprecision(4) << fixed << timer.value() << "s " << endl;;
75*bf2c3715SXin Li }
76*bf2c3715SXin Li };
77*bf2c3715SXin Li
78*bf2c3715SXin Li
// Benchmarks "vector = transform (op) vector" for one configuration.
//   op      - func_opt value selecting the expression (see func<>)
//   scalar  - scalar type of the transform and the vector
//   mode    - Transform mode argument
//   option  - options argument given to both Transform and Matrix
//   vsize   - number of rows of the column vector
// Prints the stringified scalar, mode, option and vsize as a row label, then
// lets test_transform<>::run() print the timing on the same line.
// The body is wrapped in do { } while (0) so the expansion is a single
// statement and stays correct under an unbraced if/else.
#define run_vec( op, scalar, mode, option, vsize ) \
  do { \
    std::cout << #scalar << "\t " << #mode << "\t " << #option << " " << #vsize << " "; \
    typedef Transform<scalar, 3, mode, option> Trans; \
    typedef Matrix<scalar, vsize, 1, option> Vec; \
    typedef func<Vec,Trans,Vec,op> Func; \
    test_transform< Func, Trans, Vec >::run(); \
  } while (0)
87*bf2c3715SXin Li
// Benchmarks "transform = transform (op) transform" for one configuration.
//   op      - func_opt value selecting the expression (see func<>)
//   scalar  - scalar type of the transform
//   mode    - Transform mode argument
//   option  - options argument given to Transform
// Prints the stringified scalar, mode and option as a row label, then lets
// test_transform<>::run() print the timing on the same line.
// The body is wrapped in do { } while (0) so the expansion is a single
// statement and stays correct under an unbraced if/else.
#define run_trans( op, scalar, mode, option ) \
  do { \
    std::cout << #scalar << "\t " << #mode << "\t " << #option << " "; \
    typedef Transform<scalar, 3, mode, option> Trans; \
    typedef func<Trans,Trans,Trans,op> Func; \
    test_transform< Func, Trans, Trans >::run(); \
  } while (0)
95*bf2c3715SXin Li
main(int argc,char * argv[])96*bf2c3715SXin Li int main(int argc, char* argv[])
97*bf2c3715SXin Li {
98*bf2c3715SXin Li cout << "vec = trans * vec" << endl;
99*bf2c3715SXin Li run_vec(TV, float, Isometry, AutoAlign, 3);
100*bf2c3715SXin Li run_vec(TV, float, Isometry, DontAlign, 3);
101*bf2c3715SXin Li run_vec(TV, float, Isometry, AutoAlign, 4);
102*bf2c3715SXin Li run_vec(TV, float, Isometry, DontAlign, 4);
103*bf2c3715SXin Li run_vec(TV, float, Projective, AutoAlign, 4);
104*bf2c3715SXin Li run_vec(TV, float, Projective, DontAlign, 4);
105*bf2c3715SXin Li run_vec(TV, double, Isometry, AutoAlign, 3);
106*bf2c3715SXin Li run_vec(TV, double, Isometry, DontAlign, 3);
107*bf2c3715SXin Li run_vec(TV, double, Isometry, AutoAlign, 4);
108*bf2c3715SXin Li run_vec(TV, double, Isometry, DontAlign, 4);
109*bf2c3715SXin Li run_vec(TV, double, Projective, AutoAlign, 4);
110*bf2c3715SXin Li run_vec(TV, double, Projective, DontAlign, 4);
111*bf2c3715SXin Li
112*bf2c3715SXin Li cout << "vec = trans.matrix() * vec" << endl;
113*bf2c3715SXin Li run_vec(TMATV, float, Isometry, AutoAlign, 4);
114*bf2c3715SXin Li run_vec(TMATV, float, Isometry, DontAlign, 4);
115*bf2c3715SXin Li run_vec(TMATV, double, Isometry, AutoAlign, 4);
116*bf2c3715SXin Li run_vec(TMATV, double, Isometry, DontAlign, 4);
117*bf2c3715SXin Li
118*bf2c3715SXin Li cout << "trans = trans1 * trans" << endl;
119*bf2c3715SXin Li run_trans(TV, float, Isometry, AutoAlign);
120*bf2c3715SXin Li run_trans(TV, float, Isometry, DontAlign);
121*bf2c3715SXin Li run_trans(TV, double, Isometry, AutoAlign);
122*bf2c3715SXin Li run_trans(TV, double, Isometry, DontAlign);
123*bf2c3715SXin Li run_trans(TV, float, Projective, AutoAlign);
124*bf2c3715SXin Li run_trans(TV, float, Projective, DontAlign);
125*bf2c3715SXin Li run_trans(TV, double, Projective, AutoAlign);
126*bf2c3715SXin Li run_trans(TV, double, Projective, DontAlign);
127*bf2c3715SXin Li
128*bf2c3715SXin Li cout << "trans = trans1.matrix() * trans.matrix()" << endl;
129*bf2c3715SXin Li run_trans(TMATVMAT, float, Isometry, AutoAlign);
130*bf2c3715SXin Li run_trans(TMATVMAT, float, Isometry, DontAlign);
131*bf2c3715SXin Li run_trans(TMATVMAT, double, Isometry, AutoAlign);
132*bf2c3715SXin Li run_trans(TMATVMAT, double, Isometry, DontAlign);
133*bf2c3715SXin Li }
134*bf2c3715SXin Li
135