1*bf2c3715SXin Li // #define EIGEN_TAUCS_SUPPORT
2*bf2c3715SXin Li // #define EIGEN_CHOLMOD_SUPPORT
3*bf2c3715SXin Li #include <iostream>
4*bf2c3715SXin Li #include <Eigen/Sparse>
5*bf2c3715SXin Li
// g++ -DSIZE=10000 -DDENSITY=0.001 sparse_cholesky.cpp -I.. -DDENSEMATRIX -O3 -g0 -DNDEBUG -DNBTRIES=1 -I /home/gael/Coding/LinearAlgebra/taucs_full/src/ -I/home/gael/Coding/LinearAlgebra/taucs_full/build/linux/ -L/home/gael/Coding/LinearAlgebra/taucs_full/lib/linux/ -ltaucs /home/gael/Coding/LinearAlgebra/GotoBLAS/libgoto.a -lpthread -I /home/gael/Coding/LinearAlgebra/SuiteSparse/CHOLMOD/Include/ $CHOLLIB -I /home/gael/Coding/LinearAlgebra/SuiteSparse/UFconfig/ /home/gael/Coding/LinearAlgebra/SuiteSparse/CCOLAMD/Lib/libccolamd.a /home/gael/Coding/LinearAlgebra/SuiteSparse/CHOLMOD/Lib/libcholmod.a -lmetis /home/gael/Coding/LinearAlgebra/SuiteSparse/AMD/Lib/libamd.a /home/gael/Coding/LinearAlgebra/SuiteSparse/CAMD/Lib/libcamd.a /home/gael/Coding/LinearAlgebra/SuiteSparse/CCOLAMD/Lib/libccolamd.a /home/gael/Coding/LinearAlgebra/SuiteSparse/COLAMD/Lib/libcolamd.a -llapack && ./a.out
7*bf2c3715SXin Li
// Feature switches defined ahead of the BenchSparseUtil.h include.
// NOTE(review): presumably read by that header to leave out GMM++ / MTL
// support -- confirm against BenchSparseUtil.h.
#define NOGMM
#define NOMTL

// Matrix dimension used for both rows and columns; override with -DSIZE=<n>.
#if !defined(SIZE)
#  define SIZE 10
#endif

// Fill density of the generated matrix; override with -DDENSITY=<d>.
#if !defined(DENSITY)
#  define DENSITY 0.01
#endif

// Inner repetition count of the BENCH macro; override with -DREPEAT=<n>.
#if !defined(REPEAT)
#  define REPEAT 1
#endif
22*bf2c3715SXin Li
23*bf2c3715SXin Li #include "BenchSparseUtil.h"
24*bf2c3715SXin Li
// Lower density bound; only referenced by the commented-out density sweep
// in main(). Override with -DMINDENSITY=<d>.
#if !defined(MINDENSITY)
#  define MINDENSITY 0.0004
#endif

// Outer repetition count of the BENCH macro; override with -DNBTRIES=<n>.
#if !defined(NBTRIES)
#  define NBTRIES 10
#endif
32*bf2c3715SXin Li
// BENCH(X): resets `timer`, then performs NBTRIES measurements. Each
// measurement brackets REPEAT executions of the statement(s) X between
// timer.start() and timer.stop().
// Requires a variable named `timer` in the expanding scope that provides
// reset(), start() and stop(). X is pasted verbatim, so it must carry its own
// terminating semicolon.
#define BENCH(X) \
  timer.reset(); \
  for (int _attempt=0; _attempt<NBTRIES; ++_attempt) { \
    timer.start(); \
    for (int _rep=0; _rep<REPEAT; ++_rep) { \
      X \
    } \
    timer.stop(); \
  }
40*bf2c3715SXin Li
41*bf2c3715SXin Li // typedef SparseMatrix<Scalar,UpperTriangular> EigenSparseTriMatrix;
42*bf2c3715SXin Li typedef SparseMatrix<Scalar,SelfAdjoint|LowerTriangular> EigenSparseSelfAdjointMatrix;
43*bf2c3715SXin Li
fillSpdMatrix(float density,int rows,int cols,EigenSparseSelfAdjointMatrix & dst)44*bf2c3715SXin Li void fillSpdMatrix(float density, int rows, int cols, EigenSparseSelfAdjointMatrix& dst)
45*bf2c3715SXin Li {
46*bf2c3715SXin Li dst.startFill(rows*cols*density);
47*bf2c3715SXin Li for(int j = 0; j < cols; j++)
48*bf2c3715SXin Li {
49*bf2c3715SXin Li dst.fill(j,j) = internal::random<Scalar>(10,20);
50*bf2c3715SXin Li for(int i = j+1; i < rows; i++)
51*bf2c3715SXin Li {
52*bf2c3715SXin Li Scalar v = (internal::random<float>(0,1) < density) ? internal::random<Scalar>() : 0;
53*bf2c3715SXin Li if (v!=0)
54*bf2c3715SXin Li dst.fill(i,j) = v;
55*bf2c3715SXin Li }
56*bf2c3715SXin Li
57*bf2c3715SXin Li }
58*bf2c3715SXin Li dst.endFill();
59*bf2c3715SXin Li }
60*bf2c3715SXin Li
61*bf2c3715SXin Li #include <Eigen/Cholesky>
62*bf2c3715SXin Li
63*bf2c3715SXin Li template<int Backend>
doEigen(const char * name,const EigenSparseSelfAdjointMatrix & sm1,int flags=0)64*bf2c3715SXin Li void doEigen(const char* name, const EigenSparseSelfAdjointMatrix& sm1, int flags = 0)
65*bf2c3715SXin Li {
66*bf2c3715SXin Li std::cout << name << "..." << std::flush;
67*bf2c3715SXin Li BenchTimer timer;
68*bf2c3715SXin Li timer.start();
69*bf2c3715SXin Li SparseLLT<EigenSparseSelfAdjointMatrix,Backend> chol(sm1, flags);
70*bf2c3715SXin Li timer.stop();
71*bf2c3715SXin Li std::cout << ":\t" << timer.value() << endl;
72*bf2c3715SXin Li
73*bf2c3715SXin Li std::cout << " nnz: " << sm1.nonZeros() << " => " << chol.matrixL().nonZeros() << "\n";
74*bf2c3715SXin Li // std::cout << "sparse\n" << chol.matrixL() << "%\n";
75*bf2c3715SXin Li }
76*bf2c3715SXin Li
main(int argc,char * argv[])77*bf2c3715SXin Li int main(int argc, char *argv[])
78*bf2c3715SXin Li {
79*bf2c3715SXin Li int rows = SIZE;
80*bf2c3715SXin Li int cols = SIZE;
81*bf2c3715SXin Li float density = DENSITY;
82*bf2c3715SXin Li BenchTimer timer;
83*bf2c3715SXin Li
84*bf2c3715SXin Li VectorXf b = VectorXf::Random(cols);
85*bf2c3715SXin Li VectorXf x = VectorXf::Random(cols);
86*bf2c3715SXin Li
87*bf2c3715SXin Li bool densedone = false;
88*bf2c3715SXin Li
89*bf2c3715SXin Li //for (float density = DENSITY; density>=MINDENSITY; density*=0.5)
90*bf2c3715SXin Li // float density = 0.5;
91*bf2c3715SXin Li {
92*bf2c3715SXin Li EigenSparseSelfAdjointMatrix sm1(rows, cols);
93*bf2c3715SXin Li std::cout << "Generate sparse matrix (might take a while)...\n";
94*bf2c3715SXin Li fillSpdMatrix(density, rows, cols, sm1);
95*bf2c3715SXin Li std::cout << "DONE\n\n";
96*bf2c3715SXin Li
97*bf2c3715SXin Li // dense matrices
98*bf2c3715SXin Li #ifdef DENSEMATRIX
99*bf2c3715SXin Li if (!densedone)
100*bf2c3715SXin Li {
101*bf2c3715SXin Li densedone = true;
102*bf2c3715SXin Li std::cout << "Eigen Dense\t" << density*100 << "%\n";
103*bf2c3715SXin Li DenseMatrix m1(rows,cols);
104*bf2c3715SXin Li eiToDense(sm1, m1);
105*bf2c3715SXin Li m1 = (m1 + m1.transpose()).eval();
106*bf2c3715SXin Li m1.diagonal() *= 0.5;
107*bf2c3715SXin Li
108*bf2c3715SXin Li // BENCH(LLT<DenseMatrix> chol(m1);)
109*bf2c3715SXin Li // std::cout << "dense:\t" << timer.value() << endl;
110*bf2c3715SXin Li
111*bf2c3715SXin Li BenchTimer timer;
112*bf2c3715SXin Li timer.start();
113*bf2c3715SXin Li LLT<DenseMatrix> chol(m1);
114*bf2c3715SXin Li timer.stop();
115*bf2c3715SXin Li std::cout << "dense:\t" << timer.value() << endl;
116*bf2c3715SXin Li int count = 0;
117*bf2c3715SXin Li for (int j=0; j<cols; ++j)
118*bf2c3715SXin Li for (int i=j; i<rows; ++i)
119*bf2c3715SXin Li if (!internal::isMuchSmallerThan(internal::abs(chol.matrixL()(i,j)), 0.1))
120*bf2c3715SXin Li count++;
121*bf2c3715SXin Li std::cout << "dense: " << "nnz = " << count << "\n";
122*bf2c3715SXin Li // std::cout << "dense:\n" << m1 << "\n\n" << chol.matrixL() << endl;
123*bf2c3715SXin Li }
124*bf2c3715SXin Li #endif
125*bf2c3715SXin Li
126*bf2c3715SXin Li // eigen sparse matrices
127*bf2c3715SXin Li doEigen<Eigen::DefaultBackend>("Eigen/Sparse", sm1, Eigen::IncompleteFactorization);
128*bf2c3715SXin Li
129*bf2c3715SXin Li #ifdef EIGEN_CHOLMOD_SUPPORT
130*bf2c3715SXin Li doEigen<Eigen::Cholmod>("Eigen/Cholmod", sm1, Eigen::IncompleteFactorization);
131*bf2c3715SXin Li #endif
132*bf2c3715SXin Li
133*bf2c3715SXin Li #ifdef EIGEN_TAUCS_SUPPORT
134*bf2c3715SXin Li doEigen<Eigen::Taucs>("Eigen/Taucs", sm1, Eigen::IncompleteFactorization);
135*bf2c3715SXin Li #endif
136*bf2c3715SXin Li
137*bf2c3715SXin Li #if 0
138*bf2c3715SXin Li // TAUCS
139*bf2c3715SXin Li {
140*bf2c3715SXin Li taucs_ccs_matrix A = sm1.asTaucsMatrix();
141*bf2c3715SXin Li
142*bf2c3715SXin Li //BENCH(taucs_ccs_matrix* chol = taucs_ccs_factor_llt(&A, 0, 0);)
143*bf2c3715SXin Li // BENCH(taucs_supernodal_factor_to_ccs(taucs_ccs_factor_llt_ll(&A));)
144*bf2c3715SXin Li // std::cout << "taucs:\t" << timer.value() << endl;
145*bf2c3715SXin Li
146*bf2c3715SXin Li taucs_ccs_matrix* chol = taucs_ccs_factor_llt(&A, 0, 0);
147*bf2c3715SXin Li
148*bf2c3715SXin Li for (int j=0; j<cols; ++j)
149*bf2c3715SXin Li {
150*bf2c3715SXin Li for (int i=chol->colptr[j]; i<chol->colptr[j+1]; ++i)
151*bf2c3715SXin Li std::cout << chol->values.d[i] << " ";
152*bf2c3715SXin Li }
153*bf2c3715SXin Li }
154*bf2c3715SXin Li
155*bf2c3715SXin Li // CHOLMOD
156*bf2c3715SXin Li #ifdef EIGEN_CHOLMOD_SUPPORT
157*bf2c3715SXin Li {
158*bf2c3715SXin Li cholmod_common c;
159*bf2c3715SXin Li cholmod_start (&c);
160*bf2c3715SXin Li cholmod_sparse A;
161*bf2c3715SXin Li cholmod_factor *L;
162*bf2c3715SXin Li
163*bf2c3715SXin Li A = sm1.asCholmodMatrix();
164*bf2c3715SXin Li BenchTimer timer;
165*bf2c3715SXin Li // timer.reset();
166*bf2c3715SXin Li timer.start();
167*bf2c3715SXin Li std::vector<int> perm(cols);
168*bf2c3715SXin Li // std::vector<int> set(ncols);
169*bf2c3715SXin Li for (int i=0; i<cols; ++i)
170*bf2c3715SXin Li perm[i] = i;
171*bf2c3715SXin Li // c.nmethods = 1;
172*bf2c3715SXin Li // c.method[0] = 1;
173*bf2c3715SXin Li
174*bf2c3715SXin Li c.nmethods = 1;
175*bf2c3715SXin Li c.method [0].ordering = CHOLMOD_NATURAL;
176*bf2c3715SXin Li c.postorder = 0;
177*bf2c3715SXin Li c.final_ll = 1;
178*bf2c3715SXin Li
179*bf2c3715SXin Li L = cholmod_analyze_p(&A, &perm[0], &perm[0], cols, &c);
180*bf2c3715SXin Li timer.stop();
181*bf2c3715SXin Li std::cout << "cholmod/analyze:\t" << timer.value() << endl;
182*bf2c3715SXin Li timer.reset();
183*bf2c3715SXin Li timer.start();
184*bf2c3715SXin Li cholmod_factorize(&A, L, &c);
185*bf2c3715SXin Li timer.stop();
186*bf2c3715SXin Li std::cout << "cholmod/factorize:\t" << timer.value() << endl;
187*bf2c3715SXin Li
188*bf2c3715SXin Li cholmod_sparse* cholmat = cholmod_factor_to_sparse(L, &c);
189*bf2c3715SXin Li
190*bf2c3715SXin Li cholmod_print_factor(L, "Factors", &c);
191*bf2c3715SXin Li
192*bf2c3715SXin Li cholmod_print_sparse(cholmat, "Chol", &c);
193*bf2c3715SXin Li cholmod_write_sparse(stdout, cholmat, 0, 0, &c);
194*bf2c3715SXin Li //
195*bf2c3715SXin Li // cholmod_print_sparse(&A, "A", &c);
196*bf2c3715SXin Li // cholmod_write_sparse(stdout, &A, 0, 0, &c);
197*bf2c3715SXin Li
198*bf2c3715SXin Li
199*bf2c3715SXin Li // for (int j=0; j<cols; ++j)
200*bf2c3715SXin Li // {
201*bf2c3715SXin Li // for (int i=chol->colptr[j]; i<chol->colptr[j+1]; ++i)
202*bf2c3715SXin Li // std::cout << chol->values.s[i] << " ";
203*bf2c3715SXin Li // }
204*bf2c3715SXin Li }
205*bf2c3715SXin Li #endif
206*bf2c3715SXin Li
207*bf2c3715SXin Li #endif
208*bf2c3715SXin Li
209*bf2c3715SXin Li
210*bf2c3715SXin Li
211*bf2c3715SXin Li }
212*bf2c3715SXin Li
213*bf2c3715SXin Li
214*bf2c3715SXin Li return 0;
215*bf2c3715SXin Li }
216*bf2c3715SXin Li
217