1*bf2c3715SXin Li
2*bf2c3715SXin Li #define EIGEN_INTERNAL_DEBUG_CACHE_QUERY
3*bf2c3715SXin Li #include <iostream>
4*bf2c3715SXin Li #include "../Eigen/Core"
5*bf2c3715SXin Li
6*bf2c3715SXin Li using namespace Eigen;
7*bf2c3715SXin Li using namespace std;
8*bf2c3715SXin Li
// DUMP_CPUID(CODE): runs EIGEN_CPUID for leaf CODE (sub-leaf 0) and prints the
// four resulting 32-bit values (stored in order as EAX, EBX, ECX, EDX by
// EIGEN_CPUID) on std::cout, each in hexadecimal, followed by a newline.
//
// - CODE is printed with the stream's current base (decimal by default) and is
//   evaluated twice, so it must not have side effects.
// - The values are printed as unsigned hex rather than being cast to a pointer:
//   an int -> pointer cast sign-extends on 64-bit targets and its textual form
//   is implementation-defined.
// - The stream's format flags are restored afterwards so that the std::hex
//   used here does not leak into later output.
// - Wrapped in do { } while(0) so that `DUMP_CPUID(x);` is a single statement.
#define DUMP_CPUID(CODE) do { \
    int cpuid_regs_[4] = {0, 0, 0, 0}; \
    EIGEN_CPUID(cpuid_regs_, (CODE), 0); \
    const std::ios_base::fmtflags saved_flags_ = std::cout.flags(); \
    std::cout << "The code " << (CODE) << " gives " << std::hex \
              << "0x" << static_cast<unsigned int>(cpuid_regs_[0]) << " " \
              << "0x" << static_cast<unsigned int>(cpuid_regs_[1]) << " " \
              << "0x" << static_cast<unsigned int>(cpuid_regs_[2]) << " " \
              << "0x" << static_cast<unsigned int>(cpuid_regs_[3]) << " " \
              << std::endl; \
    std::cout.flags(saved_flags_); \
  } while(0)
17*bf2c3715SXin Li
main()18*bf2c3715SXin Li int main()
19*bf2c3715SXin Li {
20*bf2c3715SXin Li cout << "Eigen's L1 = " << internal::queryL1CacheSize() << endl;
21*bf2c3715SXin Li cout << "Eigen's L2/L3 = " << internal::queryTopLevelCacheSize() << endl;
22*bf2c3715SXin Li int l1, l2, l3;
23*bf2c3715SXin Li internal::queryCacheSizes(l1, l2, l3);
24*bf2c3715SXin Li cout << "Eigen's L1, L2, L3 = " << l1 << " " << l2 << " " << l3 << endl;
25*bf2c3715SXin Li
26*bf2c3715SXin Li #ifdef EIGEN_CPUID
27*bf2c3715SXin Li
28*bf2c3715SXin Li int abcd[4];
29*bf2c3715SXin Li int string[8];
30*bf2c3715SXin Li char* string_char = (char*)(string);
31*bf2c3715SXin Li
32*bf2c3715SXin Li // vendor ID
33*bf2c3715SXin Li EIGEN_CPUID(abcd,0x0,0);
34*bf2c3715SXin Li string[0] = abcd[1];
35*bf2c3715SXin Li string[1] = abcd[3];
36*bf2c3715SXin Li string[2] = abcd[2];
37*bf2c3715SXin Li string[3] = 0;
38*bf2c3715SXin Li cout << endl;
39*bf2c3715SXin Li cout << "vendor id = " << string_char << endl;
40*bf2c3715SXin Li cout << endl;
41*bf2c3715SXin Li int max_funcs = abcd[0];
42*bf2c3715SXin Li
43*bf2c3715SXin Li internal::queryCacheSizes_intel_codes(l1, l2, l3);
44*bf2c3715SXin Li cout << "Eigen's intel codes L1, L2, L3 = " << l1 << " " << l2 << " " << l3 << endl;
45*bf2c3715SXin Li if(max_funcs>=4)
46*bf2c3715SXin Li {
47*bf2c3715SXin Li internal::queryCacheSizes_intel_direct(l1, l2, l3);
48*bf2c3715SXin Li cout << "Eigen's intel direct L1, L2, L3 = " << l1 << " " << l2 << " " << l3 << endl;
49*bf2c3715SXin Li }
50*bf2c3715SXin Li internal::queryCacheSizes_amd(l1, l2, l3);
51*bf2c3715SXin Li cout << "Eigen's amd L1, L2, L3 = " << l1 << " " << l2 << " " << l3 << endl;
52*bf2c3715SXin Li cout << endl;
53*bf2c3715SXin Li
54*bf2c3715SXin Li // dump Intel direct method
55*bf2c3715SXin Li if(max_funcs>=4)
56*bf2c3715SXin Li {
57*bf2c3715SXin Li l1 = l2 = l3 = 0;
58*bf2c3715SXin Li int cache_id = 0;
59*bf2c3715SXin Li int cache_type = 0;
60*bf2c3715SXin Li do {
61*bf2c3715SXin Li abcd[0] = abcd[1] = abcd[2] = abcd[3] = 0;
62*bf2c3715SXin Li EIGEN_CPUID(abcd,0x4,cache_id);
63*bf2c3715SXin Li cache_type = (abcd[0] & 0x0F) >> 0;
64*bf2c3715SXin Li int cache_level = (abcd[0] & 0xE0) >> 5; // A[7:5]
65*bf2c3715SXin Li int ways = (abcd[1] & 0xFFC00000) >> 22; // B[31:22]
66*bf2c3715SXin Li int partitions = (abcd[1] & 0x003FF000) >> 12; // B[21:12]
67*bf2c3715SXin Li int line_size = (abcd[1] & 0x00000FFF) >> 0; // B[11:0]
68*bf2c3715SXin Li int sets = (abcd[2]); // C[31:0]
69*bf2c3715SXin Li int cache_size = (ways+1) * (partitions+1) * (line_size+1) * (sets+1);
70*bf2c3715SXin Li
71*bf2c3715SXin Li cout << "cache[" << cache_id << "].type = " << cache_type << "\n";
72*bf2c3715SXin Li cout << "cache[" << cache_id << "].level = " << cache_level << "\n";
73*bf2c3715SXin Li cout << "cache[" << cache_id << "].ways = " << ways << "\n";
74*bf2c3715SXin Li cout << "cache[" << cache_id << "].partitions = " << partitions << "\n";
75*bf2c3715SXin Li cout << "cache[" << cache_id << "].line_size = " << line_size << "\n";
76*bf2c3715SXin Li cout << "cache[" << cache_id << "].sets = " << sets << "\n";
77*bf2c3715SXin Li cout << "cache[" << cache_id << "].size = " << cache_size << "\n";
78*bf2c3715SXin Li
79*bf2c3715SXin Li cache_id++;
80*bf2c3715SXin Li } while(cache_type>0 && cache_id<16);
81*bf2c3715SXin Li }
82*bf2c3715SXin Li
83*bf2c3715SXin Li // dump everything
84*bf2c3715SXin Li std::cout << endl <<"Raw dump:" << endl;
85*bf2c3715SXin Li for(int i=0; i<max_funcs; ++i)
86*bf2c3715SXin Li DUMP_CPUID(i);
87*bf2c3715SXin Li
88*bf2c3715SXin Li DUMP_CPUID(0x80000000);
89*bf2c3715SXin Li DUMP_CPUID(0x80000001);
90*bf2c3715SXin Li DUMP_CPUID(0x80000002);
91*bf2c3715SXin Li DUMP_CPUID(0x80000003);
92*bf2c3715SXin Li DUMP_CPUID(0x80000004);
93*bf2c3715SXin Li DUMP_CPUID(0x80000005);
94*bf2c3715SXin Li DUMP_CPUID(0x80000006);
95*bf2c3715SXin Li DUMP_CPUID(0x80000007);
96*bf2c3715SXin Li DUMP_CPUID(0x80000008);
97*bf2c3715SXin Li #else
98*bf2c3715SXin Li cout << "EIGEN_CPUID is not defined" << endl;
99*bf2c3715SXin Li #endif
100*bf2c3715SXin Li return 0;
101*bf2c3715SXin Li }
102