// RUN: %clang_cc1 -triple x86_64-apple-darwin -std=c++11 -emit-llvm -o - %s | FileCheck %s

// Verify while loop is recognized after sequence of pragma clang loop directives.
//
// Stores 2 * i into List[i] for every i in [0, Length). The five stacked
// pragmas all precede the single while loop below; the metadata directives at
// the end of this file expect their options together on one loop node (LOOP_1).
void while_test(int *List, int Length) {
  // CHECK: define {{.*}} @_Z10while_test
  int i = 0;

#pragma clang loop vectorize(enable)
#pragma clang loop interleave_count(4)
#pragma clang loop vectorize_width(4)
#pragma clang loop unroll(full)
#pragma clang loop distribute(enable)
  while (i < Length) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_1:.*]]
    List[i] = i * 2;
    i++;
  }
}

// Verify do loop is recognized after multi-option pragma clang loop directive.
//
// Stores 2 * i into List[i], starting at i = 0. Because this is a do/while
// loop the body runs once before the condition is tested, so List[0] is
// written even when Length <= 0. All four loop options are given on a single
// pragma line; the metadata directives at the end of this file look for them
// on LOOP_2.
void do_test(int *List, int Length) {
  int i = 0;

#pragma clang loop vectorize_width(8) interleave_count(4) unroll(disable) distribute(disable)
  do {
    // CHECK: br i1 {{.*}}, label {{.*}}, label {{.*}}, !llvm.loop ![[LOOP_2:.*]]
    List[i] = i * 2;
    i++;
  } while (i < Length);
}

// Scoped enumeration (underlying type short) that supplies the interleave and
// unroll counts for_test hands to its pragmas via static_cast<int>.
enum struct Tuner : short { Interleave = 4, Unroll = 8 };

// Verify for loop is recognized after sequence of pragma clang loop directives.
//
// Stores 2 * i into List[i] for every i in [0, Length). The pragma operands
// are static_cast expressions over Tuner enumerators rather than plain integer
// literals; the metadata directives at the end of this file expect an
// interleave count of 4 and an unroll count of 8 on LOOP_3.
void for_test(int *List, int Length) {
#pragma clang loop interleave(enable)
#pragma clang loop interleave_count(static_cast<int>(Tuner::Interleave))
#pragma clang loop unroll_count(static_cast<int>(Tuner::Unroll))
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_3:.*]]
    List[i] = i * 2;
  }
}

// Verify c++11 for range loop is recognized after
// sequence of pragma clang loop directives.
//
// NOTE: List is never initialized, and each element is read, converted to int
// and then used as an index back into List. The function is only meant to be
// compiled to IR (see the first line of this file); it is not safe to execute.
void for_range_test() {
  double List[100];

#pragma clang loop vectorize_width(2) interleave_count(2)
  for (int i : List) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_4:.*]]
    List[i] = i;
  }
}

// Verify disable pragma clang loop directive generates correct metadata
//
// Stores 2 * i into List[i] for every i in [0, Length). The metadata
// directives at the end of this file expect LOOP_5 to carry a vectorize width
// of 1, unroll.disable, and distribute.enable set to false.
void disable_test(int *List, int Length) {
#pragma clang loop vectorize(disable) unroll(disable) distribute(disable)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_5:.*]]
    List[i] = i * 2;
  }
}

// Loop-hint operands spelled as macros. The tests that follow use them inside
// pragma clang loop arguments (and to initialize constants) to verify that
// macros are expanded there. They are removed again with #undef after the last
// function that uses them.
#define VECWIDTH 2
#define INTCOUNT 2
#define UNROLLCOUNT 8

// Verify defines are correctly resolved in pragma clang loop directive
//
// Stores i * Value into List[i] for every i in [0, Length). Every pragma
// operand is one of the VECWIDTH / INTCOUNT / UNROLLCOUNT macros defined above;
// the metadata directives at the end of this file expect width 2, interleave
// count 2 and unroll count 8 on LOOP_6.
void for_define_test(int *List, int Length, int Value) {
#pragma clang loop vectorize_width(VECWIDTH) interleave_count(INTCOUNT)
#pragma clang loop unroll_count(UNROLLCOUNT)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_6:.*]]
    List[i] = i * Value;
  }
}

// Verify constant expressions are handled correctly.
//
// The first loop stores i into List[i]; the second adds i to List[i]. Both
// pragma operands are arithmetic expressions that evaluate to 5 (1 + 4, and
// 3 + VECWIDTH with VECWIDTH defined as 2), which is the width the metadata
// directives at the end of this file expect for LOOP_7 and LOOP_8.
// (The function name keeps its original spelling.)
void for_contant_expression_test(int *List, int Length) {
#pragma clang loop vectorize_width(1 + 4)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_7:.*]]
    List[i] = i;
  }

#pragma clang loop vectorize_width(3 + VECWIDTH)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_8:.*]]
    List[i] += i;
  }
}

// Verify metadata is generated when template is used.
//
// Stores i * Value into List[i] for every i in [0, Length). The pragma
// operands are plain literals; only the element type A is a template
// parameter. template_test further down instantiates this with A = double.
template <typename A>
void for_template_test(A *List, int Length, A Value) {
#pragma clang loop vectorize_width(8) interleave_count(8) unroll_count(8)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_9:.*]]
    List[i] = i * Value;
  }
}

105*67e74705SXin Li // Verify define is resolved correctly when template is used.
106*67e74705SXin Li template <typename A, typename T>
for_template_define_test(A * List,int Length,A Value)107*67e74705SXin Li void for_template_define_test(A *List, int Length, A Value) {
108*67e74705SXin Li const T VWidth = VECWIDTH;
109*67e74705SXin Li const T ICount = INTCOUNT;
110*67e74705SXin Li const T UCount = UNROLLCOUNT;
111*67e74705SXin Li #pragma clang loop vectorize_width(VWidth) interleave_count(ICount)
112*67e74705SXin Li #pragma clang loop unroll_count(UCount)
113*67e74705SXin Li for (int i = 0; i < Length; i++) {
114*67e74705SXin Li // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_10:.*]]
115*67e74705SXin Li List[i] = i * Value;
116*67e74705SXin Li }
117*67e74705SXin Li }
118*67e74705SXin Li
// Verify templates and constant expressions are handled correctly.
//
// The first loop stores i into List[i]; the remaining three each add i to
// List[i]. The pragma operands are built from the non-type template
// parameters V, I and U, combined with the VECWIDTH / INTCOUNT / UNROLLCOUNT
// macros and the local constant Scale. template_test instantiates this with
// V = 2, I = 4, U = 8, for which the operands evaluate to:
//   loop 1: width 2,  interleave 4,  unroll 8   (LOOP_11)
//   loop 2: width 6,  interleave 10, unroll 24  (LOOP_12)
//   loop 3: width 8,  interleave 16, unroll 32  (LOOP_13)
//   loop 4: width 10                            (LOOP_14)
template <typename A, int V, int I, int U>
void for_template_constant_expression_test(A *List, int Length) {
#pragma clang loop vectorize_width(V) interleave_count(I) unroll_count(U)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_11:.*]]
    List[i] = i;
  }

#pragma clang loop vectorize_width(V * 2 + VECWIDTH) interleave_count(I * 2 + INTCOUNT) unroll_count(U * 2 + UNROLLCOUNT)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_12:.*]]
    List[i] += i;
  }

  const int Scale = 4;
#pragma clang loop vectorize_width(Scale * V) interleave_count(Scale * I) unroll_count(Scale * U)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_13:.*]]
    List[i] += i;
  }

#pragma clang loop vectorize_width((Scale * V) + 2)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_14:.*]]
    List[i] += i;
  }
}

// Drop the loop-hint macros now that every function using them has been
// defined, so the names do not leak into the rest of the file.
#undef VECWIDTH
#undef INTCOUNT
#undef UNROLLCOUNT

152*67e74705SXin Li // Use templates defined above. Test verifies metadata is generated correctly.
template_test(double * List,int Length)153*67e74705SXin Li void template_test(double *List, int Length) {
154*67e74705SXin Li double Value = 10;
155*67e74705SXin Li
156*67e74705SXin Li for_template_test<double>(List, Length, Value);
157*67e74705SXin Li for_template_define_test<double, int>(List, Length, Value);
158*67e74705SXin Li for_template_constant_expression_test<double, 2, 4, 8>(List, Length);
159*67e74705SXin Li }
160*67e74705SXin Li
// CHECK: ![[LOOP_1]] = distinct !{![[LOOP_1]], ![[WIDTH_4:.*]], ![[INTERLEAVE_4:.*]], ![[INTENABLE_1:.*]], ![[UNROLL_FULL:.*]], ![[DISTRIBUTE_ENABLE:.*]]}
// CHECK: ![[WIDTH_4]] = !{!"llvm.loop.vectorize.width", i32 4}
// CHECK: ![[INTERLEAVE_4]] = !{!"llvm.loop.interleave.count", i32 4}
// CHECK: ![[INTENABLE_1]] = !{!"llvm.loop.vectorize.enable", i1 true}
// CHECK: ![[UNROLL_FULL]] = !{!"llvm.loop.unroll.full"}
// CHECK: ![[DISTRIBUTE_ENABLE]] = !{!"llvm.loop.distribute.enable", i1 true}
// CHECK: ![[LOOP_2]] = distinct !{![[LOOP_2]], ![[WIDTH_8:.*]], ![[INTERLEAVE_4:.*]], ![[UNROLL_DISABLE:.*]], ![[DISTRIBUTE_DISABLE:.*]]}
// CHECK: ![[WIDTH_8]] = !{!"llvm.loop.vectorize.width", i32 8}
// CHECK: ![[UNROLL_DISABLE]] = !{!"llvm.loop.unroll.disable"}
// CHECK: ![[DISTRIBUTE_DISABLE]] = !{!"llvm.loop.distribute.enable", i1 false}
// CHECK: ![[LOOP_3]] = distinct !{![[LOOP_3]], ![[INTERLEAVE_4:.*]], ![[UNROLL_8:.*]], ![[INTENABLE_1:.*]]}
// CHECK: ![[UNROLL_8]] = !{!"llvm.loop.unroll.count", i32 8}
// CHECK: ![[LOOP_4]] = distinct !{![[LOOP_4]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]]}
// CHECK: ![[WIDTH_2]] = !{!"llvm.loop.vectorize.width", i32 2}
// CHECK: ![[INTERLEAVE_2]] = !{!"llvm.loop.interleave.count", i32 2}
// CHECK: ![[LOOP_5]] = distinct !{![[LOOP_5]], ![[WIDTH_1:.*]], ![[UNROLL_DISABLE:.*]], ![[DISTRIBUTE_DISABLE:.*]]}
// CHECK: ![[WIDTH_1]] = !{!"llvm.loop.vectorize.width", i32 1}
// CHECK: ![[LOOP_6]] = distinct !{![[LOOP_6]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]], ![[UNROLL_8:.*]]}
// CHECK: ![[LOOP_7]] = distinct !{![[LOOP_7]], ![[WIDTH_5:.*]]}
// CHECK: ![[WIDTH_5]] = !{!"llvm.loop.vectorize.width", i32 5}
// CHECK: ![[LOOP_8]] = distinct !{![[LOOP_8]], ![[WIDTH_5:.*]]}
// CHECK: ![[LOOP_9]] = distinct !{![[LOOP_9]], ![[WIDTH_8:.*]], ![[INTERLEAVE_8:.*]], ![[UNROLL_8:.*]]}
// CHECK: ![[INTERLEAVE_8]] = !{!"llvm.loop.interleave.count", i32 8}
// CHECK: ![[LOOP_10]] = distinct !{![[LOOP_10]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]], ![[UNROLL_8:.*]]}
// CHECK: ![[LOOP_11]] = distinct !{![[LOOP_11]], ![[WIDTH_2:.*]], ![[INTERLEAVE_4:.*]], ![[UNROLL_8:.*]]}
// CHECK: ![[LOOP_12]] = distinct !{![[LOOP_12]], ![[WIDTH_6:.*]], ![[INTERLEAVE_10:.*]], ![[UNROLL_24:.*]]}
// CHECK: ![[WIDTH_6]] = !{!"llvm.loop.vectorize.width", i32 6}
// CHECK: ![[INTERLEAVE_10]] = !{!"llvm.loop.interleave.count", i32 10}
// CHECK: ![[UNROLL_24]] = !{!"llvm.loop.unroll.count", i32 24}
// CHECK: ![[LOOP_13]] = distinct !{![[LOOP_13]], ![[WIDTH_8:.*]], ![[INTERLEAVE_16:.*]], ![[UNROLL_32:.*]]}
// CHECK: ![[INTERLEAVE_16]] = !{!"llvm.loop.interleave.count", i32 16}
// CHECK: ![[UNROLL_32]] = !{!"llvm.loop.unroll.count", i32 32}
// CHECK: ![[LOOP_14]] = distinct !{![[LOOP_14]], ![[WIDTH_10:.*]]}
// CHECK: ![[WIDTH_10]] = !{!"llvm.loop.vectorize.width", i32 10}