xref: /aosp_15_r20/external/clang/test/OpenMP/teams_firstprivate_codegen.cpp (revision 67e74705e28f6214e480b399dd47ea732279e315)
1*67e74705SXin Li // Test host codegen.
2*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix LAMBDA --check-prefix LAMBDA-64
3*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s
4*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix LAMBDA --check-prefix LAMBDA-64
5*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix LAMBDA --check-prefix LAMBDA-32
6*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s
7*67e74705SXin Li // RUN: %clang_cc1 -DLAMBDA -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix LAMBDA --check-prefix LAMBDA-32
8*67e74705SXin Li 
9*67e74705SXin Li // RUN: %clang_cc1  -verify -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-64
10*67e74705SXin Li // RUN: %clang_cc1  -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s
11*67e74705SXin Li // RUN: %clang_cc1  -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-64
12*67e74705SXin Li // RUN: %clang_cc1  -verify -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-32
13*67e74705SXin Li // RUN: %clang_cc1  -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s
14*67e74705SXin Li // RUN: %clang_cc1  -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-32
15*67e74705SXin Li 
16*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -verify -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix ARRAY --check-prefix ARRAY-64
17*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s
18*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix ARRAY --check-prefix ARRAY-64
19*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -verify -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix ARRAY --check-prefix ARRAY-32
20*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s
21*67e74705SXin Li // RUN: %clang_cc1 -DARRAY  -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix ARRAY --check-prefix ARRAY-32
22*67e74705SXin Li // expected-no-diagnostics
23*67e74705SXin Li #ifndef HEADER
24*67e74705SXin Li #define HEADER
25*67e74705SXin Li #ifndef ARRAY
// Small helper type with user-provided special members. It is used as the
// defaulted second parameter of S's copy constructor further down, so every
// copy of an S also constructs and destroys a temporary St.
26*67e74705SXin Li struct St {
27*67e74705SXin Li   int a, b;
  // Default construction zeroes both fields.
StSt28*67e74705SXin Li   St() : a(0), b(0) {}
  // Not a member-wise copy: a receives st.a + st.b and b is reset to 0.
StSt29*67e74705SXin Li   St(const St &st) : a(st.a + st.b), b(0) {}
  // User-provided (empty) destructor.
~StSt30*67e74705SXin Li   ~St() {}
31*67e74705SXin Li };
32*67e74705SXin Li 
33*67e74705SXin Li volatile int g __attribute__((aligned(128))) = 1212;
34*67e74705SXin Li 
// Class template wrapping a single value f of type T, with user-provided
// constructors and destructor. Two of the constructors read the volatile
// global g declared above.
35*67e74705SXin Li template <class T>
36*67e74705SXin Li struct S {
37*67e74705SXin Li   T f;
  // Converting constructor: f = a + g.
SS38*67e74705SXin Li   S(T a) : f(a + g) {}
  // Default constructor: f = g.
SS39*67e74705SXin Li   S() : f(g) {}
  // Copy constructor with an extra defaulted St argument; each call therefore
  // materializes a temporary St, and f = s.f + t.a.
SS40*67e74705SXin Li   S(const S &s, St t = St()) : f(s.f + t.a) {}
  // Conversion to T returns a value-initialized T; it does not read f.
operator TS41*67e74705SXin Li   operator T() { return T(); }
  // User-provided (empty) destructor.
~SS42*67e74705SXin Li   ~S() {}
43*67e74705SXin Li };
44*67e74705SXin Li 
45*67e74705SXin Li // CHECK-DAG: [[S_FLOAT_TY:%.+]] = type { float }
46*67e74705SXin Li // CHECK-DAG: [[S_INT_TY:%.+]] = type { i{{[0-9]+}} }
47*67e74705SXin Li // CHECK-DAG: [[ST_TY:%.+]] = type { i{{[0-9]+}}, i{{[0-9]+}} }
48*67e74705SXin Li 
// Template version of the firstprivate scenario; main instantiates it as
// tmain<int>. Every variable named in the first firstprivate clause is
// declared with aligned(128), and the directives for the matching outlined
// function later in the file look for "align 128" on the private copies.
// Always returns a value-initialized T.
49*67e74705SXin Li template <typename T>
tmain()50*67e74705SXin Li T tmain() {
51*67e74705SXin Li   S<T> test;
52*67e74705SXin Li   T t_var __attribute__((aligned(128))) = T();
53*67e74705SXin Li   T vec[] __attribute__((aligned(128))) = {1, 2};
54*67e74705SXin Li   S<T> s_arr[] __attribute__((aligned(128))) = {1, 2};
55*67e74705SXin Li   S<T> var __attribute__((aligned(128))) (3);
  // First region: a scalar, a scalar array, an array of S<T> and a single
  // S<T> are all firstprivate; the body writes to the array copies.
56*67e74705SXin Li   #pragma omp target
57*67e74705SXin Li   #pragma omp teams firstprivate(t_var, vec, s_arr, var)
58*67e74705SXin Li   {
59*67e74705SXin Li     vec[0] = t_var;
60*67e74705SXin Li     s_arr[0] = var;
61*67e74705SXin Li   }
  // Second region: only t_var is firstprivate and the body is empty.
62*67e74705SXin Li #pragma omp target
63*67e74705SXin Li #pragma omp teams firstprivate(t_var)
64*67e74705SXin Li   {}
65*67e74705SXin Li   return T();
66*67e74705SXin Li }
67*67e74705SXin Li 
// Test driver with two mutually exclusive bodies selected by the LAMBDA
// macro. The function-local static sivar appears in a firstprivate clause in
// both bodies.
//  - LAMBDA defined: the target/teams region sits inside an immediately
//    invoked lambda, and a second lambda inside the region writes g and sivar
//    through its by-reference captures. Returns 0.
//  - LAMBDA not defined: two target/teams regions on plain locals, then the
//    result of tmain<int>() is returned.
main()68*67e74705SXin Li int main() {
69*67e74705SXin Li   static int sivar;
70*67e74705SXin Li #ifdef LAMBDA
71*67e74705SXin Li   // LAMBDA-LABEL: @main
72*67e74705SXin Li   // LAMBDA: call{{.*}} void [[OUTER_LAMBDA:@.+]](
73*67e74705SXin Li   [&]() {
74*67e74705SXin Li   // LAMBDA: define{{.*}} internal{{.*}} void [[OUTER_LAMBDA]](
75*67e74705SXin Li   // LAMBDA: call {{.*}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 2, {{.+}}* [[OMP_REGION:@.+]] to {{.+}}, i32* {{.+}}, {{.+}})
76*67e74705SXin Li   #pragma omp target
77*67e74705SXin Li   #pragma omp teams firstprivate(g, sivar)
78*67e74705SXin Li   {
79*67e74705SXin Li     // LAMBDA: define{{.*}} internal{{.*}} void [[OMP_REGION]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i32* dereferenceable(4) [[G_IN:%.+]], i{{64|32}} {{.*}}[[SIVAR_IN:%.+]])
80*67e74705SXin Li     // LAMBDA: store i{{[0-9]+}}* [[G_IN]], i{{[0-9]+}}** [[G_ADDR:%.+]],
81*67e74705SXin Li     // LAMBDA: store i{{[0-9]+}} [[SIVAR_IN]], i{{[0-9]+}}* [[SIVAR_ADDR:%.+]],
82*67e74705SXin Li     // LAMBDA: [[G_ADDR_VAL:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** [[G_ADDR]],
83*67e74705SXin Li     // LAMBDA-64: [[SIVAR_CONV:%.+]] = bitcast i64*  [[SIVAR_ADDR]] to i32*
84*67e74705SXin Li     // LAMBDA: [[G_VAL:%.+]] = load i{{[0-9]+}}, i{{[0-9]+}}* [[G_ADDR_VAL]],
85*67e74705SXin Li     // LAMBDA: store i{{[0-9]+}} [[G_VAL]], i{{[0-9]+}}* [[G_LOCAL:%.+]],
    // Writes inside the region; the directives that follow match stores of
    // the constants 1 and 2.
86*67e74705SXin Li     g = 1;
87*67e74705SXin Li     sivar = 2;
88*67e74705SXin Li     // LAMBDA: store i{{[0-9]+}} 1, i{{[0-9]+}}* [[G_LOCAL]],
89*67e74705SXin Li     // LAMBDA-64: store i{{[0-9]+}} 2, i{{[0-9]+}}* [[SIVAR_CONV]],
90*67e74705SXin Li     // LAMBDA-32: store i{{[0-9]+}} 2, i{{[0-9]+}}* [[SIVAR_ADDR]],
91*67e74705SXin Li     // LAMBDA: [[G_PRIVATE_ADDR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG:%.+]], i{{[0-9]+}} 0, i{{[0-9]+}} 0
92*67e74705SXin Li     // LAMBDA: store i{{[0-9]+}}* [[G_LOCAL]], i{{[0-9]+}}** [[G_PRIVATE_ADDR_REF]]
93*67e74705SXin Li     // LAMBDA: [[SIVAR_PRIVATE_ADDR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG:%.+]], i{{[0-9]+}} 0, i{{[0-9]+}} 1
94*67e74705SXin Li     // LAMBDA-64: store i{{[0-9]+}}* [[SIVAR_CONV]], i{{[0-9]+}}** [[SIVAR_PRIVATE_ADDR_REF]]
95*67e74705SXin Li     // LAMBDA-32: store i{{[0-9]+}}* [[SIVAR_ADDR]], i{{[0-9]+}}** [[SIVAR_PRIVATE_ADDR_REF]]
96*67e74705SXin Li     // LAMBDA: call{{.*}} void [[INNER_LAMBDA:@.+]](%{{.+}}* [[ARG]])
97*67e74705SXin Li     [&]() {
98*67e74705SXin Li       // LAMBDA: define {{.+}} void [[INNER_LAMBDA]](%{{.+}}* [[ARG_PTR:%.+]])
99*67e74705SXin Li       // LAMBDA: store %{{.+}}* [[ARG_PTR]], %{{.+}}** [[ARG_PTR_REF:%.+]],
100*67e74705SXin Li       g = 2;
101*67e74705SXin Li       sivar = 4;
102*67e74705SXin Li       // LAMBDA: [[ARG_PTR:%.+]] = load %{{.+}}*, %{{.+}}** [[ARG_PTR_REF]]
103*67e74705SXin Li       // LAMBDA: [[G_PTR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG_PTR]], i{{[0-9]+}} 0, i{{[0-9]+}} 0
104*67e74705SXin Li       // LAMBDA: [[G_REF:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** [[G_PTR_REF]]
105*67e74705SXin Li       // LAMBDA: [[SIVAR_PTR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG_PTR]], i{{[0-9]+}} 0, i{{[0-9]+}} 1
106*67e74705SXin Li       // LAMBDA: [[SIVAR_REF:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** [[SIVAR_PTR_REF]]
107*67e74705SXin Li       // LAMBDA: store i{{[0-9]+}} 4, i{{[0-9]+}}* [[SIVAR_REF]]
108*67e74705SXin Li     }();
109*67e74705SXin Li   }
110*67e74705SXin Li   }();
111*67e74705SXin Li   return 0;
112*67e74705SXin Li #else
  // Non-lambda path: same variable kinds as tmain, but with float-based S
  // objects, no alignment attributes, and sivar added to the clause.
113*67e74705SXin Li   S<float> test;
114*67e74705SXin Li   int t_var = 0;
115*67e74705SXin Li   int vec[] = {1, 2};
116*67e74705SXin Li   S<float> s_arr[] = {1, 2};
117*67e74705SXin Li   S<float> var(3);
118*67e74705SXin Li   #pragma omp target
119*67e74705SXin Li   #pragma omp teams firstprivate(t_var, vec, s_arr, var, sivar)
120*67e74705SXin Li   {
121*67e74705SXin Li     vec[0] = t_var;
122*67e74705SXin Li     s_arr[0] = var;
123*67e74705SXin Li     sivar = 2;
124*67e74705SXin Li   }
  // Second region: only t_var is firstprivate and the body is empty.
125*67e74705SXin Li   #pragma omp target
126*67e74705SXin Li   #pragma omp teams firstprivate(t_var)
127*67e74705SXin Li   {}
128*67e74705SXin Li   return tmain<int>();
129*67e74705SXin Li #endif
130*67e74705SXin Li }
131*67e74705SXin Li 
132*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OFFLOADING:@.+]](
133*67e74705SXin Li // CHECK: call {{.*}}void (%{{.+}}*, i{{[0-9]+}}, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)*, ...) @__kmpc_fork_teams(%{{.+}}* @{{.+}}, i{{[0-9]+}} 5, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)* bitcast (void (i{{[0-9]+}}*, i{{[0-9]+}}*, [2 x i32]*, i{{32|64}}, [2 x [[S_FLOAT_TY]]]*, [[S_FLOAT_TY]]*, i{{[0-9]+}})* [[OMP_OUTLINED:@.+]] to void
134*67e74705SXin Li // CHECK: ret
135*67e74705SXin Li //
136*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OUTLINED]](i{{[0-9]+}}* noalias [[GTID_ADDR:%.+]], i{{[0-9]+}}* noalias %{{.+}}, [2 x i32]* dereferenceable(8) %{{.+}}, i{{32|64}} {{.*}}%{{.+}}, [2 x [[S_FLOAT_TY]]]* dereferenceable(8) %{{.+}}, [[S_FLOAT_TY]]* dereferenceable(4) %{{.+}}, i{{32|64}} {{.*}}[[SIVAR:%.+]])
137*67e74705SXin Li // CHECK: [[T_VAR_PRIV:%.+]] = alloca i{{[0-9]+}},
138*67e74705SXin Li // CHECK: [[SIVAR7_PRIV:%.+]] = alloca i{{[0-9]+}},
139*67e74705SXin Li // CHECK: [[VEC_PRIV:%.+]] = alloca [2 x i{{[0-9]+}}],
140*67e74705SXin Li // CHECK: [[S_ARR_PRIV:%.+]] = alloca [2 x [[S_FLOAT_TY]]],
141*67e74705SXin Li // CHECK: [[VAR_PRIV:%.+]] = alloca [[S_FLOAT_TY]],
142*67e74705SXin Li // CHECK: store i{{[0-9]+}}* [[GTID_ADDR]], i{{[0-9]+}}** [[GTID_ADDR_ADDR:%.+]],
143*67e74705SXin Li 
144*67e74705SXin Li // CHECK: [[VEC_REF:%.+]] = load [2 x i{{[0-9]+}}]*, [2 x i{{[0-9]+}}]** %
145*67e74705SXin Li // CHECK-64: [[T_VAR_CONV:%.+]] = bitcast i64* [[T_VAR_PRIV]] to i32*
146*67e74705SXin Li // CHECK: [[S_ARR_REF:%.+]] = load [2 x [[S_FLOAT_TY]]]*, [2 x [[S_FLOAT_TY]]]** %
147*67e74705SXin Li // CHECK: [[VAR_REF:%.+]] = load [[S_FLOAT_TY]]*, [[S_FLOAT_TY]]** %
148*67e74705SXin Li // CHECK-64: [[SIVAR7_CONV:%.+]] = bitcast i64* [[SIVAR7_PRIV]] to i32*
149*67e74705SXin Li // CHECK: [[VEC_DEST:%.+]] = bitcast [2 x i{{[0-9]+}}]* [[VEC_PRIV]] to i8*
150*67e74705SXin Li // CHECK: [[VEC_SRC:%.+]] = bitcast [2 x i{{[0-9]+}}]* [[VEC_REF]] to i8*
151*67e74705SXin Li // CHECK: call void @llvm.memcpy.{{.+}}(i8* [[VEC_DEST]], i8* [[VEC_SRC]],
152*67e74705SXin Li // CHECK: [[S_ARR_PRIV_BEGIN:%.+]] = getelementptr inbounds [2 x [[S_FLOAT_TY]]], [2 x [[S_FLOAT_TY]]]* [[S_ARR_PRIV]], i{{[0-9]+}} 0, i{{[0-9]+}} 0
153*67e74705SXin Li // CHECK: [[S_ARR_BEGIN:%.+]] = bitcast [2 x [[S_FLOAT_TY]]]* [[S_ARR_REF]] to [[S_FLOAT_TY]]*
154*67e74705SXin Li // CHECK: [[S_ARR_PRIV_END:%.+]] = getelementptr [[S_FLOAT_TY]], [[S_FLOAT_TY]]* [[S_ARR_PRIV_BEGIN]], i{{[0-9]+}} 2
155*67e74705SXin Li // CHECK: [[IS_EMPTY:%.+]] = icmp eq [[S_FLOAT_TY]]* [[S_ARR_PRIV_BEGIN]], [[S_ARR_PRIV_END]]
156*67e74705SXin Li // CHECK: br i1 [[IS_EMPTY]], label %[[S_ARR_BODY_DONE:.+]], label %[[S_ARR_BODY:.+]]
157*67e74705SXin Li // CHECK: [[S_ARR_BODY]]
158*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DEFAULT_CONSTR:@.+]]([[ST_TY]]* [[ST_TY_TEMP:%.+]])
159*67e74705SXin Li // CHECK: call {{.*}} [[S_FLOAT_TY_COPY_CONSTR:@.+]]([[S_FLOAT_TY]]* {{.+}}, [[S_FLOAT_TY]]* {{.+}}, [[ST_TY]]* [[ST_TY_TEMP]])
160*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DESTR:@.+]]([[ST_TY]]* [[ST_TY_TEMP]])
161*67e74705SXin Li // CHECK: br i1 {{.+}}, label %{{.+}}, label %[[S_ARR_BODY]]
162*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DEFAULT_CONSTR]]([[ST_TY]]* [[ST_TY_TEMP:%.+]])
163*67e74705SXin Li // CHECK: call {{.*}} [[S_FLOAT_TY_COPY_CONSTR]]([[S_FLOAT_TY]]* [[VAR_PRIV]], [[S_FLOAT_TY]]* {{.*}} [[VAR_REF]], [[ST_TY]]* [[ST_TY_TEMP]])
164*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DESTR]]([[ST_TY]]* [[ST_TY_TEMP]])
165*67e74705SXin Li 
166*67e74705SXin Li // CHECK-64: store i{{[0-9]+}} 2, i{{[0-9]+}}* [[SIVAR7_CONV]],
167*67e74705SXin Li // CHECK-32: store i{{[0-9]+}} 2, i{{[0-9]+}}* [[SIVAR7_PRIV]],
168*67e74705SXin Li 
169*67e74705SXin Li // CHECK-DAG: call {{.*}} [[S_FLOAT_TY_DESTR:@.+]]([[S_FLOAT_TY]]* [[VAR_PRIV]])
170*67e74705SXin Li // CHECK-DAG: call {{.*}} [[S_FLOAT_TY_DESTR]]([[S_FLOAT_TY]]*
171*67e74705SXin Li // CHECK: ret void
172*67e74705SXin Li 
173*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OFFLOADING_1:@.+]](
174*67e74705SXin Li // CHECK: call {{.*}}void (%{{.+}}*, i{{[0-9]+}}, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)*, ...) @__kmpc_fork_teams(%{{.+}}* @{{.+}}, i{{[0-9]+}} 1, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)* bitcast (void (i{{[0-9]+}}*, i{{[0-9]+}}*, i{{[0-9]+}})* [[OMP_OUTLINED_1:@.+]] to void
175*67e74705SXin Li // CHECK: ret
176*67e74705SXin Li 
177*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OUTLINED_1]](i{{[0-9]+}}* noalias {{%.+}}, i{{[0-9]+}}* noalias {{%.+}}, i{{32|64}} {{.*}}[[T_VAR:%.+]])
178*67e74705SXin Li // CHECK: [[T_VAR_LOC:%.+]] = alloca i{{[0-9]+}},
179*67e74705SXin Li // CHECK: store i{{[0-9]+}} [[T_VAR]], i{{[0-9]+}}* [[T_VAR_LOC]],
180*67e74705SXin Li // CHECK: ret
181*67e74705SXin Li 
182*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OFFLOADING_2:@.+]](i{{[0-9]+}}* {{.+}} {{%.+}}, [2 x i32]* {{.+}} {{%.+}}, [2 x [[S_INT_TY]]]* {{.+}} {{%.+}}, [[S_INT_TY]]* {{.+}} {{%.+}})
183*67e74705SXin Li // CHECK: call {{.*}}void (%{{.+}}*, i{{[0-9]+}}, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)*, ...) @__kmpc_fork_teams(%{{.+}}* @{{.+}}, i{{[0-9]+}} 4, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)* bitcast (void (i{{[0-9]+}}*, i{{[0-9]+}}*, [2 x i32]*, i32*, [2 x [[S_INT_TY]]]*, [[S_INT_TY]]*)* [[OMP_OUTLINED_2:@.+]] to void
184*67e74705SXin Li // CHECK: ret
185*67e74705SXin Li 
186*67e74705SXin Li //
187*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OUTLINED_2]](i{{[0-9]+}}* noalias [[GTID_ADDR:%.+]], i{{[0-9]+}}* noalias %{{.+}}, [2 x i32]* dereferenceable(8) %{{.+}}, i32* dereferenceable(4) %{{.+}}, [2 x [[S_INT_TY]]]* dereferenceable(8) %{{.+}}, [[S_INT_TY]]* dereferenceable(4) %{{.+}})
188*67e74705SXin Li // CHECK: [[T_VAR_PRIV:%.+]] = alloca i{{[0-9]+}}, align 128
189*67e74705SXin Li // CHECK: [[VEC_PRIV:%.+]] = alloca [2 x i{{[0-9]+}}], align 128
190*67e74705SXin Li // CHECK: [[S_ARR_PRIV:%.+]] = alloca [2 x [[S_INT_TY]]], align 128
191*67e74705SXin Li // CHECK: [[VAR_PRIV:%.+]] = alloca [[S_INT_TY]], align 128
192*67e74705SXin Li // CHECK: store i{{[0-9]+}}* [[GTID_ADDR]], i{{[0-9]+}}** [[GTID_ADDR_ADDR:%.+]],
193*67e74705SXin Li 
194*67e74705SXin Li // CHECK: [[VEC_REF:%.+]] = load [2 x i{{[0-9]+}}]*, [2 x i{{[0-9]+}}]** %
195*67e74705SXin Li // CHECK: [[T_VAR_REF:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** %
196*67e74705SXin Li // CHECK: [[S_ARR_REF:%.+]] = load [2 x [[S_INT_TY]]]*, [2 x [[S_INT_TY]]]** %
197*67e74705SXin Li // CHECK: [[VAR_REF:%.+]] = load [[S_INT_TY]]*, [[S_INT_TY]]** %
198*67e74705SXin Li 
199*67e74705SXin Li // CHECK: [[T_VAR_VAL:%.+]] = load i{{[0-9]+}}, i{{[0-9]+}}* [[T_VAR_REF]], align 128
200*67e74705SXin Li // CHECK: store i{{[0-9]+}} [[T_VAR_VAL]], i{{[0-9]+}}* [[T_VAR_PRIV]], align 128
201*67e74705SXin Li // CHECK: [[VEC_DEST:%.+]] = bitcast [2 x i{{[0-9]+}}]* [[VEC_PRIV]] to i8*
202*67e74705SXin Li // CHECK: [[VEC_SRC:%.+]] = bitcast [2 x i{{[0-9]+}}]* [[VEC_REF]] to i8*
203*67e74705SXin Li // CHECK: call void @llvm.memcpy.{{.+}}(i8* [[VEC_DEST]], i8* [[VEC_SRC]], i{{[0-9]+}} {{[0-9]+}}, i{{[0-9]+}} 128,
204*67e74705SXin Li // CHECK: [[S_ARR_PRIV_BEGIN:%.+]] = getelementptr inbounds [2 x [[S_INT_TY]]], [2 x [[S_INT_TY]]]* [[S_ARR_PRIV]], i{{[0-9]+}} 0, i{{[0-9]+}} 0
205*67e74705SXin Li // CHECK: [[S_ARR_BEGIN:%.+]] = bitcast [2 x [[S_INT_TY]]]* [[S_ARR_REF]] to [[S_INT_TY]]*
206*67e74705SXin Li // CHECK: [[S_ARR_PRIV_END:%.+]] = getelementptr [[S_INT_TY]], [[S_INT_TY]]* [[S_ARR_PRIV_BEGIN]], i{{[0-9]+}} 2
207*67e74705SXin Li // CHECK: [[IS_EMPTY:%.+]] = icmp eq [[S_INT_TY]]* [[S_ARR_PRIV_BEGIN]], [[S_ARR_PRIV_END]]
208*67e74705SXin Li // CHECK: br i1 [[IS_EMPTY]], label %[[S_ARR_BODY_DONE:.+]], label %[[S_ARR_BODY:.+]]
209*67e74705SXin Li // CHECK: [[S_ARR_BODY]]
210*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DEFAULT_CONSTR]]([[ST_TY]]* [[ST_TY_TEMP:%.+]])
211*67e74705SXin Li // CHECK: call {{.*}} [[S_INT_TY_COPY_CONSTR:@.+]]([[S_INT_TY]]* {{.+}}, [[S_INT_TY]]* {{.+}}, [[ST_TY]]* [[ST_TY_TEMP]])
212*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DESTR:@.+]]([[ST_TY]]* [[ST_TY_TEMP]])
213*67e74705SXin Li // CHECK: br i1 {{.+}}, label %{{.+}}, label %[[S_ARR_BODY]]
214*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DEFAULT_CONSTR]]([[ST_TY]]* [[ST_TY_TEMP:%.+]])
215*67e74705SXin Li // CHECK: call {{.*}} [[S_INT_TY_COPY_CONSTR]]([[S_INT_TY]]* [[VAR_PRIV]], [[S_INT_TY]]* {{.*}} [[VAR_REF]], [[ST_TY]]* [[ST_TY_TEMP]])
216*67e74705SXin Li // CHECK: call {{.*}} [[ST_TY_DESTR]]([[ST_TY]]* [[ST_TY_TEMP]])
217*67e74705SXin Li // CHECK-DAG: call {{.*}} [[S_INT_TY_DESTR:@.+]]([[S_INT_TY]]* [[VAR_PRIV]])
218*67e74705SXin Li // CHECK-DAG: call {{.*}} [[S_INT_TY_DESTR]]([[S_INT_TY]]*
219*67e74705SXin Li // CHECK: ret void
220*67e74705SXin Li 
221*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OFFLOADING_3:@.+]](
222*67e74705SXin Li // CHECK: call {{.*}}void (%{{.+}}*, i{{[0-9]+}}, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)*, ...) @__kmpc_fork_teams(%{{.+}}* @{{.+}}, i{{[0-9]+}} 1, void (i{{[0-9]+}}*, i{{[0-9]+}}*, ...)* bitcast (void (i{{[0-9]+}}*, i{{[0-9]+}}*, i{{[0-9]+}}*)* [[OMP_OUTLINED_3:@.+]] to void
223*67e74705SXin Li // CHECK: ret
224*67e74705SXin Li 
225*67e74705SXin Li // CHECK: define internal {{.*}}void [[OMP_OUTLINED_3]](i{{[0-9]+}}* noalias [[GTID_ADDR:%.+]], i{{[0-9]+}}* noalias %{{.+}}, i32* dereferenceable(4) [[T_VAR:%.+]])
226*67e74705SXin Li // CHECK: [[T_VAR_LOC:%.+]] = alloca i{{[0-9]+}},
227*67e74705SXin Li // CHECK: store i{{[0-9]+}}* [[T_VAR]], i{{[0-9]+}}** [[T_VAR_ADDR:%.+]],
228*67e74705SXin Li // CHECK: [[T_VAR_REF:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** [[T_VAR_ADDR]],
229*67e74705SXin Li // CHECK: [[T_VAR_VAL:%.+]] = load i{{[0-9]+}}, i{{[0-9]+}}* [[T_VAR_REF]],
230*67e74705SXin Li // CHECK: store i{{[0-9]+}} [[T_VAR_VAL]], i{{[0-9]+}}* [[T_VAR_LOC]],
231*67e74705SXin Li // CHECK: ret
232*67e74705SXin Li 
233*67e74705SXin Li #else
// Variant of St compiled only when the ARRAY macro is defined. It adds a
// member function that applies firstprivate to an array parameter and to
// variable-length arrays.
234*67e74705SXin Li struct St {
235*67e74705SXin Li   int a, b;
StSt236*67e74705SXin Li   St() : a(0), b(0) {}
  // User-provided copy constructor with no member initializers and an empty
  // body, so a and b are not copied from the source object.
StSt237*67e74705SXin Li   St(const St &) { }
~StSt238*67e74705SXin Li   ~St() {}
  // s and vla1 are array-typed parameters (vla1's bound is the parameter n);
  // vla2 is a local n-by-n variable-length array with aligned(128).
  // All three are firstprivate on the single statement under the pragmas.
St_funcSt239*67e74705SXin Li   void St_func(St s[2], int n, long double vla1[n]) {
240*67e74705SXin Li     double vla2[n][n] __attribute__((aligned(128)));
241*67e74705SXin Li     a = b;
242*67e74705SXin Li     #pragma omp target
243*67e74705SXin Li     #pragma omp teams firstprivate(s, vla1, vla2)
244*67e74705SXin Li     vla1[b] = vla2[1][n - 1] = a = b;
245*67e74705SXin Li   }
246*67e74705SXin Li };
247*67e74705SXin Li 
// Free-function counterpart of St::St_func with an extra float array
// parameter. a, s, vla1 and the local VLA vla2 are all firstprivate on the
// call statement under the pragmas. The directives inside the body look for
// pointer-typed allocas for each of them, followed by a stacksave and a
// memcpy with alignment 128.
array_func(float a[3],St s[2],int n,long double vla1[n])248*67e74705SXin Li void array_func(float a[3], St s[2], int n, long double vla1[n]) {
249*67e74705SXin Li   double vla2[n][n] __attribute__((aligned(128)));
250*67e74705SXin Li // ARRAY: call {{.+}} @__kmpc_fork_teams(
251*67e74705SXin Li // ARRAY-DAG: [[PRIV_S:%.+]] = alloca %struct.St*,
252*67e74705SXin Li // ARRAY-64-DAG: [[PRIV_VLA1:%.+]] = alloca ppc_fp128*,
253*67e74705SXin Li // ARRAY-32-DAG: [[PRIV_VLA1:%.+]] = alloca x86_fp80*,
254*67e74705SXin Li // ARRAY-DAG: [[PRIV_A:%.+]] = alloca float*,
255*67e74705SXin Li // ARRAY-DAG: [[PRIV_VLA2:%.+]] = alloca double*,
256*67e74705SXin Li // ARRAY-DAG: store float* %{{.+}}, float** [[PRIV_A]],
257*67e74705SXin Li // ARRAY-DAG: store %struct.St* %{{.+}}, %struct.St** [[PRIV_S]],
258*67e74705SXin Li // ARRAY-64-DAG: store ppc_fp128* %{{.+}}, ppc_fp128** [[PRIV_VLA1]],
259*67e74705SXin Li // ARRAY-32-DAG: store x86_fp80* %{{.+}}, x86_fp80** [[PRIV_VLA1]],
260*67e74705SXin Li // ARRAY-DAG: store double* %{{.+}}, double** [[PRIV_VLA2]],
261*67e74705SXin Li // ARRAY: call i8* @llvm.stacksave()
262*67e74705SXin Li // ARRAY: [[SIZE:%.+]] = mul nuw i{{[0-9]+}} %{{.+}}, 8
263*67e74705SXin Li // ARRAY: call void @llvm.memcpy.p0i8.p0i8.i{{[0-9]+}}(i8* %{{.+}}, i8* %{{.+}}, i{{[0-9]+}} [[SIZE]], i32 128, i1 false)
264*67e74705SXin Li   #pragma omp target
265*67e74705SXin Li   #pragma omp teams firstprivate(a, s, vla1, vla2)
266*67e74705SXin Li   s[0].St_func(s, n, vla1);
  // The lone semicolon below is a separate empty statement after the region.
267*67e74705SXin Li   ;
268*67e74705SXin Li }
269*67e74705SXin Li 
270*67e74705SXin Li // ARRAY: @__kmpc_fork_teams(
271*67e74705SXin Li // ARRAY-DAG: [[PRIV_S:%.+]] = alloca %struct.St*,
272*67e74705SXin Li // ARRAY-64-DAG: [[PRIV_VLA1:%.+]] = alloca ppc_fp128*,
273*67e74705SXin Li // ARRAY-32-DAG: [[PRIV_VLA1:%.+]] = alloca x86_fp80*,
274*67e74705SXin Li // ARRAY-DAG: [[PRIV_VLA2:%.+]] = alloca double*,
275*67e74705SXin Li // ARRAY-DAG: store %struct.St* %{{.+}}, %struct.St** [[PRIV_S]],
276*67e74705SXin Li // ARRAY-64-DAG: store ppc_fp128* %{{.+}}, ppc_fp128** [[PRIV_VLA1]],
277*67e74705SXin Li // ARRAY-32-DAG: store x86_fp80* %{{.+}}, x86_fp80** [[PRIV_VLA1]],
278*67e74705SXin Li // ARRAY-DAG: store double* %{{.+}}, double** [[PRIV_VLA2]],
279*67e74705SXin Li // ARRAY: call i8* @llvm.stacksave()
280*67e74705SXin Li // ARRAY: [[SIZE:%.+]] = mul nuw i{{[0-9]+}} %{{.+}}, 8
281*67e74705SXin Li // ARRAY: call void @llvm.memcpy.p0i8.p0i8.i{{[0-9]+}}(i8* %{{.+}}, i8* %{{.+}}, i{{[0-9]+}} [[SIZE]], i32 128, i1 false)
282*67e74705SXin Li #endif
283*67e74705SXin Li #endif
284