; Source: /aosp_15_r20/external/llvm/test/CodeGen/NVPTX/local-stack-frame.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s --check-prefix=PTX32
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s --check-prefix=PTX64

; Ensure we access the local stack properly

; foo: volatile store of the i32 argument into a single 4-byte stack slot.
; Expected PTX (both pointer widths): the local depot address is loaded into
; %SPL, converted with cvta.local into %SP, the parameter is loaded, and the
; volatile store is issued through [%SP+0].
; The label checks below pin the remaining checks to foo's own PTX body.
;
; PTX32-LABEL: foo(
; PTX32:        mov.u32          %SPL, __local_depot{{[0-9]+}};
; PTX32:        cvta.local.u32   %SP, %SPL;
; PTX32:        ld.param.u32     %r{{[0-9]+}}, [foo_param_0];
; PTX32:        st.volatile.u32  [%SP+0], %r{{[0-9]+}};
; PTX64-LABEL: foo(
; PTX64:        mov.u64          %SPL, __local_depot{{[0-9]+}};
; PTX64:        cvta.local.u64   %SP, %SPL;
; PTX64:        ld.param.u32     %r{{[0-9]+}}, [foo_param_0];
; PTX64:        st.volatile.u32  [%SP+0], %r{{[0-9]+}};
define void @foo(i32 %a) {
  %local = alloca i32, align 4
  store volatile i32 %a, i32* %local
  ret void
}

; foo2: stores the i32 argument into a stack slot, then passes the slot's
; address to the external function @bar. foo2 is the function named by the
; "kernel" entry in this file's !nvvm.annotations metadata.
; Expected PTX: %SPL and %SP are both set up, but the store itself is a
; st.local through a register computed as %SPL + 0. SP_REG captures that
; register number so the store is checked against the same register.
; The label checks below pin the remaining checks to foo2's own PTX body.
;
; PTX32-LABEL: foo2(
; PTX32:        mov.u32          %SPL, __local_depot{{[0-9]+}};
; PTX32:        cvta.local.u32   %SP, %SPL;
; PTX32:        ld.param.u32     %r{{[0-9]+}}, [foo2_param_0];
; PTX32:        add.u32          %r[[SP_REG:[0-9]+]], %SPL, 0;
; PTX32:        st.local.u32  [%r[[SP_REG]]], %r{{[0-9]+}};
; PTX64-LABEL: foo2(
; PTX64:        mov.u64          %SPL, __local_depot{{[0-9]+}};
; PTX64:        cvta.local.u64   %SP, %SPL;
; PTX64:        ld.param.u32     %r{{[0-9]+}}, [foo2_param_0];
; PTX64:        add.u64          %rd[[SP_REG:[0-9]+]], %SPL, 0;
; PTX64:        st.local.u32  [%rd[[SP_REG]]], %r{{[0-9]+}};
define void @foo2(i32 %a) {
  %local = alloca i32, align 4
  store i32 %a, i32* %local
  call void @bar(i32* %local)
  ret void
}

; External function with no body in this file; foo2 and foo4 call it with the
; address of one of their stack slots.
declare void @bar(i32* %a)

; NVVM annotation list: the single entry tags @foo2 with the "kernel"
; property (value 1).
!nvvm.annotations = !{!0}
!0 = !{void (i32)* @foo2, !"kernel", i32 1}

; foo3: stores the i32 argument into a [3 x i32] stack array at an index that
; is itself the argument value (a run-time index).
; Expected PTX: %SPL is set up, and no cvta.local conversion into %SP appears
; between that setup and the parameter load. The store is a st.local through
; a register computed from %SPL + 0.
; The label checks below pin the checks, including the -NOT checks, to foo3's
; own PTX body.
;
; PTX32-LABEL: foo3(
; PTX32:        mov.u32          %SPL, __local_depot{{[0-9]+}};
; PTX32-NOT:    cvta.local.u32   %SP, %SPL;
; PTX32:        ld.param.u32     %r{{[0-9]+}}, [foo3_param_0];
; PTX32:        add.u32          %r{{[0-9]+}}, %SPL, 0;
; PTX32:        st.local.u32  [%r{{[0-9]+}}], %r{{[0-9]+}};
; PTX64-LABEL: foo3(
; PTX64:        mov.u64          %SPL, __local_depot{{[0-9]+}};
; PTX64-NOT:    cvta.local.u64   %SP, %SPL;
; PTX64:        ld.param.u32     %r{{[0-9]+}}, [foo3_param_0];
; PTX64:        add.u64          %rd{{[0-9]+}}, %SPL, 0;
; PTX64:        st.local.u32  [%rd{{[0-9]+}}], %r{{[0-9]+}};
define void @foo3(i32 %a) {
  %local = alloca [3 x i32], align 4
  %1 = bitcast [3 x i32]* %local to i32*
  %2 = getelementptr inbounds i32, i32* %1, i32 %a
  store i32 %a, i32* %2
  ret void
}

; foo4: two i32 stack slots, each zero-initialised and then passed by address
; to the external function @bar.
; Expected PTX: after the cvta.local conversion, addresses are formed from
; both %SP and %SPL at offsets 0 and 4 (one pair per slot), and both
; zero-stores are emitted as st.local.
; The label checks below pin the remaining checks to foo4's own PTX body;
; the first check here is a bare cvta.local with no function-specific operand.
;
; PTX32-LABEL: foo4(
; PTX32:        cvta.local.u32   %SP, %SPL;
; PTX32:        add.u32          {{%r[0-9]+}}, %SP, 0;
; PTX32:        add.u32          {{%r[0-9]+}}, %SPL, 0;
; PTX32:        add.u32          {{%r[0-9]+}}, %SP, 4;
; PTX32:        add.u32          {{%r[0-9]+}}, %SPL, 4;
; PTX32:        st.local.u32     [{{%r[0-9]+}}], {{%r[0-9]+}}
; PTX32:        st.local.u32     [{{%r[0-9]+}}], {{%r[0-9]+}}
; PTX64-LABEL: foo4(
; PTX64:        cvta.local.u64   %SP, %SPL;
; PTX64:        add.u64          {{%rd[0-9]+}}, %SP, 0;
; PTX64:        add.u64          {{%rd[0-9]+}}, %SPL, 0;
; PTX64:        add.u64          {{%rd[0-9]+}}, %SP, 4;
; PTX64:        add.u64          {{%rd[0-9]+}}, %SPL, 4;
; PTX64:        st.local.u32     [{{%rd[0-9]+}}], {{%r[0-9]+}}
; PTX64:        st.local.u32     [{{%rd[0-9]+}}], {{%r[0-9]+}}
define void @foo4() {
  %A = alloca i32
  %B = alloca i32
  store i32 0, i32* %A
  store i32 0, i32* %B
  call void @bar(i32* %A)
  call void @bar(i32* %B)
  ret void
}