xref: /aosp_15_r20/external/llvm/test/Transforms/InstCombine/stack-overalign.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: opt < %s -instcombine -S | grep "align 32" | count 1
2*9880d681SAndroid Build Coastguard Worker
3*9880d681SAndroid Build Coastguard Worker; It's tempting to have an instcombine in which the src pointer of a
4*9880d681SAndroid Build Coastguard Worker; memcpy is aligned up to the alignment of the destination, however
5*9880d681SAndroid Build Coastguard Worker; there are pitfalls. If the src is an alloca, aligning it beyond what
6*9880d681SAndroid Build Coastguard Worker; the target's stack pointer is aligned to will require dynamic
7*9880d681SAndroid Build Coastguard Worker; stack realignment, which can force functions that don't otherwise
8*9880d681SAndroid Build Coastguard Worker; need a frame pointer to use one.
9*9880d681SAndroid Build Coastguard Worker;
10*9880d681SAndroid Build Coastguard Worker; Abstaining from this transform is not the only way to approach this
11*9880d681SAndroid Build Coastguard Worker; issue. Some late phase could be smart enough to reduce alloca
12*9880d681SAndroid Build Coastguard Worker; alignments when they are greater than they need to be. Or, codegen
13*9880d681SAndroid Build Coastguard Worker; could do dynamic alignment for just the one alloca, and leave the
14*9880d681SAndroid Build Coastguard Worker; main stack pointer at its standard alignment.
15*9880d681SAndroid Build Coastguard Worker
; Destination of the memcpy in @foo: 1024 zero-initialized bytes with an
; explicit alignment of 32. This is the only "align 32" in the input, and the
; RUN line requires the optimized output to contain that text exactly once.
16*9880d681SAndroid Build Coastguard Worker@dst = global [1024 x i8] zeroinitializer, align 32
17*9880d681SAndroid Build Coastguard Worker
; @foo copies 1024 bytes from a byte-aligned stack buffer into @dst and then
; passes the buffer to @frob. Because the RUN line counts exactly one
; "align 32" in the output (the one on @dst), the test fails if instcombine
; introduces "align 32" anywhere in this function, e.g. on the alloca.
18*9880d681SAndroid Build Coastguard Workerdefine void @foo() nounwind {
19*9880d681SAndroid Build Coastguard Workerentry:
; 1024-byte stack buffer, explicitly aligned to 1.
20*9880d681SAndroid Build Coastguard Worker  %src = alloca [1024 x i8], align 1
; i8* to the first byte of %src (indices 0, 0).
21*9880d681SAndroid Build Coastguard Worker  %src1 = getelementptr [1024 x i8], [1024 x i8]* %src, i32 0, i32 0
; Copy 1024 bytes from %src into @dst. In this five-operand memcpy form the
; fourth operand (i32 1) is the alignment and the last (i1 false) is the
; volatile flag.
22*9880d681SAndroid Build Coastguard Worker  call void @llvm.memcpy.p0i8.p0i8.i32(i8* getelementptr inbounds ([1024 x i8], [1024 x i8]* @dst, i32 0, i32 0), i8* %src1, i32 1024, i32 1, i1 false)
; Pass the buffer to @frob, which is only declared (no body) in this file.
; NOTE(review): presumably this keeps %src from being optimized away - confirm.
23*9880d681SAndroid Build Coastguard Worker  call void @frob(i8* %src1) nounwind
24*9880d681SAndroid Build Coastguard Worker  ret void
25*9880d681SAndroid Build Coastguard Worker}
26*9880d681SAndroid Build Coastguard Worker
; External function taking an i8*; no body is provided in this file. @foo
; calls it with a pointer to its stack buffer.
27*9880d681SAndroid Build Coastguard Workerdeclare void @frob(i8*)
28*9880d681SAndroid Build Coastguard Worker
; Declaration of the memcpy intrinsic used by @foo. Operands in order:
; destination i8*, source i8*, i32 byte count, i32 alignment, i1 volatile flag.
29*9880d681SAndroid Build Coastguard Workerdeclare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i32, i1) nounwind
30