forked from OSchip/llvm-project
Fix a somewhat surprising miscompile where code relying on an ABI
alignment could lose it because the alloca's type was rewritten to one with a much smaller alignment guarantee. Now SROA will actively compute a proper alignment, factoring in the target data, any explicit alignment, and the offset within the struct. This will in some cases lower the alignment requirements, but when the computed alignment is no greater than the ABI alignment of the new type, we drop the explicit alignment entirely to give the code generator the freedom to align it however is convenient. Thanks to Duncan for the lovely test case that pinned this down. =] llvm-svn: 164891
This commit is contained in:
parent
fb9d30dd64
commit
903790eff5
|
@ -3002,9 +3002,19 @@ bool SROA::rewriteAllocaPartition(AllocaInst &AI,
|
|||
assert(PI == P.begin() && "Begin offset is zero on later partition");
|
||||
NewAI = &AI;
|
||||
} else {
|
||||
// FIXME: The alignment here is overly conservative -- we could in many
|
||||
// cases get away with much weaker alignment constraints.
|
||||
NewAI = new AllocaInst(AllocaTy, 0, AI.getAlignment(),
|
||||
unsigned Alignment = AI.getAlignment();
|
||||
if (!Alignment) {
|
||||
// The minimum alignment which users can rely on when the explicit
|
||||
// alignment is omitted or zero is that required by the ABI for this
|
||||
// type.
|
||||
Alignment = TD->getABITypeAlignment(AI.getAllocatedType());
|
||||
}
|
||||
Alignment = MinAlign(Alignment, PI->BeginOffset);
|
||||
// If we will get at least this much alignment from the type alone, leave
|
||||
// the alloca's alignment unconstrained.
|
||||
if (Alignment <= TD->getABITypeAlignment(AllocaTy))
|
||||
Alignment = 0;
|
||||
NewAI = new AllocaInst(AllocaTy, 0, Alignment,
|
||||
AI.getName() + ".sroa." + Twine(PI - P.begin()),
|
||||
&AI);
|
||||
++NumNewAllocas;
|
||||
|
|
|
@ -30,7 +30,7 @@ entry:
|
|||
|
||||
define void @test2() {
|
||||
; CHECK: @test2
|
||||
; CHECK: alloca i16, align 2
|
||||
; CHECK: alloca i16
|
||||
; CHECK: load i8* %{{.*}}, align 1
|
||||
; CHECK: store i8 42, i8* %{{.*}}, align 1
|
||||
; CHECK: ret void
|
||||
|
@ -62,3 +62,24 @@ entry:
|
|||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %bptr, i8* %aaptr, i32 16, i32 2, i1 false)
|
||||
ret void
|
||||
}
|
||||
|
||||
define void @test3(i8* %x) {
|
||||
; Test that when we promote an alloca to a type with lower ABI alignment, we
|
||||
; provide the needed explicit alignment that code using the alloca may be
|
||||
; expecting. However, also check that any offset within an alloca can in turn
|
||||
; reduce the alignment.
|
||||
; CHECK: @test3
|
||||
; CHECK: alloca [22 x i8], align 8
|
||||
; CHECK: alloca [18 x i8], align 2
|
||||
; CHECK: ret void
|
||||
|
||||
entry:
|
||||
%a = alloca { i8*, i8*, i8* }
|
||||
%b = alloca { i8*, i8*, i8* }
|
||||
%a_raw = bitcast { i8*, i8*, i8* }* %a to i8*
|
||||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %a_raw, i8* %x, i32 22, i32 8, i1 false)
|
||||
%b_raw = bitcast { i8*, i8*, i8* }* %b to i8*
|
||||
%b_gep = getelementptr i8* %b_raw, i32 6
|
||||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %b_gep, i8* %x, i32 18, i32 2, i1 false)
|
||||
ret void
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue