forked from OSchip/llvm-project
Fix GVN creating bitcast between address spaces
llvm-svn: 193710
This commit is contained in:
parent
04d88fba3e
commit
614ea99da7
|
@ -1088,14 +1088,15 @@ static int AnalyzeLoadFromClobberingMemInst(Type *LoadTy, Value *LoadPtr,
|
||||||
if (Offset == -1)
|
if (Offset == -1)
|
||||||
return Offset;
|
return Offset;
|
||||||
|
|
||||||
|
unsigned AS = Src->getType()->getPointerAddressSpace();
|
||||||
// Otherwise, see if we can constant fold a load from the constant with the
|
// Otherwise, see if we can constant fold a load from the constant with the
|
||||||
// offset applied as appropriate.
|
// offset applied as appropriate.
|
||||||
Src = ConstantExpr::getBitCast(Src,
|
Src = ConstantExpr::getBitCast(Src,
|
||||||
llvm::Type::getInt8PtrTy(Src->getContext()));
|
Type::getInt8PtrTy(Src->getContext(), AS));
|
||||||
Constant *OffsetCst =
|
Constant *OffsetCst =
|
||||||
ConstantInt::get(Type::getInt64Ty(Src->getContext()), (unsigned)Offset);
|
ConstantInt::get(Type::getInt64Ty(Src->getContext()), (unsigned)Offset);
|
||||||
Src = ConstantExpr::getGetElementPtr(Src, OffsetCst);
|
Src = ConstantExpr::getGetElementPtr(Src, OffsetCst);
|
||||||
Src = ConstantExpr::getBitCast(Src, PointerType::getUnqual(LoadTy));
|
Src = ConstantExpr::getBitCast(Src, PointerType::get(LoadTy, AS));
|
||||||
if (ConstantFoldLoadFromConstPtr(Src, &TD))
|
if (ConstantFoldLoadFromConstPtr(Src, &TD))
|
||||||
return Offset;
|
return Offset;
|
||||||
return -1;
|
return -1;
|
||||||
|
@ -1247,15 +1248,16 @@ static Value *GetMemInstValueForLoad(MemIntrinsic *SrcInst, unsigned Offset,
|
||||||
// Otherwise, this is a memcpy/memmove from a constant global.
|
// Otherwise, this is a memcpy/memmove from a constant global.
|
||||||
MemTransferInst *MTI = cast<MemTransferInst>(SrcInst);
|
MemTransferInst *MTI = cast<MemTransferInst>(SrcInst);
|
||||||
Constant *Src = cast<Constant>(MTI->getSource());
|
Constant *Src = cast<Constant>(MTI->getSource());
|
||||||
|
unsigned AS = Src->getType()->getPointerAddressSpace();
|
||||||
|
|
||||||
// Otherwise, see if we can constant fold a load from the constant with the
|
// Otherwise, see if we can constant fold a load from the constant with the
|
||||||
// offset applied as appropriate.
|
// offset applied as appropriate.
|
||||||
Src = ConstantExpr::getBitCast(Src,
|
Src = ConstantExpr::getBitCast(Src,
|
||||||
llvm::Type::getInt8PtrTy(Src->getContext()));
|
Type::getInt8PtrTy(Src->getContext(), AS));
|
||||||
Constant *OffsetCst =
|
Constant *OffsetCst =
|
||||||
ConstantInt::get(Type::getInt64Ty(Src->getContext()), (unsigned)Offset);
|
ConstantInt::get(Type::getInt64Ty(Src->getContext()), (unsigned)Offset);
|
||||||
Src = ConstantExpr::getGetElementPtr(Src, OffsetCst);
|
Src = ConstantExpr::getGetElementPtr(Src, OffsetCst);
|
||||||
Src = ConstantExpr::getBitCast(Src, PointerType::getUnqual(LoadTy));
|
Src = ConstantExpr::getBitCast(Src, PointerType::get(LoadTy, AS));
|
||||||
return ConstantFoldLoadFromConstPtr(Src, &TD);
|
return ConstantFoldLoadFromConstPtr(Src, &TD);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -1,5 +1,5 @@
|
||||||
; RUN: opt < %s -default-data-layout="e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-n8:16:32" -basicaa -gvn -S -die | FileCheck %s
|
; RUN: opt < %s -default-data-layout="e-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-n8:16:32" -basicaa -gvn -S -die | FileCheck %s
|
||||||
; RUN: opt < %s -default-data-layout="E-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-n32" -basicaa -gvn -S -die | FileCheck %s
|
; RUN: opt < %s -default-data-layout="E-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-n32" -basicaa -gvn -S -die | FileCheck %s
|
||||||
|
|
||||||
;; Trivial RLE test.
|
;; Trivial RLE test.
|
||||||
define i32 @test0(i32 %V, i32* %P) {
|
define i32 @test0(i32 %V, i32* %P) {
|
||||||
|
@ -195,6 +195,7 @@ Cont:
|
||||||
}
|
}
|
||||||
|
|
||||||
@GCst = constant {i32, float, i32 } { i32 42, float 14., i32 97 }
|
@GCst = constant {i32, float, i32 } { i32 42, float 14., i32 97 }
|
||||||
|
@GCst_as1 = addrspace(1) constant {i32, float, i32 } { i32 42, float 14., i32 97 }
|
||||||
|
|
||||||
; memset -> float forwarding.
|
; memset -> float forwarding.
|
||||||
define float @memcpy_to_float_local(float* %A) nounwind ssp {
|
define float @memcpy_to_float_local(float* %A) nounwind ssp {
|
||||||
|
@ -209,7 +210,18 @@ entry:
|
||||||
; CHECK: ret float 1.400000e+01
|
; CHECK: ret float 1.400000e+01
|
||||||
}
|
}
|
||||||
|
|
||||||
|
; memcpy from address space 1
|
||||||
|
define float @memcpy_to_float_local_as1(float* %A) nounwind ssp {
|
||||||
|
entry:
|
||||||
|
%conv = bitcast float* %A to i8* ; <i8*> [#uses=1]
|
||||||
|
tail call void @llvm.memcpy.p0i8.p1i8.i64(i8* %conv, i8 addrspace(1)* bitcast ({i32, float, i32 } addrspace(1)* @GCst_as1 to i8 addrspace(1)*), i64 12, i32 1, i1 false)
|
||||||
|
%arrayidx = getelementptr inbounds float* %A, i64 1 ; <float*> [#uses=1]
|
||||||
|
%tmp2 = load float* %arrayidx ; <float> [#uses=1]
|
||||||
|
ret float %tmp2
|
||||||
|
; CHECK-LABEL: @memcpy_to_float_local_as1(
|
||||||
|
; CHECK-NOT: load
|
||||||
|
; CHECK: ret float 1.400000e+01
|
||||||
|
}
|
||||||
|
|
||||||
;; non-local i32/float -> i8 load forwarding.
|
;; non-local i32/float -> i8 load forwarding.
|
||||||
define i8 @coerce_mustalias_nonlocal0(i32* %P, i1 %cond) {
|
define i8 @coerce_mustalias_nonlocal0(i32* %P, i1 %cond) {
|
||||||
|
@ -647,6 +659,8 @@ entry:
|
||||||
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind
|
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind
|
||||||
|
|
||||||
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i32, i1) nounwind
|
declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i32, i1) nounwind
|
||||||
|
declare void @llvm.memcpy.p0i8.p1i8.i64(i8* nocapture, i8 addrspace(1)* nocapture, i64, i32, i1) nounwind
|
||||||
|
|
||||||
|
|
||||||
;;===----------------------------------------------------------------------===;;
|
;;===----------------------------------------------------------------------===;;
|
||||||
;; Load -> Store dependency which isn't interfered with by a call that happens
|
;; Load -> Store dependency which isn't interfered with by a call that happens
|
||||||
|
|
Loading…
Reference in New Issue