2019-04-17 12:52:47 +08:00
|
|
|
; RUN: opt < %s -jump-threading -S | FileCheck %s
|
|
|
|
|
|
|
|
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:128:128"
|
|
|
|
target triple = "i386-apple-darwin7"
|
|
|
|
|
|
|
|
declare void @use(i32 *)
|
|
|
|
|
|
|
|
; Check that we propagate nonnull to dominated loads, when we find an available
|
|
|
|
; loaded value.
|
|
|
|
; CHECK-LABEL: @test1(
|
|
|
|
; CHECK-LABEL: ret1:
|
|
|
|
; CHECK-NEXT: %[[p1:.*]] = load i32*, i32** %ptr
|
|
|
|
; CHECK-NOT: !nonnull
|
|
|
|
; CHECK-NEXT: store i32 1, i32* %[[p1]]
|
|
|
|
; CHECK-NEXT: tail call void @use(i32* null)
|
|
|
|
; CHECK-NEXT: ret void
|
|
|
|
|
|
|
|
; CHECK-LABEL: ret2:
|
|
|
|
; CHECK-NEXT: %[[p2:.*]] = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
; CHECK: tail call void @use(i32* %[[p2]])
|
|
|
|
; CHECK-NEXT: ret void
|
|
|
|
define void @test1(i32** %ptr, i1 %c) {
|
|
|
|
br i1 %c, label %d1, label %d2
|
|
|
|
|
|
|
|
d1:
|
|
|
|
%p1 = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d2:
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d3:
|
|
|
|
%pm = phi i32* [ null, %d2 ], [ %p1, %d1 ]
|
|
|
|
%p2 = load i32*, i32** %ptr
|
|
|
|
store i32 1, i32* %p2
|
|
|
|
%c2 = icmp eq i32* %pm, null
|
|
|
|
br i1 %c2, label %ret1, label %ret2
|
|
|
|
|
|
|
|
ret1:
|
|
|
|
tail call void @use(i32* %pm) nounwind
|
|
|
|
ret void
|
|
|
|
|
|
|
|
ret2:
|
|
|
|
tail call void @use(i32* %pm) nounwind
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Check that we propagate nonnull to dominated loads, when we find an available
|
|
|
|
; loaded value.
|
|
|
|
; CHECK-LABEL: @test2(
|
|
|
|
; CHECK-LABEL: d3.thread:
|
|
|
|
; CHECK-NEXT: %[[p1:.*]] = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
; CHECK-NEXT: store i32 1, i32* %[[p1]]
|
|
|
|
; CHECK-NEXT: br label %ret1
|
|
|
|
|
|
|
|
; CHECK-LABEL: d3:
|
|
|
|
; CHECK-NEXT: %[[p_cmp:.*]] = load i32*, i32** %ptr
|
|
|
|
; CHECK-NEXT: %[[p2:.*]] = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
; CHECK-NEXT: store i32 1, i32* %[[p2]]
|
|
|
|
; CHECK-NEXT: icmp eq i32* %[[p_cmp]], null
|
|
|
|
define void @test2(i32** %ptr, i1 %c) {
|
|
|
|
br i1 %c, label %d1, label %d2
|
|
|
|
|
|
|
|
d1:
|
|
|
|
%p1 = load i32*, i32** %ptr
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d2:
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d3:
|
|
|
|
%pm = phi i32* [ null, %d2 ], [ %p1, %d1 ]
|
|
|
|
%p2 = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
store i32 1, i32* %p2
|
|
|
|
%c2 = icmp eq i32* %pm, null
|
|
|
|
br i1 %c2, label %ret1, label %ret2
|
|
|
|
|
|
|
|
ret1:
|
|
|
|
tail call void @use(i32* %pm) nounwind
|
|
|
|
ret void
|
|
|
|
|
|
|
|
ret2:
|
|
|
|
tail call void @use(i32* %pm) nounwind
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Check that we do not propagate nonnull to loads predecessors that are combined
|
|
|
|
; to a PHI node.
|
|
|
|
; CHECK-LABEL: @test3(
|
|
|
|
; CHECK-LABEL: d1:
|
|
|
|
; CHECK-NEXT: %[[p1:.*]] = load i32*, i32** %ptr
|
|
|
|
; CHECK-NOT: !nonnull
|
|
|
|
|
|
|
|
; CHECK-LABEL: d2:
|
|
|
|
; CHECK-NEXT: %[[p2:.*]] = load i32*, i32** %ptr
|
|
|
|
; CHECK-NOT: !nonnull
|
|
|
|
|
|
|
|
; CHECK-LABEL: d3:
|
|
|
|
; CHECK-NEXT: phi i32* [ %[[p2]], %d2 ], [ %[[p1]], %d1 ]
|
|
|
|
define void @test3(i32** %ptr) {
|
|
|
|
d1:
|
|
|
|
%x = load i32*, i32** %ptr, !nonnull !0
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d2:
|
|
|
|
br label %d3
|
|
|
|
|
|
|
|
d3:
|
|
|
|
%y = load i32*, i32** %ptr
|
|
|
|
store i32 1, i32* %y
|
Reapply [LVI] Normalize pointer behavior
This is a rebase of the change over D70376, which fixes an LVI cache
invalidation issue that also affected this patch.
-----
Related to D69686. As noted there, LVI currently behaves differently
for integer and pointer values: For integers, the block value is always
valid inside the basic block, while for pointers it is only valid at
the end of the basic block. I believe the integer behavior is the
correct one, and CVP relies on it via its getConstantRange() uses.
The reason for the special pointer behavior is that LVI checks whether
a pointer is dereferenced in a given basic block and marks it as
non-null in that case. Of course, this information is valid only after
the dereferencing instruction, or in conservative approximation,
at the end of the block.
This patch changes the treatment of dereferencability: Instead of
including it inside the block value, we instead treat it as something
similar to an assume (it essentially is a non-nullness assume) and
incorporate this information in intersectAssumeOrGuardBlockValueConstantRange()
if the context instruction is the terminator of the basic block.
This happens either when determining an edge-value internally in LVI,
or when a terminator was explicitly passed to getValueAt(). The latter
case makes this change not fully NFC, because we can now fold
terminator icmps based on the dereferencability information in the
same block. This is the reason why I changed one JumpThreading test
(it would optimize the condition away without the change).
Of course, we do not want to recompute dereferencability on each
intersectAssume call, so we need a new cache for this. The
dereferencability analysis requires walking the entire basic block
and computing underlying objects of all memory operands. This was
previously done separately for each queried pointer value. In the
new implementation (both because this makes the caching simpler,
and because it is faster), I instead only walk the full BB once and
cache all the dereferenced pointers. So the traversal is now performed
only once per BB, instead of once per queried pointer value.
I think the overall model now makes more sense than before, and there
will be no more pitfalls due to differing integer/pointer behavior.
Differential Revision: https://reviews.llvm.org/D69914
2019-12-05 03:51:31 +08:00
|
|
|
%c2 = icmp eq i32* %y, @p
|
2019-04-17 12:52:47 +08:00
|
|
|
br i1 %c2, label %ret1, label %ret2
|
|
|
|
|
|
|
|
ret1:
|
|
|
|
ret void
|
|
|
|
|
|
|
|
ret2:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
Reapply [LVI] Normalize pointer behavior
This is a rebase of the change over D70376, which fixes an LVI cache
invalidation issue that also affected this patch.
-----
Related to D69686. As noted there, LVI currently behaves differently
for integer and pointer values: For integers, the block value is always
valid inside the basic block, while for pointers it is only valid at
the end of the basic block. I believe the integer behavior is the
correct one, and CVP relies on it via its getConstantRange() uses.
The reason for the special pointer behavior is that LVI checks whether
a pointer is dereferenced in a given basic block and marks it as
non-null in that case. Of course, this information is valid only after
the dereferencing instruction, or in conservative approximation,
at the end of the block.
This patch changes the treatment of dereferencability: Instead of
including it inside the block value, we instead treat it as something
similar to an assume (it essentially is a non-nullness assume) and
incorporate this information in intersectAssumeOrGuardBlockValueConstantRange()
if the context instruction is the terminator of the basic block.
This happens either when determining an edge-value internally in LVI,
or when a terminator was explicitly passed to getValueAt(). The latter
case makes this change not fully NFC, because we can now fold
terminator icmps based on the dereferencability information in the
same block. This is the reason why I changed one JumpThreading test
(it would optimize the condition away without the change).
Of course, we do not want to recompute dereferencability on each
intersectAssume call, so we need a new cache for this. The
dereferencability analysis requires walking the entire basic block
and computing underlying objects of all memory operands. This was
previously done separately for each queried pointer value. In the
new implementation (both because this makes the caching simpler,
and because it is faster), I instead only walk the full BB once and
cache all the dereferenced pointers. So the traversal is now performed
only once per BB, instead of once per queried pointer value.
I think the overall model now makes more sense than before, and there
will be no more pitfalls due to differing integer/pointer behavior.
Differential Revision: https://reviews.llvm.org/D69914
2019-12-05 03:51:31 +08:00
|
|
|
@p = external global i32
|
2019-04-17 12:52:47 +08:00
|
|
|
|
|
|
|
!0 = !{}
|