2018-07-30 19:52:08 +08:00
|
|
|
; RUN: opt < %s -phi-values -basicaa -aa-eval -print-all-alias-modref-info -disable-output 2>&1 | FileCheck %s
|
|
|
|
; RUN: opt < %s -aa-pipeline=basic-aa -passes='require<phi-values>,aa-eval' -print-all-alias-modref-info -disable-output 2>&1 | FileCheck %s
|
2014-01-02 11:31:36 +08:00
|
|
|
; Target description for this test: the layout string declares 64-bit
; pointers (p:64:64:64) and the triple names x86-64 Linux.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
|
|
|
|
target triple = "x86_64-unknown-linux-gnu"
|
|
|
|
|
2009-10-14 06:02:20 +08:00
|
|
|
; rdar://7282591
|
|
|
|
|
2009-10-14 09:45:10 +08:00
|
|
|
; Three separate i32 globals, each with a zero initializer. @foo feeds @X and
; @Y into a phi and queries it against @Z; @loop_phi_chain seeds its phi chain
; with @X and queries it against @Y.
@X = common global i32 0
|
|
|
|
@Y = common global i32 0
|
|
|
|
@Z = common global i32 0
|
2009-10-14 06:02:20 +08:00
|
|
|
|
2014-01-02 11:31:36 +08:00
|
|
|
; CHECK-LABEL: foo
|
2012-04-24 17:15:38 +08:00
|
|
|
; CHECK: NoAlias: i32* %P, i32* @Z
|
|
|
|
|
2010-11-12 05:08:46 +08:00
|
|
|
; @foo: branches on %cond, merges @X / @Y into the phi %P, and stores through
; %P in between two loads of @Z. The expectation above the function is that
; %P and @Z are reported as not aliasing.
define void @foo(i32 %cond) nounwind {
|
2009-10-14 06:02:20 +08:00
|
|
|
entry:
|
2009-10-14 09:45:10 +08:00
|
|
|
; Placeholder value; nothing in this function uses it.
%"alloca point" = bitcast i32 0 to i32
|
|
|
|
; Take %bb when %cond is non-zero, %bb1 otherwise.
%tmp = icmp ne i32 %cond, 0
|
|
|
|
br i1 %tmp, label %bb, label %bb1
|
2009-10-14 06:02:20 +08:00
|
|
|
|
2009-10-14 09:45:10 +08:00
|
|
|
bb:
|
|
|
|
br label %bb2
|
2009-10-14 06:02:20 +08:00
|
|
|
|
2009-10-14 09:45:10 +08:00
|
|
|
bb1:
|
|
|
|
br label %bb2
|
2009-10-14 06:02:20 +08:00
|
|
|
|
2009-10-14 09:45:10 +08:00
|
|
|
bb2:
|
|
|
|
; %P is @X when control arrives from %bb and @Y when it arrives from %bb1;
; @Z is never one of its incoming values.
%P = phi i32* [ @X, %bb ], [ @Y, %bb1 ]
|
2015-02-28 05:17:42 +08:00
|
|
|
; First read of @Z, before the store through %P.
%tmp1 = load i32, i32* @Z, align 4
|
2009-10-14 09:45:10 +08:00
|
|
|
store i32 123, i32* %P, align 4
|
2015-02-28 05:17:42 +08:00
|
|
|
; Second read of @Z, after the store through %P.
%tmp2 = load i32, i32* @Z, align 4
|
2009-10-14 09:45:10 +08:00
|
|
|
br label %return
|
2009-10-14 06:02:20 +08:00
|
|
|
|
2009-10-14 09:45:10 +08:00
|
|
|
return:
|
2009-10-14 06:02:20 +08:00
|
|
|
ret void
|
|
|
|
}
|
2014-01-02 11:31:36 +08:00
|
|
|
|
|
|
|
; Pointers can vary in between iterations of loops.
|
|
|
|
; PR18068
|
|
|
|
|
|
|
|
; CHECK-LABEL: pr18068
|
|
|
|
; CHECK: MayAlias: i32* %0, i32* %arrayidx5
|
[BasicAA] Fix the handling of sext and zext in the analysis of GEPs.
Hopefully this will end the GEPs saga!
This commit reverts r245394, i.e., it reapplies r221876 while incorporating the
fixes from D11847.
r221876 was not reapplied alone because it was not safe and D11847 was not
applied alone because it needs r221876 to produce correct results.
This should fix PR24596.
Original commit message for r221876:
Let's try this again...
This reverts r219432, plus a bug fix.
Description of the bug in r219432 (by Nick):
The bug was using AllPositive to break out of the loop; if the loop break
condition i != e is changed to i != e && AllPositive then the
test_modulo_analysis_with_global test I've added will fail as the Modulo will
be calculated incorrectly (as the last loop iteration is skipped, so Modulo
isn't updated with its Scale).
Nick also adds this comment:
ComputeSignBit is safe to use in loops as it takes into account phi nodes, and
the == EK_ZeroEx check is safe in loops as, no matter how the variable changes
between iterations, zero-extensions will always guarantee a zero sign bit. The
isValueEqualInPotentialCycles check is therefore definitely not needed as all
the variable analysis holds no matter how the variables change between loop
iterations.
And this patch also adds another enhancement to GetLinearExpression - basically
to convert ConstantInts to Offsets (see test_const_eval and
test_const_eval_scaled for the situations this improves).
Original commit message:
This reverts r218944, which reverted r218714, plus a bug fix.
Description of the bug in r218714 (by Nick):
The original patch forgot to check if the Scale in VariableGEPIndex flipped the
sign of the variable. The BasicAA pass iterates over the instructions in the
order they appear in the function, and so BasicAliasAnalysis::aliasGEP is
called with the variable it first comes across as parameter GEP1. Adding a
%reorder label puts the definition of %a after %b so aliasGEP is called with %b
as the first parameter and %a as the second. aliasGEP later calculates that %a
== %b + 1 - %idxprom where %idxprom >= 0 (if %a was passed as the first
parameter it would calculate %b == %a - 1 + %idxprom where %idxprom >= 0) -
ignoring that %idxprom is scaled by -1 here led the patch to incorrectly
conclude that %a > %b.
Revised patch by Nick White, thanks! Thanks to Lang for isolating the bug.
Slightly modified by me to add an early exit from the loop and avoid
unnecessary, but expensive, function calls.
Original commit message:
Two related things:
1. Fixes a bug when calculating the offset in GetLinearExpression. The code
previously used zext to extend the offset, so negative offsets were converted
to large positive ones.
2. Enhance aliasGEP to deduce that, if the difference between two GEP
allocations is positive and all the variables that govern the offset are also
positive (i.e. the offset is strictly after the higher base pointer), then
locations that fit in the gap between the two base pointers are NoAlias.
Patch by Nick White!
Message from D11847:
Un-revert of r241981 and fix for PR23626. The 'Or' case of GetLinearExpression
delegates to 'Add' if possible, and if not it returns an Opaque value.
Unfortunately the Scale and Offsets weren't being set (and so defaulted to 0) -
and a scale of zero effectively removes the variable from the GEP instruction.
This meant that BasicAA would return MustAliases when it should have been
returning PartialAliases (and PR23626 was an example of the GVN pass using an
incorrect MustAlias to merge loads from what should have been different
pointers).
Differential Revision: http://reviews.llvm.org/D11847
Patch by Nick White <n.j.white@gmail.com>!
llvm-svn: 246502
2015-09-01 06:32:47 +08:00
|
|
|
; CHECK: NoAlias: i32* %arrayidx13, i32* %arrayidx5
|
2014-01-02 11:31:36 +08:00
|
|
|
|
|
|
|
; @pr18068: a loop whose phi %0 carries a pointer into %oa5 from one iteration
; to the next. The index used to form that pointer is derived from a value
; reloaded from %jj7 on every iteration, so the carried pointer and the
; current iteration's %arrayidx5 may refer to the same element.
define i32 @pr18068(i32* %jj7, i32* %j) {
|
|
|
|
entry:
|
|
|
|
; Function-local array of 100 i32 elements that both GEPs below index into.
%oa5 = alloca [100 x i32], align 16
|
|
|
|
br label %codeRepl
|
|
|
|
|
|
|
|
|
codeRepl:
|
|
|
|
; %0 is %j on the first entry and the %arrayidx13 computed by the previous
; trip through %for.body on the back edge.
%0 = phi i32* [ %arrayidx13, %for.body ], [ %j, %entry ]
|
|
|
|
; The loop continues into %for.body while @cond returns true, else exits to %bye.
%targetBlock = call i1 @cond(i32* %jj7)
|
|
|
|
br i1 %targetBlock, label %for.body, label %bye
|
|
|
|
|
|
|
|
|
for.body:
|
2015-02-28 05:17:42 +08:00
|
|
|
; %1 is read from %jj7 afresh on each iteration; @inc(%jj7) is called at the
; end of the body, before the next read.
%1 = load i32, i32* %jj7, align 4
|
2014-01-02 11:31:36 +08:00
|
|
|
%idxprom4 = zext i32 %1 to i64
|
[opaque pointer type] Add textual IR support for explicit type parameter to getelementptr instruction
One of several parallel first steps to remove the target type of pointers,
replacing them with a single opaque pointer type.
This adds an explicit type parameter to the gep instruction so that when the
first parameter becomes an opaque pointer type, the type to gep through is
still available to the instructions.
* This doesn't modify gep operators, only instructions (operators will be
handled separately)
* Textual IR changes only. Bitcode (including upgrade) and changing the
in-memory representation will be in separate changes.
* geps of vectors are transformed as:
getelementptr <4 x float*> %x, ...
->getelementptr float, <4 x float*> %x, ...
Then, once the opaque pointer type is introduced, this will ultimately look
like:
getelementptr float, <4 x ptr> %x
with the unambiguous interpretation that it is a vector of pointers to float.
* address spaces remain on the pointer, not the type:
getelementptr float addrspace(1)* %x
->getelementptr float, float addrspace(1)* %x
Then, eventually:
getelementptr float, ptr addrspace(1) %x
Importantly, the massive amount of test case churn has been automated by
same crappy python code. I had to manually update a few test cases that
wouldn't fit the script's model (r228970,r229196,r229197,r229198). The
python script just massages stdin and writes the result to stdout, I
then wrapped that in a shell script to handle replacing files, then
using the usual find+xargs to migrate all the files.
update.py:
import fileinput
import sys
import re
ibrep = re.compile(r"(^.*?[^%\w]getelementptr inbounds )(((?:<\d* x )?)(.*?)(| addrspace\(\d\)) *\*(|>)(?:$| *(?:%|@|null|undef|blockaddress|getelementptr|addrspacecast|bitcast|inttoptr|\[\[[a-zA-Z]|\{\{).*$))")
normrep = re.compile( r"(^.*?[^%\w]getelementptr )(((?:<\d* x )?)(.*?)(| addrspace\(\d\)) *\*(|>)(?:$| *(?:%|@|null|undef|blockaddress|getelementptr|addrspacecast|bitcast|inttoptr|\[\[[a-zA-Z]|\{\{).*$))")
def conv(match, line):
if not match:
return line
line = match.groups()[0]
if len(match.groups()[5]) == 0:
line += match.groups()[2]
line += match.groups()[3]
line += ", "
line += match.groups()[1]
line += "\n"
return line
for line in sys.stdin:
if line.find("getelementptr ") == line.find("getelementptr inbounds"):
if line.find("getelementptr inbounds") != line.find("getelementptr inbounds ("):
line = conv(re.match(ibrep, line), line)
elif line.find("getelementptr ") != line.find("getelementptr ("):
line = conv(re.match(normrep, line), line)
sys.stdout.write(line)
apply.sh:
for name in "$@"
do
python3 `dirname "$0"`/update.py < "$name" > "$name.tmp" && mv "$name.tmp" "$name"
rm -f "$name.tmp"
done
The actual commands:
From llvm/src:
find test/ -name *.ll | xargs ./apply.sh
From llvm/src/tools/clang:
find test/ -name *.mm -o -name *.m -o -name *.cpp -o -name *.c | xargs -I '{}' ../../apply.sh "{}"
From llvm/src/tools/polly:
find test/ -name *.ll | xargs ./apply.sh
After that, check-all (with llvm, clang, clang-tools-extra, lld,
compiler-rt, and polly all checked out).
The extra 'rm' in the apply.sh script is due to a few files in clang's test
suite using interesting unicode stuff that my python script was throwing
exceptions on. None of those files needed to be migrated, so it seemed
sufficient to ignore those cases.
Reviewers: rafael, dexonsmith, grosser
Differential Revision: http://reviews.llvm.org/D7636
llvm-svn: 230786
2015-02-28 03:29:02 +08:00
|
|
|
; %arrayidx5 = &%oa5[zext(%1)] for this iteration's %1.
%arrayidx5 = getelementptr inbounds [100 x i32], [100 x i32]* %oa5, i64 0, i64 %idxprom4
|
2015-02-28 05:17:42 +08:00
|
|
|
%2 = load i32, i32* %arrayidx5, align 4
|
2014-01-02 11:31:36 +08:00
|
|
|
%sub6 = sub i32 %2, 6
|
|
|
|
store i32 %sub6, i32* %arrayidx5, align 4
|
|
|
|
; %0 and %arrayidx5 can alias! It is not safe to DSE the above store.
|
2015-02-28 05:17:42 +08:00
|
|
|
%3 = load i32, i32* %0, align 4
|
2014-01-02 11:31:36 +08:00
|
|
|
store i32 %3, i32* %arrayidx5, align 4
|
|
|
|
; Index for the pointer handed to the next iteration: this iteration's %1
; minus one, zero-extended to i64.
%sub11 = add i32 %1, -1
|
|
|
|
%idxprom12 = zext i32 %sub11 to i64
|
[opaque pointer type] Add textual IR support for explicit type parameter to getelementptr instruction
One of several parallel first steps to remove the target type of pointers,
replacing them with a single opaque pointer type.
This adds an explicit type parameter to the gep instruction so that when the
first parameter becomes an opaque pointer type, the type to gep through is
still available to the instructions.
* This doesn't modify gep operators, only instructions (operators will be
handled separately)
* Textual IR changes only. Bitcode (including upgrade) and changing the
in-memory representation will be in separate changes.
* geps of vectors are transformed as:
getelementptr <4 x float*> %x, ...
->getelementptr float, <4 x float*> %x, ...
Then, once the opaque pointer type is introduced, this will ultimately look
like:
getelementptr float, <4 x ptr> %x
with the unambiguous interpretation that it is a vector of pointers to float.
* address spaces remain on the pointer, not the type:
getelementptr float addrspace(1)* %x
->getelementptr float, float addrspace(1)* %x
Then, eventually:
getelementptr float, ptr addrspace(1) %x
Importantly, the massive amount of test case churn has been automated by
same crappy python code. I had to manually update a few test cases that
wouldn't fit the script's model (r228970,r229196,r229197,r229198). The
python script just massages stdin and writes the result to stdout, I
then wrapped that in a shell script to handle replacing files, then
using the usual find+xargs to migrate all the files.
update.py:
import fileinput
import sys
import re
ibrep = re.compile(r"(^.*?[^%\w]getelementptr inbounds )(((?:<\d* x )?)(.*?)(| addrspace\(\d\)) *\*(|>)(?:$| *(?:%|@|null|undef|blockaddress|getelementptr|addrspacecast|bitcast|inttoptr|\[\[[a-zA-Z]|\{\{).*$))")
normrep = re.compile( r"(^.*?[^%\w]getelementptr )(((?:<\d* x )?)(.*?)(| addrspace\(\d\)) *\*(|>)(?:$| *(?:%|@|null|undef|blockaddress|getelementptr|addrspacecast|bitcast|inttoptr|\[\[[a-zA-Z]|\{\{).*$))")
def conv(match, line):
if not match:
return line
line = match.groups()[0]
if len(match.groups()[5]) == 0:
line += match.groups()[2]
line += match.groups()[3]
line += ", "
line += match.groups()[1]
line += "\n"
return line
for line in sys.stdin:
if line.find("getelementptr ") == line.find("getelementptr inbounds"):
if line.find("getelementptr inbounds") != line.find("getelementptr inbounds ("):
line = conv(re.match(ibrep, line), line)
elif line.find("getelementptr ") != line.find("getelementptr ("):
line = conv(re.match(normrep, line), line)
sys.stdout.write(line)
apply.sh:
for name in "$@"
do
python3 `dirname "$0"`/update.py < "$name" > "$name.tmp" && mv "$name.tmp" "$name"
rm -f "$name.tmp"
done
The actual commands:
From llvm/src:
find test/ -name *.ll | xargs ./apply.sh
From llvm/src/tools/clang:
find test/ -name *.mm -o -name *.m -o -name *.cpp -o -name *.c | xargs -I '{}' ../../apply.sh "{}"
From llvm/src/tools/polly:
find test/ -name *.ll | xargs ./apply.sh
After that, check-all (with llvm, clang, clang-tools-extra, lld,
compiler-rt, and polly all checked out).
The extra 'rm' in the apply.sh script is due to a few files in clang's test
suite using interesting unicode stuff that my python script was throwing
exceptions on. None of those files needed to be migrated, so it seemed
sufficient to ignore those cases.
Reviewers: rafael, dexonsmith, grosser
Differential Revision: http://reviews.llvm.org/D7636
llvm-svn: 230786
2015-02-28 03:29:02 +08:00
|
|
|
; %arrayidx13 = &%oa5[zext(%1 - 1)]; it becomes %0 on the next iteration.
%arrayidx13 = getelementptr inbounds [100 x i32], [100 x i32]* %oa5, i64 0, i64 %idxprom12
|
2014-01-02 11:31:36 +08:00
|
|
|
call void @inc(i32* %jj7)
|
|
|
|
br label %codeRepl
|
|
|
|
|
|
|
|
|
bye:
|
2015-02-28 05:17:42 +08:00
|
|
|
; The function returns whatever %jj7 holds once the loop has exited.
%.reload = load i32, i32* %jj7, align 4
|
2014-01-02 11:31:36 +08:00
|
|
|
ret i32 %.reload
|
|
|
|
}
|
|
|
|
|
|
|
|
; Declarations only. @pr18068 calls @cond(%jj7) to decide whether to run
; another loop iteration and calls @inc(%jj7) at the end of each iteration.
declare i1 @cond(i32*)
|
|
|
|
|
|
|
|
|
declare void @inc(i32*)
|
|
|
|
|
|
|
|
|
2018-07-30 19:52:08 +08:00
|
|
|
; When we have a chain of phis in nested loops we should recognise if there's
|
|
|
|
; actually only one underlying value.
|
|
|
|
; CHECK-LABEL: loop_phi_chain
|
|
|
|
; CHECK: NoAlias: i32* %val1, i32* @Y
|
|
|
|
; CHECK: NoAlias: i32* %val2, i32* @Y
|
|
|
|
; CHECK: NoAlias: i32* %val3, i32* @Y
|
|
|
|
; @loop_phi_chain: three nested loops (%loop1 > %loop2 > %loop3), each with a
; counter phi and a pointer phi. The only non-phi value entering the pointer
; phi chain %val1 -> %val2 -> %val3 is @X. The parameters %a, %b and %c are
; not used by the body.
define void @loop_phi_chain(i32 %a, i32 %b, i32 %c) {
|
|
|
|
entry:
|
|
|
|
br label %loop1
|
|
|
|
|
|
|
|
|
loop1:
|
|
|
|
%n1 = phi i32 [ 0, %entry ], [ %add1, %loop2 ]
|
|
|
|
; %val1 starts as @X and is otherwise fed from the inner loop's %val2.
%val1 = phi i32* [ @X, %entry ], [ %val2, %loop2 ]
|
|
|
|
%add1 = add i32 %n1, 1
|
|
|
|
; Enter %loop2 while %n1 != 32; leave to %end once it equals 32.
%cmp1 = icmp ne i32 %n1, 32
|
|
|
|
br i1 %cmp1, label %loop2, label %end
|
|
|
|
|
|
|
|
|
loop2:
|
|
|
|
%n2 = phi i32 [ 0, %loop1 ], [ %add2, %loop3 ]
|
|
|
|
; %val2 comes from %val1 (outer loop) or %val3 (innermost loop).
%val2 = phi i32* [ %val1, %loop1 ], [ %val3, %loop3 ]
|
|
|
|
%add2 = add i32 %n2, 1
|
|
|
|
; Enter %loop3 while %n2 != 32; otherwise go back to %loop1.
%cmp2 = icmp ne i32 %n2, 32
|
|
|
|
br i1 %cmp2, label %loop3, label %loop1
|
|
|
|
|
|
|
|
|
loop3:
|
|
|
|
%n3 = phi i32 [ 0, %loop2 ], [ %add3, %loop3 ]
|
|
|
|
; %val3 comes from %val2 or from itself on the self back edge.
%val3 = phi i32* [ %val2, %loop2 ], [ %val3, %loop3 ]
|
|
|
|
; Two stores: one through the phi chain, one directly to @Y.
store i32 0, i32* %val3, align 4
|
|
|
|
store i32 0, i32* @Y, align 4
|
|
|
|
%add3 = add i32 %n3, 1
|
|
|
|
; Repeat %loop3 while %n3 != 32; otherwise go back to %loop2.
%cmp3 = icmp ne i32 %n3, 32
|
|
|
|
br i1 %cmp3, label %loop3, label %loop2
|
|
|
|
|
|
|
|
|
end:
|
|
|
|
ret void
|
|
|
|
}
|