[Hexagon] Implement MI-level constant propagation

llvm-svn: 277028
This commit is contained in:
Krzysztof Parzyszek 2016-07-28 20:01:59 +00:00
parent b7c72717c9
commit 167d918225
13 changed files with 3402 additions and 2 deletions

View File

@ -21,6 +21,7 @@ add_llvm_target(HexagonCodeGen
HexagonBranchRelaxation.cpp
HexagonCFGOptimizer.cpp
HexagonCommonGEP.cpp
HexagonConstPropagation.cpp
HexagonCopyToCombine.cpp
HexagonEarlyIfConv.cpp
HexagonExpandCondsets.cpp

File diff suppressed because it is too large Load Diff

View File

@ -42,6 +42,9 @@ static cl::opt<bool> DisableHexagonCFGOpt("disable-hexagon-cfgopt",
cl::Hidden, cl::ZeroOrMore, cl::init(false),
cl::desc("Disable Hexagon CFG Optimization"));
static cl::opt<bool> DisableHCP("disable-hcp", cl::init(false), cl::Hidden,
cl::ZeroOrMore, cl::desc("Disable Hexagon constant propagation"));
static cl::opt<bool> DisableStoreWidening("disable-store-widen",
cl::Hidden, cl::init(false), cl::desc("Disable store widening"));
@ -111,6 +114,7 @@ namespace llvm {
FunctionPass *createHexagonCallFrameInformation();
FunctionPass *createHexagonCFGOptimizer();
FunctionPass *createHexagonCommonGEP();
FunctionPass *createHexagonConstPropagationPass();
FunctionPass *createHexagonCopyToCombine();
FunctionPass *createHexagonEarlyIfConversion();
FunctionPass *createHexagonExpandCondsets();
@ -263,6 +267,11 @@ bool HexagonPassConfig::addInstSelector() {
addPass(createHexagonBitSimplify(), false);
addPass(createHexagonPeephole());
printAndVerify("After hexagon peephole pass");
// Constant propagation.
if (!DisableHCP) {
addPass(createHexagonConstPropagationPass(), false);
addPass(&UnreachableMachineBlockElimID, false);
}
if (EnableGenInsert)
addPass(createHexagonGenInsert(), false);
if (EnableEarlyIf)

View File

@ -0,0 +1,23 @@
; RUN: llc -mcpu=hexagonv5 < %s
; REQUIRES: asserts
target datalayout = "e-m:e-p:32:32-i1:32-i64:64-a:0-v32:32-n16:32"
target triple = "hexagon-unknown--elf"
; Function Attrs: nounwind readnone
define i64 @foo() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S2.clbp(i64 291)
%1 = tail call i64 @llvm.hexagon.A4.combineir(i32 0, i32 %0)
ret i64 %1
}
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.S2.clbp(i64) #1
; Function Attrs: nounwind readnone
declare i64 @llvm.hexagon.A4.combineir(i32, i32) #1
attributes #0 = { nounwind readnone "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #1 = { nounwind readnone }

View File

@ -0,0 +1,27 @@
; RUN: llc -O2 -march=hexagon < %s | FileCheck %s --check-prefix=CHECK-TEST1
; RUN: llc -O2 -march=hexagon < %s | FileCheck %s --check-prefix=CHECK-TEST2
; RUN: llc -O2 -march=hexagon < %s | FileCheck %s --check-prefix=CHECK-TEST3
define i32 @main() #0 {
entry:
%l = alloca [7 x i32], align 8
%p_arrayidx45 = bitcast [7 x i32]* %l to i32*
%vector_ptr = bitcast [7 x i32]* %l to <2 x i32>*
store <2 x i32> <i32 3, i32 -2>, <2 x i32>* %vector_ptr, align 8
%p_arrayidx.1 = getelementptr [7 x i32], [7 x i32]* %l, i32 0, i32 2
%vector_ptr.1 = bitcast i32* %p_arrayidx.1 to <2 x i32>*
store <2 x i32> <i32 -4, i32 6>, <2 x i32>* %vector_ptr.1, align 8
%p_arrayidx.2 = getelementptr [7 x i32], [7 x i32]* %l, i32 0, i32 4
%vector_ptr.2 = bitcast i32* %p_arrayidx.2 to <2 x i32>*
store <2 x i32> <i32 -8, i32 -10>, <2 x i32>* %vector_ptr.2, align 8
ret i32 0
}
; The instructions seem to be in a different order in the .s file than
; the corresponding values in the .ll file, so just run the test three
; times and each time test for a different instruction.
; CHECK-TEST1: combine(#-2, #3)
; CHECK-TEST2: combine(#6, #-4)
; CHECK-TEST3: combine(#-10, #-8)
attributes #0 = { "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-frame-pointer-elim-non-leaf"="true" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "unsafe-fp-math"="false" "use-soft-float"="false" }

View File

@ -0,0 +1,26 @@
; RUN: llc < %s
; REQUIRES: asserts
target datalayout = "e-m:e-p:32:32-i1:32-i64:64-a:0-v32:32-n16:32"
target triple = "hexagon-unknown--elf"
; Function Attrs: nounwind readnone
define i64 @foo() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S2.ct0p(i64 18)
%1 = tail call i32 @llvm.hexagon.S2.ct1p(i64 27)
%2 = tail call i64 @llvm.hexagon.A2.combinew(i32 %0, i32 %1)
ret i64 %2
}
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.S2.ct0p(i64) #0
; Function Attrs: nounwind readnone
declare i32 @llvm.hexagon.S2.ct1p(i64) #0
; Function Attrs: nounwind readnone
declare i64 @llvm.hexagon.A2.combinew(i32, i32) #0
attributes #0 = { nounwind readnone }

View File

@ -0,0 +1,31 @@
; Expect the constant propagation to evaluate signed and unsigned bit extract.
; RUN: llc -march=hexagon -O2 < %s | FileCheck %s
target triple = "hexagon"
@x = common global i32 0, align 4
@y = common global i32 0, align 4
define void @foo() #0 {
entry:
; extractu(0x000ABCD0, 16, 4)
; should evaluate to 0xABCD (dec 43981)
%0 = call i32 @llvm.hexagon.S2.extractu(i32 703696, i32 16, i32 4)
; CHECK: 43981
; CHECK-NOT: extractu
store i32 %0, i32* @x, align 4
; extract(0x000ABCD0, 16, 4)
; should evaluate to 0xFFFFABCD (dec 4294945741 or -21555)
%1 = call i32 @llvm.hexagon.S4.extract(i32 703696, i32 16, i32 4)
; CHECK: -21555
; CHECK-NOT: extract
store i32 %1, i32* @y, align 4
ret void
}
declare i32 @llvm.hexagon.S2.extractu(i32, i32, i32) #1
declare i32 @llvm.hexagon.S4.extract(i32, i32, i32) #1
attributes #0 = { nounwind "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf"="true" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #1 = { nounwind readnone }

View File

@ -0,0 +1,21 @@
; RUN: llc -O2 -march hexagon < %s
target datalayout = "e-p:32:32:32-i64:64:64-i32:32:32-i16:16:16-i1:32:32-f64:64:64-f32:32:32-v64:64:64-v32:32:32-a0:0-n16:32"
target triple = "hexagon"
define signext i16 @foo(i16 signext %var1, i16 signext %var2) #0 {
entry:
%0 = or i16 %var2, %var1
%1 = icmp slt i16 %0, 0
%cmp8 = icmp sgt i16 %var1, %var2
%or.cond19 = or i1 %1, %cmp8
br i1 %or.cond19, label %return, label %if.end
if.end: ; preds = %entry
br label %return
return: ; preds = %if.end, %if.end15, %entry
%retval.0.reg2mem.0 = phi i16 [ 0, %entry ], [ 32767, %if.end ]
ret i16 %retval.0.reg2mem.0
}
attributes #0 = { nounwind readnone "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-frame-pointer-elim-non-leaf"="true" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "unsafe-fp-math"="false" "use-soft-float"="false" }

View File

@ -0,0 +1,17 @@
; RUN: llc -O2 -march hexagon < %s | FileCheck %s
define i32 @foo(i32 %x) {
%p = icmp eq i32 %x, 0
br i1 %p, label %zero, label %nonzero
nonzero:
%v1 = add i32 %x, 1
%c = icmp eq i32 %x, %v1
; This branch will be rewritten by HCP. A bug would cause both branches to
; go away, leaving no path to "ret -1".
br i1 %c, label %zero, label %other
zero:
ret i32 0
other:
; CHECK: -1
ret i32 -1
}

View File

@ -0,0 +1,19 @@
; RUN: llc -march=hexagon < %s | FileCheck %s
; CHECK: cmp
; Make sure that the result is not a compile-time constant.
define i64 @foo(i32 %x) {
entry:
%c = icmp slt i32 %x, 17
br i1 %c, label %b1, label %b2
b1:
br label %b2
b2:
%p = phi i32 [ 1, %entry ], [ 0, %b1 ]
%q = sub i32 %x, %x
%y = zext i32 %q to i64
%u = shl i64 %y, 32
%v = zext i32 %p to i64
%w = or i64 %u, %v
ret i64 %w
}

View File

@ -0,0 +1,18 @@
; RUN: llc < %s
; REQUIRES: asserts
target datalayout = "e-m:e-p:32:32-i1:32-i64:64-a:0-v32:32-n16:32"
target triple = "hexagon"
; Function Attrs: nounwind readnone
define i64 @foo() #0 {
entry:
%0 = tail call i32 @llvm.hexagon.S2.vsplatrb(i32 255)
%conv = zext i32 %0 to i64
%shl = shl nuw i64 %conv, 32
%or = or i64 %shl, %conv
ret i64 %or
}
declare i32 @llvm.hexagon.S2.vsplatrb(i32) #0
attributes #0 = { nounwind readnone }

View File

@ -1,4 +1,4 @@
; RUN: llc -march=hexagon < %s | FileCheck %s
; RUN: llc -march=hexagon -disable-hcp < %s | FileCheck %s
; Make sure we build the constant vector <7, 7, 7, 7> with a vsplatb.
; CHECK: vsplatb
@B = common global [400 x i8] zeroinitializer, align 8

View File

@ -1,4 +1,4 @@
; RUN: llc -march=hexagon < %s | FileCheck %s
; RUN: llc -march=hexagon -disable-hcp < %s | FileCheck %s
; Make sure we build the constant vector <7, 7, 7, 7> with a vsplath.
; CHECK: vsplath
@B = common global [400 x i16] zeroinitializer, align 8