2016-04-26 04:54:08 +08:00
|
|
|
; RUN: llc -verify-machineinstrs -mtriple=aarch64-linux-gnueabi < %s | FileCheck %s
|
[AArch64] Optimize compare and branch sequence when the compare's constant operand is power of 2
Summary:
Peephole optimization that generates a single TBZ/TBNZ instruction
for test and branch sequences like in the example below. This handles
the cases that miss folding of AND into TBZ/TBNZ during ISelLowering of BR_CC
Examples:
and w8, w8, #0x400
cbnz w8, L1
to
tbnz w8, #10, L1
Reviewers: MatzeB, jmolloy, mcrosier, t.p.northover
Subscribers: aemerson, rengolin, mcrosier, llvm-commits
Differential Revision: http://reviews.llvm.org/D17942
llvm-svn: 263136
2016-03-11 01:54:55 +08:00
|
|
|
|
|
|
|
; CHECK-LABEL: test1
|
|
|
|
; CHECK: tbz {{w[0-9]}}, #3, {{.LBB0_3}}
|
2016-04-26 04:54:08 +08:00
|
|
|
; CHECK: tbz w[[REG1:[0-9]+]], #2, {{.LBB0_3}}
|
|
|
|
; CHECK-NOT: and [[REG2:x[0-9]+]], x[[REG1]], #0x4
|
2016-03-11 03:07:50 +08:00
|
|
|
; CHECK-NOT: cbz [[REG2]], {{.LBB0_3}}
|
[AArch64] Optimize compare and branch sequence when the compare's constant operand is power of 2
Summary:
Peephole optimization that generates a single TBZ/TBNZ instruction
for test and branch sequences like in the example below. This handles
the cases that miss folding of AND into TBZ/TBNZ during ISelLowering of BR_CC
Examples:
and w8, w8, #0x400
cbnz w8, L1
to
tbnz w8, #10, L1
Reviewers: MatzeB, jmolloy, mcrosier, t.p.northover
Subscribers: aemerson, rengolin, mcrosier, llvm-commits
Differential Revision: http://reviews.llvm.org/D17942
llvm-svn: 263136
2016-03-11 01:54:55 +08:00
|
|
|
|
|
|
|
; CHECK: b
|
|
|
|
define void @test1(i64 %A, i64 %B) {
|
|
|
|
entry:
|
|
|
|
%and = and i64 %A, 4
|
|
|
|
%notlhs = icmp eq i64 %and, 0
|
|
|
|
%and.1 = and i64 %B, 8
|
|
|
|
%0 = icmp eq i64 %and.1, 0
|
|
|
|
%1 = or i1 %0, %notlhs
|
|
|
|
br i1 %1, label %if.end3, label %if.then2
|
|
|
|
|
|
|
|
if.then2: ; preds = %entry
|
|
|
|
tail call void @foo(i64 %A, i64 %B)
|
|
|
|
br label %if.end3
|
|
|
|
|
|
|
|
if.end3: ; preds = %if.then2, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; CHECK-LABEL: test2
|
|
|
|
; CHECK: cbz {{x[0-9]}}, {{.LBB1_3}}
|
2016-04-26 04:54:08 +08:00
|
|
|
; CHECK: tbz w[[REG1:[0-9]+]], #3, {{.LBB1_3}}
|
|
|
|
; CHECK-NOT: and [REG2:x[0-9]+], x[[REG1]], #0x08
|
2016-03-11 03:07:50 +08:00
|
|
|
; CHECK-NOT: cbz [[REG2]], {{.LBB1_3}}
|
[AArch64] Optimize compare and branch sequence when the compare's constant operand is power of 2
Summary:
Peephole optimization that generates a single TBZ/TBNZ instruction
for test and branch sequences like in the example below. This handles
the cases that miss folding of AND into TBZ/TBNZ during ISelLowering of BR_CC
Examples:
and w8, w8, #0x400
cbnz w8, L1
to
tbnz w8, #10, L1
Reviewers: MatzeB, jmolloy, mcrosier, t.p.northover
Subscribers: aemerson, rengolin, mcrosier, llvm-commits
Differential Revision: http://reviews.llvm.org/D17942
llvm-svn: 263136
2016-03-11 01:54:55 +08:00
|
|
|
|
|
|
|
define void @test2(i64 %A, i64* readonly %B) #0 {
|
|
|
|
entry:
|
|
|
|
%tobool = icmp eq i64* %B, null
|
|
|
|
%and = and i64 %A, 8
|
|
|
|
%tobool1 = icmp eq i64 %and, 0
|
|
|
|
%or.cond = or i1 %tobool, %tobool1
|
|
|
|
br i1 %or.cond, label %if.end3, label %if.then2
|
|
|
|
|
|
|
|
if.then2: ; preds = %entry
|
|
|
|
%0 = load i64, i64* %B, align 4
|
|
|
|
tail call void @foo(i64 %A, i64 %0)
|
|
|
|
br label %if.end3
|
|
|
|
|
|
|
|
if.end3: ; preds = %entry, %if.then2
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-04-26 04:54:08 +08:00
|
|
|
; Make sure we use the W variant when log2(mask) is < 32.
|
|
|
|
; CHECK-LABEL: test3
|
|
|
|
; CHECK: tbz {{w[0-9]}}, #3, {{.LBB2_3}}
|
|
|
|
; CHECK: tbz w[[REG1:[0-9]+]], #28, {{.LBB2_3}}
|
|
|
|
; CHECK-NOT: and [[REG2:x[0-9]+]], x[[REG1]]
|
|
|
|
; CHECK-NOT: cbz [[REG2]], {{.LBB2_3}}
|
|
|
|
define void @test3(i64 %A, i64 %B) {
|
|
|
|
entry:
|
|
|
|
%shift = shl i64 1, 28
|
|
|
|
%and = and i64 %A, %shift
|
|
|
|
%notlhs = icmp eq i64 %and, 0
|
|
|
|
%and.1 = and i64 %B, 8
|
|
|
|
%0 = icmp eq i64 %and.1, 0
|
|
|
|
%1 = or i1 %0, %notlhs
|
|
|
|
br i1 %1, label %if.then2, label %if.end3
|
|
|
|
|
|
|
|
if.then2: ; preds = %entry
|
|
|
|
tail call void @foo(i64 %A, i64 %B)
|
|
|
|
br label %if.end3
|
|
|
|
|
|
|
|
if.end3: ; preds = %if.then2, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; CHECK-LABEL: test4
|
|
|
|
; CHECK: tbz {{w[0-9]}}, #3, {{.LBB3_3}}
|
|
|
|
; CHECK: tbz [[REG1:x[0-9]+]], #35, {{.LBB3_3}}
|
|
|
|
; CHECK-NOT: and [[REG2:x[0-9]+]], x[[REG1]]
|
|
|
|
; CHECK-NOT: cbz [[REG2]], {{.LBB2_3}}
|
|
|
|
define void @test4(i64 %A, i64 %B) {
|
|
|
|
entry:
|
|
|
|
%shift = shl i64 1, 35
|
|
|
|
%and = and i64 %A, %shift
|
|
|
|
%notlhs = icmp eq i64 %and, 0
|
|
|
|
%and.1 = and i64 %B, 8
|
|
|
|
%0 = icmp eq i64 %and.1, 0
|
|
|
|
%1 = or i1 %0, %notlhs
|
|
|
|
br i1 %1, label %if.then2, label %if.end3
|
|
|
|
|
|
|
|
if.then2: ; preds = %entry
|
|
|
|
tail call void @foo(i64 %A, i64 %B)
|
|
|
|
br label %if.end3
|
|
|
|
|
|
|
|
if.end3: ; preds = %if.then2, %entry
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
[AArch64] Optimize compare and branch sequence when the compare's constant operand is power of 2
Summary:
Peephole optimization that generates a single TBZ/TBNZ instruction
for test and branch sequences like in the example below. This handles
the cases that miss folding of AND into TBZ/TBNZ during ISelLowering of BR_CC
Examples:
and w8, w8, #0x400
cbnz w8, L1
to
tbnz w8, #10, L1
Reviewers: MatzeB, jmolloy, mcrosier, t.p.northover
Subscribers: aemerson, rengolin, mcrosier, llvm-commits
Differential Revision: http://reviews.llvm.org/D17942
llvm-svn: 263136
2016-03-11 01:54:55 +08:00
|
|
|
|
|
|
|
declare void @foo(i64, i64)
|