2018-05-30 02:17:16 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
|
|
; RUN: llc -mtriple=armv7-unknown-linux < %s | FileCheck --check-prefix=CHECK-ARM %s
|
ARM: Better codegen for 64-bit compares.
This introduces a custom lowering for ISD::SETCCE (introduced in r253572)
that allows us to emit a short code sequence for 64-bit compares.
Before:
push {r7, lr}
cmp r0, r2
mov.w r0, #0
mov.w r12, #0
it hs
movhs r0, #1
cmp r1, r3
it ge
movge.w r12, #1
it eq
moveq r12, r0
cmp.w r12, #0
bne .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
After:
push {r7, lr}
subs r0, r0, r2
sbcs.w r0, r1, r3
bge .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
Saves around 80KB in Chromium's libchrome.so.
Some notes on this patch:
- I don't much like the ARMISD::BRCOND and ARMISD::CMOV combines I
introduced (nothing else needs them). However, they are necessary in
order to avoid poor codegen, and they seem similar to existing combines
in other backends (e.g. X86 combines (brcond (cmp (setcc Compare))) to
(brcond Compare)).
- No support for Thumb-1. This is in principle possible, but we'd need
to implement ARMISD::SUBE for Thumb-1.
Differential Revision: http://reviews.llvm.org/D15256
llvm-svn: 263962
2016-03-22 02:00:02 +08:00
|
|
|
; RUN: llc -mtriple=thumbv6-unknown-linux < %s | FileCheck --check-prefix=CHECK-THUMB1 %s
|
2018-05-30 02:17:16 +08:00
|
|
|
; RUN: llc -mtriple=thumbv7-unknown-linux < %s | FileCheck --check-prefix=CHECK-THUMB2 %s
|
ARM: Better codegen for 64-bit compares.
This introduces a custom lowering for ISD::SETCCE (introduced in r253572)
that allows us to emit a short code sequence for 64-bit compares.
Before:
push {r7, lr}
cmp r0, r2
mov.w r0, #0
mov.w r12, #0
it hs
movhs r0, #1
cmp r1, r3
it ge
movge.w r12, #1
it eq
moveq r12, r0
cmp.w r12, #0
bne .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
After:
push {r7, lr}
subs r0, r0, r2
sbcs.w r0, r1, r3
bge .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
Saves around 80KB in Chromium's libchrome.so.
Some notes on this patch:
- I don't much like the ARMISD::BRCOND and ARMISD::CMOV combines I
introduced (nothing else needs them). However, they are necessary in
order to avoid poor codegen, and they seem similar to existing combines
in other backends (e.g. X86 combines (brcond (cmp (setcc Compare))) to
(brcond Compare)).
- No support for Thumb-1. This is in principle possible, but we'd need
to implement ARMISD::SUBE for Thumb-1.
Differential Revision: http://reviews.llvm.org/D15256
llvm-svn: 263962
2016-03-22 02:00:02 +08:00
|
|
|
|
|
|
|
define i32 @test_slt1(i64 %a, i64 %b) {
|
2018-05-30 02:17:16 +08:00
|
|
|
; CHECK-ARM-LABEL: test_slt1:
|
|
|
|
; CHECK-ARM: @ %bb.0: @ %entry
|
|
|
|
; CHECK-ARM-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-ARM-NEXT: mov r12, #2
|
|
|
|
; CHECK-ARM-NEXT: sbcs r0, r1, r3
|
|
|
|
; CHECK-ARM-NEXT: movwlt r12, #1
|
|
|
|
; CHECK-ARM-NEXT: mov r0, r12
|
|
|
|
; CHECK-ARM-NEXT: bx lr
|
|
|
|
;
|
|
|
|
; CHECK-THUMB1-LABEL: test_slt1:
|
|
|
|
; CHECK-THUMB1: @ %bb.0: @ %entry
|
|
|
|
; CHECK-THUMB1-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-THUMB1-NEXT: sbcs r1, r3
|
|
|
|
; CHECK-THUMB1-NEXT: bge .LBB0_2
|
|
|
|
; CHECK-THUMB1-NEXT: @ %bb.1: @ %bb1
|
|
|
|
; CHECK-THUMB1-NEXT: movs r0, #1
|
|
|
|
; CHECK-THUMB1-NEXT: bx lr
|
|
|
|
; CHECK-THUMB1-NEXT: .LBB0_2: @ %bb2
|
|
|
|
; CHECK-THUMB1-NEXT: movs r0, #2
|
|
|
|
; CHECK-THUMB1-NEXT: bx lr
|
|
|
|
;
|
|
|
|
; CHECK-THUMB2-LABEL: test_slt1:
|
|
|
|
; CHECK-THUMB2: @ %bb.0: @ %entry
|
|
|
|
; CHECK-THUMB2-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-THUMB2-NEXT: mov.w r12, #2
|
|
|
|
; CHECK-THUMB2-NEXT: sbcs.w r0, r1, r3
|
|
|
|
; CHECK-THUMB2-NEXT: it lt
|
|
|
|
; CHECK-THUMB2-NEXT: movlt.w r12, #1
|
|
|
|
; CHECK-THUMB2-NEXT: mov r0, r12
|
|
|
|
; CHECK-THUMB2-NEXT: bx lr
|
ARM: Better codegen for 64-bit compares.
This introduces a custom lowering for ISD::SETCCE (introduced in r253572)
that allows us to emit a short code sequence for 64-bit compares.
Before:
push {r7, lr}
cmp r0, r2
mov.w r0, #0
mov.w r12, #0
it hs
movhs r0, #1
cmp r1, r3
it ge
movge.w r12, #1
it eq
moveq r12, r0
cmp.w r12, #0
bne .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
After:
push {r7, lr}
subs r0, r0, r2
sbcs.w r0, r1, r3
bge .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
Saves around 80KB in Chromium's libchrome.so.
Some notes on this patch:
- I don't much like the ARMISD::BRCOND and ARMISD::CMOV combines I
introduced (nothing else needs them). However, they are necessary in
order to avoid poor codegen, and they seem similar to existing combines
in other backends (e.g. X86 combines (brcond (cmp (setcc Compare))) to
(brcond Compare)).
- No support for Thumb-1. This is in principle possible, but we'd need
to implement ARMISD::SUBE for Thumb-1.
Differential Revision: http://reviews.llvm.org/D15256
llvm-svn: 263962
2016-03-22 02:00:02 +08:00
|
|
|
entry:
|
|
|
|
%cmp = icmp slt i64 %a, %b
|
|
|
|
br i1 %cmp, label %bb1, label %bb2
|
|
|
|
bb1:
|
|
|
|
ret i32 1
|
|
|
|
bb2:
|
|
|
|
ret i32 2
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @test_slt2(i64 %a, i64 %b) {
|
2018-05-30 02:17:16 +08:00
|
|
|
; CHECK-ARM-LABEL: test_slt2:
|
|
|
|
; CHECK-ARM: @ %bb.0: @ %entry
|
|
|
|
; CHECK-ARM-NEXT: push {r11, lr}
|
|
|
|
; CHECK-ARM-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-ARM-NEXT: sbcs r0, r1, r3
|
|
|
|
; CHECK-ARM-NEXT: bge .LBB1_2
|
|
|
|
; CHECK-ARM-NEXT: @ %bb.1: @ %bb1
|
|
|
|
; CHECK-ARM-NEXT: bl f
|
|
|
|
; CHECK-ARM-NEXT: pop {r11, pc}
|
|
|
|
; CHECK-ARM-NEXT: .LBB1_2: @ %bb2
|
|
|
|
; CHECK-ARM-NEXT: bl g
|
|
|
|
; CHECK-ARM-NEXT: pop {r11, pc}
|
|
|
|
;
|
|
|
|
; CHECK-THUMB1-LABEL: test_slt2:
|
|
|
|
; CHECK-THUMB1: @ %bb.0: @ %entry
|
|
|
|
; CHECK-THUMB1-NEXT: push {r7, lr}
|
|
|
|
; CHECK-THUMB1-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-THUMB1-NEXT: sbcs r1, r3
|
|
|
|
; CHECK-THUMB1-NEXT: bge .LBB1_2
|
|
|
|
; CHECK-THUMB1-NEXT: @ %bb.1: @ %bb1
|
|
|
|
; CHECK-THUMB1-NEXT: bl f
|
|
|
|
; CHECK-THUMB1-NEXT: pop {r7, pc}
|
|
|
|
; CHECK-THUMB1-NEXT: .LBB1_2: @ %bb2
|
|
|
|
; CHECK-THUMB1-NEXT: bl g
|
|
|
|
; CHECK-THUMB1-NEXT: pop {r7, pc}
|
|
|
|
;
|
|
|
|
; CHECK-THUMB2-LABEL: test_slt2:
|
|
|
|
; CHECK-THUMB2: @ %bb.0: @ %entry
|
|
|
|
; CHECK-THUMB2-NEXT: push {r7, lr}
|
|
|
|
; CHECK-THUMB2-NEXT: subs r0, r0, r2
|
|
|
|
; CHECK-THUMB2-NEXT: sbcs.w r0, r1, r3
|
|
|
|
; CHECK-THUMB2-NEXT: bge .LBB1_2
|
|
|
|
; CHECK-THUMB2-NEXT: @ %bb.1: @ %bb1
|
|
|
|
; CHECK-THUMB2-NEXT: bl f
|
|
|
|
; CHECK-THUMB2-NEXT: pop {r7, pc}
|
|
|
|
; CHECK-THUMB2-NEXT: .LBB1_2: @ %bb2
|
|
|
|
; CHECK-THUMB2-NEXT: bl g
|
|
|
|
; CHECK-THUMB2-NEXT: pop {r7, pc}
|
ARM: Better codegen for 64-bit compares.
This introduces a custom lowering for ISD::SETCCE (introduced in r253572)
that allows us to emit a short code sequence for 64-bit compares.
Before:
push {r7, lr}
cmp r0, r2
mov.w r0, #0
mov.w r12, #0
it hs
movhs r0, #1
cmp r1, r3
it ge
movge.w r12, #1
it eq
moveq r12, r0
cmp.w r12, #0
bne .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
After:
push {r7, lr}
subs r0, r0, r2
sbcs.w r0, r1, r3
bge .LBB1_2
@ BB#1: @ %bb1
bl f
pop {r7, pc}
.LBB1_2: @ %bb2
bl g
pop {r7, pc}
Saves around 80KB in Chromium's libchrome.so.
Some notes on this patch:
- I don't much like the ARMISD::BRCOND and ARMISD::CMOV combines I
introduced (nothing else needs them). However, they are necessary in
order to avoid poor codegen, and they seem similar to existing combines
in other backends (e.g. X86 combines (brcond (cmp (setcc Compare))) to
(brcond Compare)).
- No support for Thumb-1. This is in principle possible, but we'd need
to implement ARMISD::SUBE for Thumb-1.
Differential Revision: http://reviews.llvm.org/D15256
llvm-svn: 263962
2016-03-22 02:00:02 +08:00
|
|
|
entry:
|
|
|
|
%cmp = icmp slt i64 %a, %b
|
|
|
|
br i1 %cmp, label %bb1, label %bb2
|
|
|
|
bb1:
|
|
|
|
call void @f()
|
|
|
|
ret void
|
|
|
|
bb2:
|
|
|
|
call void @g()
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
declare void @f()
|
|
|
|
declare void @g()
|