; Forked from OSchip/llvm-project.
; Viewer details: LLVM IR, 80 lines, 1.9 KiB.
; RUN: llc -mtriple=armv7a -mattr=+hwdiv-arm %s -o - | FileCheck %s --check-prefixes=CHECK,DIV
; RUN: llc -mtriple=armv7a -mattr=-hwdiv-arm %s -o - | FileCheck %s --check-prefixes=CHECK,NODIV

; Check SREM.
; A signed remainder by 4 in a minsize function. The expectations use the
; shared CHECK prefix, so the same inline sequence (sign-derived bias, mask off
; the low bits, subtract) must be produced with and without hardware divide.
define dso_local i32 @test_rem(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL: test_rem:
; CHECK:       asr r1, r0, #31
; CHECK-NEXT:  add r1, r0, r1, lsr #30
; CHECK-NEXT:  bic r1, r1, #3
; CHECK-NEXT:  sub r0, r0, r1
; CHECK-NEXT:  bx lr

entry:
  %rem = srem i32 %F, 4
  ret i32 %rem
}

; Try an i16 sdiv, with a small immediate.
; With hardware divide (DIV prefix) the divisor is materialised with a single
; mov and the sdiv instruction is kept, followed by a sign-extension of the
; 16-bit result. Without it (NODIV prefix) the shift-based expansion is expected.
define dso_local signext i16 @f0(i16 signext %F) local_unnamed_addr #0 {
; CHECK-LABEL: f0:

; DIV:         mov r1, #2
; DIV-NEXT:    sdiv r0, r0, r1
; DIV-NEXT:    sxth r0, r0
; DIV-NEXT:    bx lr

; NODIV:       uxth r1, r0
; NODIV-NEXT:  add r0, r0, r1, lsr #15
; NODIV-NEXT:  sxth r0, r0
; NODIV-NEXT:  asr r0, r0, #1
; NODIV-NEXT:  bx lr

entry:
  %div = sdiv i16 %F, 2
  ret i16 %div
}

; Try an i32 sdiv, with a small immediate.
; With hardware divide (DIV prefix) a mov + sdiv pair is expected; without it
; (NODIV prefix) the three-instruction shift/add/shift expansion is expected.
define dso_local i32 @f1(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL: f1:

; DIV:         mov r1, #4
; DIV-NEXT:    sdiv r0, r0, r1
; DIV-NEXT:    bx lr

; NODIV:       asr r1, r0, #31
; NODIV-NEXT:  add r0, r0, r1, lsr #30
; NODIV-NEXT:  asr r0, r0, #2
; NODIV-NEXT:  bx lr

entry:
  %div = sdiv i32 %F, 4
  ret i32 %div
}

; Try a large power of 2 immediate, which should also be materialised with 1
; move immediate instruction.
; Only the hardware-divide configuration (DIV prefix) has expectations here;
; the output of the configuration without hardware divide is not checked for
; this function.
define dso_local i32 @f2(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL: f2:
; DIV:         mov r1, #131072
; DIV-NEXT:    sdiv r0, r0, r1
; DIV-NEXT:    bx lr
entry:
  %div = sdiv i32 %F, 131072
  ret i32 %div
}

; MinSize not set, so should expand to the faster but longer sequence.
; This function carries no attribute group, and its expectations use the shared
; CHECK prefix: the shift-based expansion is required in both configurations,
; including the one where hardware divide is available.
define dso_local i32 @f3(i32 %F) {
; CHECK-LABEL: f3:
; CHECK:       asr r1, r0, #31
; CHECK-NEXT:  add r0, r0, r1, lsr #30
; CHECK-NEXT:  asr r0, r0, #2
; CHECK-NEXT:  bx lr
entry:
  %div = sdiv i32 %F, 4
  ret i32 %div
}

; Attribute group #0 marks a function as size-optimised (minsize, optsize).
; It is attached to test_rem, f0, f1 and f2; f3 leaves it off so that the
; lowering used when MinSize is not set is exercised.
attributes #0 = { minsize norecurse nounwind optsize readnone }
|