forked from OSchip/llvm-project
408 lines
8.5 KiB
LLVM
408 lines
8.5 KiB
LLVM
; Test that floating-point compares are omitted if CC already has the
|
|
; right value.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z10 -no-integrated-as | FileCheck %s
|
|
|
|
declare float @llvm.fabs.f32(float %f)
|
|
|
|
; Test addition followed by EQ, which can use the CC result of the addition.
|
|
define float @f1(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: ber %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fadd float %a, %b
|
|
%cmp = fcmp oeq float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; ...and again with LT.
|
|
define float @f2(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fadd float %a, %b
|
|
%cmp = fcmp olt float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; ...and again with GT.
|
|
define float @f3(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f3:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: bhr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fadd float %a, %b
|
|
%cmp = fcmp ogt float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; ...and again with UEQ.
|
|
define float @f4(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f4:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: bnlhr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fadd float %a, %b
|
|
%cmp = fcmp ueq float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Subtraction also provides a zero-based CC value.
|
|
define float @f5(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f5:
|
|
; CHECK: seb %f0, 0(%r2)
|
|
; CHECK-NEXT: bnher %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%cur = load float, float *%dest
|
|
%res = fsub float %a, %cur
|
|
%cmp = fcmp ult float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test the result of LOAD POSITIVE.
|
|
define float @f6(float %dummy, float %a, float *%dest) {
|
|
; CHECK-LABEL: f6:
|
|
; CHECK: lpebr %f0, %f2
|
|
; CHECK-NEXT: bhr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = call float @llvm.fabs.f32(float %a)
|
|
%cmp = fcmp ogt float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %res, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test the result of LOAD NEGATIVE.
|
|
define float @f7(float %dummy, float %a, float *%dest) {
|
|
; CHECK-LABEL: f7:
|
|
; CHECK: lnebr %f0, %f2
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%abs = call float @llvm.fabs.f32(float %a)
|
|
%res = fsub float -0.0, %abs
|
|
%cmp = fcmp olt float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %res, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test the result of LOAD COMPLEMENT.
|
|
define float @f8(float %dummy, float %a, float *%dest) {
|
|
; CHECK-LABEL: f8:
|
|
; CHECK: lcebr %f0, %f2
|
|
; CHECK-NEXT: bler %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fsub float -0.0, %a
|
|
%cmp = fcmp ole float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %res, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Multiplication (for example) does not modify CC.
|
|
define float @f9(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f9:
|
|
; CHECK: meebr %f0, %f2
|
|
; CHECK-NEXT: ltebr %f0, %f0
|
|
; CHECK-NEXT: blhr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fmul float %a, %b
|
|
%cmp = fcmp one float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test a combination involving a CC-setting instruction followed by
|
|
; a non-CC-setting instruction.
|
|
define float @f10(float %a, float %b, float %c, float *%dest) {
|
|
; CHECK-LABEL: f10:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: debr %f0, %f4
|
|
; CHECK-NEXT: ltebr %f0, %f0
|
|
; CHECK-NEXT: bner %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%add = fadd float %a, %b
|
|
%res = fdiv float %add, %c
|
|
%cmp = fcmp une float %res, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test a case where CC is set based on a different register from the
|
|
; compare input.
|
|
define float @f11(float %a, float %b, float %c, float *%dest1, float *%dest2) {
|
|
; CHECK-LABEL: f11:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: sebr %f4, %f0
|
|
; CHECK-DAG: ste %f4, 0(%r2)
|
|
; CHECK-DAG: ltebr %f0, %f0
|
|
; CHECK-NEXT: ber %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%add = fadd float %a, %b
|
|
%sub = fsub float %c, %add
|
|
store float %sub, float *%dest1
|
|
%cmp = fcmp oeq float %add, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %sub, float *%dest2
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %add
|
|
}
|
|
|
|
; Test that LER gets converted to LTEBR where useful.
|
|
define float @f12(float %dummy, float %val, float *%dest) {
|
|
; CHECK-LABEL: f12:
|
|
; CHECK: ltebr %f0, %f2
|
|
; CHECK-NEXT: #APP
|
|
; CHECK-NEXT: blah %f0
|
|
; CHECK-NEXT: #NO_APP
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
call void asm sideeffect "blah $0", "{f0}"(float %val)
|
|
%cmp = fcmp olt float %val, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %val, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %val
|
|
}
|
|
|
|
; Test that LDR gets converted to LTDBR where useful.
|
|
define double @f13(double %dummy, double %val, double *%dest) {
|
|
; CHECK-LABEL: f13:
|
|
; CHECK: ltdbr %f0, %f2
|
|
; CHECK-NEXT: #APP
|
|
; CHECK-NEXT: blah %f0
|
|
; CHECK-NEXT: #NO_APP
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
call void asm sideeffect "blah $0", "{f0}"(double %val)
|
|
%cmp = fcmp olt double %val, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store double %val, double *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret double %val
|
|
}
|
|
|
|
; Test that LXR gets converted to LTXBR where useful.
|
|
define void @f14(fp128 *%ptr1, fp128 *%ptr2) {
|
|
; CHECK-LABEL: f14:
|
|
; CHECK: ltxbr
|
|
; CHECK-NEXT: dxbr
|
|
; CHECK-NEXT: std
|
|
; CHECK-NEXT: std
|
|
; CHECK-NEXT: mxbr
|
|
; CHECK-NEXT: std
|
|
; CHECK-NEXT: std
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%val1 = load fp128, fp128 *%ptr1
|
|
%val2 = load fp128, fp128 *%ptr2
|
|
%div = fdiv fp128 %val1, %val2
|
|
store fp128 %div, fp128 *%ptr1
|
|
%mul = fmul fp128 %val1, %val2
|
|
store fp128 %mul, fp128 *%ptr2
|
|
%cmp = fcmp olt fp128 %val1, 0xL00000000000000000000000000000000
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
call void asm sideeffect "blah", ""()
|
|
br label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
; Test a case where it is the source rather than destination of LER that
|
|
; we need.
|
|
define float @f15(float %val, float %dummy, float *%dest) {
|
|
; CHECK-LABEL: f15:
|
|
; CHECK: ltebr %f2, %f0
|
|
; CHECK-NEXT: #APP
|
|
; CHECK-NEXT: blah %f2
|
|
; CHECK-NEXT: #NO_APP
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
call void asm sideeffect "blah $0", "{f2}"(float %val)
|
|
%cmp = fcmp olt float %val, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %val, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %val
|
|
}
|
|
|
|
; Test a case where it is the source rather than destination of LDR that
|
|
; we need.
|
|
define double @f16(double %val, double %dummy, double *%dest) {
|
|
; CHECK-LABEL: f16:
|
|
; CHECK: ltdbr %f2, %f0
|
|
; CHECK-NEXT: #APP
|
|
; CHECK-NEXT: blah %f2
|
|
; CHECK-NEXT: #NO_APP
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
call void asm sideeffect "blah $0", "{f2}"(double %val)
|
|
%cmp = fcmp olt double %val, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store double %val, double *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret double %val
|
|
}
|
|
|
|
; Repeat f2 with a comparison against -0.
|
|
define float @f17(float %a, float %b, float *%dest) {
|
|
; CHECK-LABEL: f17:
|
|
; CHECK: aebr %f0, %f2
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fadd float %a, %b
|
|
%cmp = fcmp olt float %res, -0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %b, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Test another form of f7 in which the condition is based on the unnegated
|
|
; result. This is what InstCombine would produce.
|
|
define float @f18(float %dummy, float %a, float *%dest) {
|
|
; CHECK-LABEL: f18:
|
|
; CHECK: lnebr %f0, %f2
|
|
; CHECK-NEXT: blr %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%abs = call float @llvm.fabs.f32(float %a)
|
|
%res = fsub float -0.0, %abs
|
|
%cmp = fcmp ogt float %abs, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %res, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|
|
|
|
; Similarly for f8.
|
|
define float @f19(float %dummy, float %a, float *%dest) {
|
|
; CHECK-LABEL: f19:
|
|
; CHECK: lcebr %f0, %f2
|
|
; CHECK-NEXT: bler %r14
|
|
; CHECK: br %r14
|
|
entry:
|
|
%res = fsub float -0.0, %a
|
|
%cmp = fcmp oge float %a, 0.0
|
|
br i1 %cmp, label %exit, label %store
|
|
|
|
store:
|
|
store float %res, float *%dest
|
|
br label %exit
|
|
|
|
exit:
|
|
ret float %res
|
|
}
|