2018-05-04 01:41:37 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
|
|
; REQUIRES: asserts
|
2018-05-04 02:49:35 +08:00
|
|
|
; RUN: llc < %s -mtriple=powerpc64le -debug-only=isel -o /dev/null 2>&1 | FileCheck %s --check-prefix=FMFDEBUG
|
|
|
|
; RUN: llc < %s -mtriple=powerpc64le | FileCheck %s --check-prefix=FMF
|
2018-05-15 05:17:49 +08:00
|
|
|
; RUN: llc < %s -mtriple=powerpc64le -debug-only=isel -o /dev/null 2>&1 -enable-unsafe-fp-math -enable-no-nans-fp-math | FileCheck %s --check-prefix=GLOBALDEBUG
|
Migrate some more fadd and fsub cases away from UnsafeFPMath control to utilize NoSignedZerosFPMath options control
Summary: Honoring no signed zeroes is also available as a user control through clang separately regardless of fastmath or UnsafeFPMath context, DAG guards should reflect this context.
Reviewers: spatel, arsenm, hfinkel, wristow, craig.topper
Reviewed By: spatel
Subscribers: rampitec, foad, nhaehnle, wuzish, nemanjai, jvesely, wdng, javed.absar, MaskRay, jsji
Differential Revision: https://reviews.llvm.org/D65170
llvm-svn: 367486
2019-08-01 05:57:28 +08:00
|
|
|
; RUN: llc < %s -mtriple=powerpc64le -enable-unsafe-fp-math -enable-no-nans-fp-math -enable-no-signed-zeros-fp-math | FileCheck %s --check-prefix=GLOBAL
|
2018-05-04 01:41:37 +08:00
|
|
|
|
|
|
|
; Test FP transforms using instruction/node-level fast-math-flags.
|
|
|
|
; We're also checking debug output to verify that FMF is propagated to the newly created nodes.
|
|
|
|
; The run with the global unsafe param tests the pre-FMF behavior using regular instructions/nodes.
|
|
|
|
|
|
|
|
declare float @llvm.fma.f32(float, float, float)
|
|
|
|
declare float @llvm.sqrt.f32(float)
|
|
|
|
|
|
|
|
; X * Y + Z --> fma(X, Y, Z)
|
|
|
|
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; contract bits in fmul is checked.
|
|
|
|
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_contract1:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG-NOT: fma contract {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_contract1:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_contract1(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_contract1:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 1, 0, 3
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_contract1:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul float %x, %y
|
|
|
|
%add = fadd contract float %mul, %z
|
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; contract bits in fadd is also checked.
|
2018-05-04 01:41:37 +08:00
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_contract2:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG-NOT: fma contract {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_contract2:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_contract2(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_contract2:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 1, 0, 3
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_contract2:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul contract float %x, %y
|
|
|
|
%add = fadd float %mul, %z
|
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_contract3:'
|
|
|
|
; FMFDEBUG: fma contract {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_contract3:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_contract3(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_contract3:
|
|
|
|
; FMF: # %bb.0:
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; FMF-NEXT: fmr 1, 3
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-LABEL: fmul_fadd_contract3:
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul contract float %x, %y
|
|
|
|
%add = fadd contract float %mul, %z
|
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; Reassociation does NOT imply that FMA contraction is allowed.
|
2018-05-04 01:41:37 +08:00
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_reassoc1:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG-NOT: fma reassoc {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_reassoc1:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_reassoc1(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_reassoc1:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 1, 0, 3
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_reassoc1:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul float %x, %y
|
|
|
|
%add = fadd reassoc float %mul, %z
|
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
|
|
|
; This shouldn't change anything - the intermediate fmul result is now also flagged.
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_reassoc2:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG-NOT: fma reassoc {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_reassoc2:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_reassoc2(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_reassoc2:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 1, 0, 3
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_reassoc2:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul reassoc float %x, %y
|
|
|
|
%add = fadd reassoc float %mul, %z
|
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; The fadd is now fully 'fast', but fmul is not yet.
|
2018-05-04 01:41:37 +08:00
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_fast1:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG-NOT: fma nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_fast1:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_fast1(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_fast1:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 1, 0, 3
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_fast1:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%mul = fmul float %x, %y
|
|
|
|
%add = fadd fast float %mul, %z
|
2018-05-04 01:41:37 +08:00
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; This implies that contraction is allowed - the intermediate fmul result is now also flagged.
|
2018-05-04 01:41:37 +08:00
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fadd_fast2:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG: fma nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}, {{t[0-9]+}}, {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fadd_fast2:'
|
|
|
|
|
|
|
|
define float @fmul_fadd_fast2(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fmul_fadd_fast2:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; FMF-NEXT: fmr 1, 3
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fadd_fast2:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 3, 1, 2
|
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%mul = fmul fast float %x, %y
|
|
|
|
%add = fadd fast float %mul, %z
|
2018-05-04 01:41:37 +08:00
|
|
|
ret float %add
|
|
|
|
}
|
|
|
|
|
|
|
|
; fma(X, 7.0, X * 42.0) --> X * 49.0
|
|
|
|
; This is the minimum FMF needed for this transform - the FMA allows reassociation.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_reassoc1:'
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMFDEBUG: fmul reassoc {{t[0-9]+}},
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_reassoc1:'
|
|
|
|
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_reassoc1:'
|
Fast Math Flag mapping into SDNode
Summary: Adding support for Fast flags in the SDNode to leverage fast math sub flag usage.
Reviewers: spatel, arsenm, jbhateja, hfinkel, escha, qcolombet, echristo, wristow, javed.absar
Reviewed By: spatel
Subscribers: llvm-commits, rampitec, nhaehnle, tstellar, FarhanaAleen, nemanjai, javed.absar, jbhateja, hfinkel, wdng
Differential Revision: https://reviews.llvm.org/D45710
llvm-svn: 331547
2018-05-05 02:48:20 +08:00
|
|
|
; GLOBALDEBUG: fmul reassoc {{t[0-9]+}}
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_reassoc1:'
|
|
|
|
|
2018-05-04 01:41:37 +08:00
|
|
|
define float @fmul_fma_reassoc1(float %x) {
|
|
|
|
; FMF-LABEL: fmul_fma_reassoc1:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI7_0@toc@ha
|
|
|
|
; FMF-NEXT: lfs 0, .LCPI7_0@toc@l(3)
|
Utilize new SDNode flag functionality to expand current support for fma
Summary: This patch originated from D47388 and is a proper subset of the originating changes, containing only the fmf optimization guard extensions.
Reviewers: spatel, hfinkel, wristow, arsenm, javed.absar, rampitec, nhaehnle, nemanjai
Reviewed By: rampitec, nhaehnle
Subscribers: tpr, nemanjai, wdng
Differential Revision: https://reviews.llvm.org/D47918
llvm-svn: 334876
2018-06-16 08:03:06 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fma_reassoc1:
|
|
|
|
; GLOBAL: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI7_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 0, .LCPI7_0@toc@l(3)
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul float %x, 42.0
|
|
|
|
%fma = call reassoc float @llvm.fma.f32(float %x, float 7.0, float %mul)
|
|
|
|
ret float %fma
|
|
|
|
}
|
|
|
|
|
|
|
|
; This shouldn't change anything - the intermediate fmul result is now also flagged.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_reassoc2:'
|
2018-06-08 06:49:09 +08:00
|
|
|
; FMFDEBUG: fmul reassoc {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_reassoc2:'
|
|
|
|
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_reassoc2:'
|
Fast Math Flag mapping into SDNode
Summary: Adding support for Fast flags in the SDNode to leverage fast math sub flag usage.
Reviewers: spatel, arsenm, jbhateja, hfinkel, escha, qcolombet, echristo, wristow, javed.absar
Reviewed By: spatel
Subscribers: llvm-commits, rampitec, nhaehnle, tstellar, FarhanaAleen, nemanjai, javed.absar, jbhateja, hfinkel, wdng
Differential Revision: https://reviews.llvm.org/D45710
llvm-svn: 331547
2018-05-05 02:48:20 +08:00
|
|
|
; GLOBALDEBUG: fmul reassoc {{t[0-9]+}}
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_reassoc2:'
|
|
|
|
|
2018-05-04 01:41:37 +08:00
|
|
|
define float @fmul_fma_reassoc2(float %x) {
|
|
|
|
; FMF-LABEL: fmul_fma_reassoc2:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI8_0@toc@ha
|
|
|
|
; FMF-NEXT: lfs 0, .LCPI8_0@toc@l(3)
|
Utilize new SDNode flag functionality to expand current support for fma
Summary: This patch originated from D47388 and is a proper subset of the originating changes, containing only the fmf optimization guard extensions.
Reviewers: spatel, hfinkel, wristow, arsenm, javed.absar, rampitec, nhaehnle, nemanjai
Reviewed By: rampitec, nhaehnle
Subscribers: tpr, nemanjai, wdng
Differential Revision: https://reviews.llvm.org/D47918
llvm-svn: 334876
2018-06-16 08:03:06 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fma_reassoc2:
|
|
|
|
; GLOBAL: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI8_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 0, .LCPI8_0@toc@l(3)
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul reassoc float %x, 42.0
|
|
|
|
%fma = call reassoc float @llvm.fma.f32(float %x, float 7.0, float %mul)
|
|
|
|
ret float %fma
|
|
|
|
}
|
|
|
|
|
|
|
|
; The FMA is now fully 'fast'. This implies that reassociation is allowed.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_fast1:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG: fmul nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_fast1:'
|
|
|
|
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_fast1:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBALDEBUG: fmul nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_fast1:'
|
|
|
|
|
2018-05-04 01:41:37 +08:00
|
|
|
define float @fmul_fma_fast1(float %x) {
|
|
|
|
; FMF-LABEL: fmul_fma_fast1:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI9_0@toc@ha
|
|
|
|
; FMF-NEXT: lfs 0, .LCPI9_0@toc@l(3)
|
Utilize new SDNode flag functionality to expand current support for fma
Summary: This patch originated from D47388 and is a proper subset of the originating changes, containing only the fmf optimization guard extensions.
Reviewers: spatel, hfinkel, wristow, arsenm, javed.absar, rampitec, nhaehnle, nemanjai
Reviewed By: rampitec, nhaehnle
Subscribers: tpr, nemanjai, wdng
Differential Revision: https://reviews.llvm.org/D47918
llvm-svn: 334876
2018-06-16 08:03:06 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fma_fast1:
|
|
|
|
; GLOBAL: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI9_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 0, .LCPI9_0@toc@l(3)
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%mul = fmul float %x, 42.0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%fma = call fast float @llvm.fma.f32(float %x, float 7.0, float %mul)
|
2018-05-04 01:41:37 +08:00
|
|
|
ret float %fma
|
|
|
|
}
|
|
|
|
|
|
|
|
; This shouldn't change anything - the intermediate fmul result is now also flagged.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_fast2:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG: fmul nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_fast2:'
|
|
|
|
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fmul_fma_fast2:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBALDEBUG: fmul nnan ninf nsz arcp contract afn reassoc {{t[0-9]+}}
|
2018-05-04 02:49:35 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fmul_fma_fast2:'
|
|
|
|
|
2018-05-04 01:41:37 +08:00
|
|
|
define float @fmul_fma_fast2(float %x) {
|
|
|
|
; FMF-LABEL: fmul_fma_fast2:
|
|
|
|
; FMF: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI10_0@toc@ha
|
|
|
|
; FMF-NEXT: lfs 0, .LCPI10_0@toc@l(3)
|
Utilize new SDNode flag functionality to expand current support for fma
Summary: This patch originated from D47388 and is a proper subset of the originating changes, containing only the fmf optimization guard extensions.
Reviewers: spatel, hfinkel, wristow, arsenm, javed.absar, rampitec, nhaehnle, nemanjai
Reviewed By: rampitec, nhaehnle
Subscribers: tpr, nemanjai, wdng
Differential Revision: https://reviews.llvm.org/D47918
llvm-svn: 334876
2018-06-16 08:03:06 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
2018-05-04 01:41:37 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fmul_fma_fast2:
|
|
|
|
; GLOBAL: # %bb.0:
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI10_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 0, .LCPI10_0@toc@l(3)
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: blr
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%mul = fmul fast float %x, 42.0
|
|
|
|
%fma = call fast float @llvm.fma.f32(float %x, float 7.0, float %mul)
|
2018-05-04 01:41:37 +08:00
|
|
|
ret float %fma
|
|
|
|
}
|
|
|
|
|
|
|
|
; Reduced precision for sqrt is allowed - should use estimate and NR iterations.
|
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_afn_ieee:'
|
2020-04-01 16:17:36 +08:00
|
|
|
; FMFDEBUG: fmul ninf afn {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_afn_ieee:'
|
2018-05-04 01:41:37 +08:00
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_afn_ieee:'
|
2020-04-01 16:17:36 +08:00
|
|
|
; GLOBALDEBUG: fmul ninf afn {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_afn_ieee:'
|
2018-05-04 02:49:35 +08:00
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
define float @sqrt_afn_ieee(float %x) #0 {
|
|
|
|
; FMF-LABEL: sqrt_afn_ieee:
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF: # %bb.0:
|
2020-05-12 14:29:40 +08:00
|
|
|
; FMF-NEXT: xsabsdp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI11_2@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI11_2@toc@l(3)
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: fcmpu 0, 0, 2
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF-NEXT: xxlxor 0, 0, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: blt 0, .LBB11_2
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF-NEXT: # %bb.1:
|
2019-05-07 21:48:03 +08:00
|
|
|
; FMF-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI11_0@toc@ha
|
|
|
|
; FMF-NEXT: addis 4, 2, .LCPI11_1@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI11_0@toc@l(3)
|
|
|
|
; FMF-NEXT: lfs 3, .LCPI11_1@toc@l(4)
|
2019-05-07 21:48:03 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 0
|
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 0, 0, 3
|
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: .LBB11_2:
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF-NEXT: fmr 1, 0
|
|
|
|
; FMF-NEXT: blr
|
2018-05-04 01:41:37 +08:00
|
|
|
;
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-LABEL: sqrt_afn_ieee:
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL: # %bb.0:
|
2020-05-12 14:29:40 +08:00
|
|
|
; GLOBAL-NEXT: xsabsdp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI11_2@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI11_2@toc@l(3)
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: fcmpu 0, 0, 2
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: xxlxor 0, 0, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: blt 0, .LBB11_2
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: # %bb.1:
|
2019-05-07 21:48:03 +08:00
|
|
|
; GLOBAL-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI11_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: addis 4, 2, .LCPI11_1@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI11_0@toc@l(3)
|
|
|
|
; GLOBAL-NEXT: lfs 3, .LCPI11_1@toc@l(4)
|
2019-05-07 21:48:03 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: .LBB11_2:
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: fmr 1, 0
|
2020-04-01 16:17:36 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%rt = call afn ninf float @llvm.sqrt.f32(float %x)
|
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
|
|
|
define float @sqrt_afn_ieee_inf(float %x) #0 {
|
|
|
|
; FMF-LABEL: sqrt_afn_ieee_inf:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xssqrtsp 1, 1
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: sqrt_afn_ieee_inf:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xssqrtsp 1, 1
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%rt = call afn float @llvm.sqrt.f32(float %x)
|
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_afn_preserve_sign:'
|
2020-04-01 16:17:36 +08:00
|
|
|
; FMFDEBUG: fmul ninf afn {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_afn_preserve_sign:'
|
2018-05-04 01:41:37 +08:00
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_afn_preserve_sign:'
|
2020-04-01 16:17:36 +08:00
|
|
|
; GLOBALDEBUG: fmul ninf afn {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_afn_preserve_sign:'
|
2018-05-04 02:49:35 +08:00
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
define float @sqrt_afn_preserve_sign(float %x) #1 {
|
|
|
|
; FMF-LABEL: sqrt_afn_preserve_sign:
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xxlxor 0, 0, 0
|
|
|
|
; FMF-NEXT: fcmpu 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: beq 0, .LBB13_2
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF-NEXT: # %bb.1:
|
2019-05-07 21:48:03 +08:00
|
|
|
; FMF-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI13_0@toc@ha
|
|
|
|
; FMF-NEXT: addis 4, 2, .LCPI13_1@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI13_0@toc@l(3)
|
|
|
|
; FMF-NEXT: lfs 3, .LCPI13_1@toc@l(4)
|
2019-05-07 21:48:03 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 0
|
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 2
|
|
|
|
; FMF-NEXT: xsaddsp 0, 0, 3
|
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: .LBB13_2:
|
2018-07-05 02:54:25 +08:00
|
|
|
; FMF-NEXT: fmr 1, 0
|
|
|
|
; FMF-NEXT: blr
|
2018-05-04 01:41:37 +08:00
|
|
|
;
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-LABEL: sqrt_afn_preserve_sign:
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xxlxor 0, 0, 0
|
|
|
|
; GLOBAL-NEXT: fcmpu 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: beq 0, .LBB13_2
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: # %bb.1:
|
2019-05-07 21:48:03 +08:00
|
|
|
; GLOBAL-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI13_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: addis 4, 2, .LCPI13_1@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI13_0@toc@l(3)
|
|
|
|
; GLOBAL-NEXT: lfs 3, .LCPI13_1@toc@l(4)
|
2019-05-07 21:48:03 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: .LBB13_2:
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: fmr 1, 0
|
2020-04-01 16:17:36 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%rt = call afn ninf float @llvm.sqrt.f32(float %x)
|
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
|
|
|
define float @sqrt_afn_preserve_sign_inf(float %x) #1 {
|
|
|
|
; FMF-LABEL: sqrt_afn_preserve_sign_inf:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xssqrtsp 1, 1
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: sqrt_afn_preserve_sign_inf:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xssqrtsp 1, 1
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%rt = call afn float @llvm.sqrt.f32(float %x)
|
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
|
|
|
; The call is now fully 'fast'. This implies that approximation is allowed.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_fast_ieee:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG: fmul ninf contract afn reassoc {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_fast_ieee:'
|
|
|
|
|
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_fast_ieee:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBALDEBUG: fmul ninf contract afn reassoc {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_fast_ieee:'
|
|
|
|
|
|
|
|
define float @sqrt_fast_ieee(float %x) #0 {
|
|
|
|
; FMF-LABEL: sqrt_fast_ieee:
|
|
|
|
; FMF: # %bb.0:
|
2020-05-12 14:29:40 +08:00
|
|
|
; FMF-NEXT: xsabsdp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI15_2@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI15_2@toc@l(3)
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: fcmpu 0, 0, 2
|
|
|
|
; FMF-NEXT: xxlxor 0, 0, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: blt 0, .LBB15_2
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: # %bb.1:
|
|
|
|
; FMF-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI15_0@toc@ha
|
|
|
|
; FMF-NEXT: addis 4, 2, .LCPI15_1@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI15_0@toc@l(3)
|
|
|
|
; FMF-NEXT: lfs 3, .LCPI15_1@toc@l(4)
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; FMF-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; FMF-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: .LBB15_2:
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: fmr 1, 0
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: sqrt_fast_ieee:
|
|
|
|
; GLOBAL: # %bb.0:
|
2020-05-12 14:29:40 +08:00
|
|
|
; GLOBAL-NEXT: xsabsdp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI15_2@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI15_2@toc@l(3)
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: fcmpu 0, 0, 2
|
|
|
|
; GLOBAL-NEXT: xxlxor 0, 0, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: blt 0, .LBB15_2
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: # %bb.1:
|
|
|
|
; GLOBAL-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI15_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: addis 4, 2, .LCPI15_1@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI15_0@toc@l(3)
|
|
|
|
; GLOBAL-NEXT: lfs 3, .LCPI15_1@toc@l(4)
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: .LBB15_2:
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: fmr 1, 0
|
|
|
|
; GLOBAL-NEXT: blr
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%rt = call contract reassoc afn ninf float @llvm.sqrt.f32(float %x)
|
2019-11-08 10:26:17 +08:00
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
|
|
|
; The call is now fully 'fast'. This implies that approximation is allowed.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_fast_preserve_sign:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMFDEBUG: fmul ninf contract afn reassoc {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_fast_preserve_sign:'
|
|
|
|
|
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'sqrt_fast_preserve_sign:'
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBALDEBUG: fmul ninf contract afn reassoc {{t[0-9]+}}
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'sqrt_fast_preserve_sign:'
|
|
|
|
|
|
|
|
define float @sqrt_fast_preserve_sign(float %x) #1 {
|
|
|
|
; FMF-LABEL: sqrt_fast_preserve_sign:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xxlxor 0, 0, 0
|
|
|
|
; FMF-NEXT: fcmpu 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: beq 0, .LBB16_2
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: # %bb.1:
|
|
|
|
; FMF-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: addis 3, 2, .LCPI16_0@toc@ha
|
|
|
|
; FMF-NEXT: addis 4, 2, .LCPI16_1@toc@ha
|
|
|
|
; FMF-NEXT: lfs 2, .LCPI16_0@toc@l(3)
|
|
|
|
; FMF-NEXT: lfs 3, .LCPI16_1@toc@l(4)
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; FMF-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; FMF-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; FMF-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: .LBB16_2:
|
2019-11-08 10:26:17 +08:00
|
|
|
; FMF-NEXT: fmr 1, 0
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: sqrt_fast_preserve_sign:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xxlxor 0, 0, 0
|
|
|
|
; GLOBAL-NEXT: fcmpu 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: beq 0, .LBB16_2
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: # %bb.1:
|
|
|
|
; GLOBAL-NEXT: xsrsqrtesp 0, 1
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: addis 3, 2, .LCPI16_0@toc@ha
|
|
|
|
; GLOBAL-NEXT: addis 4, 2, .LCPI16_1@toc@ha
|
|
|
|
; GLOBAL-NEXT: lfs 2, .LCPI16_0@toc@l(3)
|
|
|
|
; GLOBAL-NEXT: lfs 3, .LCPI16_1@toc@l(4)
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: xsmulsp 1, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmaddasp 2, 1, 0
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 1, 3
|
|
|
|
; GLOBAL-NEXT: xsmulsp 0, 0, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: .LBB16_2:
|
2019-11-08 10:26:17 +08:00
|
|
|
; GLOBAL-NEXT: fmr 1, 0
|
2018-05-04 01:41:37 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
%rt = call contract reassoc ninf afn float @llvm.sqrt.f32(float %x)
|
2018-05-04 01:41:37 +08:00
|
|
|
ret float %rt
|
|
|
|
}
|
|
|
|
|
2018-05-15 05:17:49 +08:00
|
|
|
; fcmp can have fast-math-flags.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fcmp_nnan:'
|
2019-06-04 03:12:15 +08:00
|
|
|
; FMFDEBUG: select_cc nnan {{t[0-9]+}}
|
2018-05-15 05:17:49 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fcmp_nnan:'
|
|
|
|
|
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fcmp_nnan:'
|
2019-06-04 03:12:15 +08:00
|
|
|
; GLOBALDEBUG: select_cc nnan {{t[0-9]+}}
|
2018-05-15 05:17:49 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fcmp_nnan:'
|
|
|
|
|
|
|
|
define double @fcmp_nnan(double %a, double %y, double %z) {
|
|
|
|
; FMF-LABEL: fcmp_nnan:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: xxlxor 0, 0, 0
|
2018-05-15 22:16:24 +08:00
|
|
|
; FMF-NEXT: xscmpudp 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: blt 0, .LBB17_2
|
2018-05-15 05:17:49 +08:00
|
|
|
; FMF-NEXT: # %bb.1:
|
|
|
|
; FMF-NEXT: fmr 3, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; FMF-NEXT: .LBB17_2:
|
2018-05-15 05:17:49 +08:00
|
|
|
; FMF-NEXT: fmr 1, 3
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fcmp_nnan:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: xxlxor 0, 0, 0
|
|
|
|
; GLOBAL-NEXT: xscmpudp 0, 1, 0
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: blt 0, .LBB17_2
|
2018-05-15 05:17:49 +08:00
|
|
|
; GLOBAL-NEXT: # %bb.1:
|
|
|
|
; GLOBAL-NEXT: fmr 3, 2
|
[DAGCombine] reassoc flag shouldn't enable contract
According to IR LangRef, the FMF flag:
contract
Allow floating-point contraction (e.g. fusing a multiply followed by an
addition into a fused multiply-and-add).
reassoc
Allow reassociation transformations for floating-point instructions.
This may dramatically change results in floating-point.
My understanding is that these two flags shouldn't imply each other,
as we might have a SDNode that can be reassociated with others, but
not contractble.
eg: We may want following fmul/fad/fsub to freely reassoc, but don't
want fma being generated here.
%F = fmul reassoc double %A, %B ; <double> [#uses=1]
%G = fmul reassoc double %C, %D ; <double> [#uses=1]
%H = fadd reassoc double %F, %G ; <double> [#uses=1]
%I = fsub reassoc double %H, %E ; <double> [#uses=1]
Before https://reviews.llvm.org/D45710, `reassoc` flag actually
did not imply isContratable either.
The current implementation also only check the flag in fadd node,
ignoring fmul node, this patch update that as well.
Reviewed By: spatel, qiucf
Differential Revision: https://reviews.llvm.org/D104247
2021-06-22 03:25:40 +08:00
|
|
|
; GLOBAL-NEXT: .LBB17_2:
|
2018-05-15 05:17:49 +08:00
|
|
|
; GLOBAL-NEXT: fmr 1, 3
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%cmp = fcmp nnan ult double %a, 0.0
|
|
|
|
%z.y = select i1 %cmp, double %z, double %y
|
|
|
|
ret double %z.y
|
|
|
|
}
|
|
|
|
|
|
|
|
; FP library calls can have fast-math-flags.
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'log2_approx:'
|
|
|
|
; FMFDEBUG: ch,glue = PPCISD::CALL_NOP t11, TargetGlobalAddress:i64<double (double)* @log2>
|
|
|
|
; FMFDEBUG: ch,glue = callseq_end t15, TargetConstant:i64<32>, TargetConstant:i64<0>, t15:1
|
2020-09-09 06:09:35 +08:00
|
|
|
; FMFDEBUG: f64,ch,glue = CopyFromReg t16, Register:f64 $f1, t16:1
|
2018-05-15 05:17:49 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'log2_approx:'
|
|
|
|
|
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'log2_approx:'
|
|
|
|
; GLOBALDEBUG: ch,glue = PPCISD::CALL_NOP t11, TargetGlobalAddress:i64<double (double)* @log2>
|
|
|
|
; GLOBALDEBUG: ch,glue = callseq_end t15, TargetConstant:i64<32>, TargetConstant:i64<0>, t15:1
|
2020-09-09 06:09:35 +08:00
|
|
|
; GLOBALDEBUG: f64,ch,glue = CopyFromReg t16, Register:f64 $f1, t16:1
|
2018-05-15 05:17:49 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'log2_approx:'
|
|
|
|
|
|
|
|
declare double @log2(double)
|
|
|
|
define double @log2_approx(double %x) nounwind {
|
|
|
|
; FMF-LABEL: log2_approx:
|
|
|
|
; FMF: # %bb.0:
|
|
|
|
; FMF-NEXT: mflr 0
|
|
|
|
; FMF-NEXT: std 0, 16(1)
|
|
|
|
; FMF-NEXT: stdu 1, -32(1)
|
|
|
|
; FMF-NEXT: bl log2
|
|
|
|
; FMF-NEXT: nop
|
|
|
|
; FMF-NEXT: addi 1, 1, 32
|
|
|
|
; FMF-NEXT: ld 0, 16(1)
|
|
|
|
; FMF-NEXT: mtlr 0
|
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: log2_approx:
|
|
|
|
; GLOBAL: # %bb.0:
|
|
|
|
; GLOBAL-NEXT: mflr 0
|
|
|
|
; GLOBAL-NEXT: std 0, 16(1)
|
|
|
|
; GLOBAL-NEXT: stdu 1, -32(1)
|
|
|
|
; GLOBAL-NEXT: bl log2
|
|
|
|
; GLOBAL-NEXT: nop
|
|
|
|
; GLOBAL-NEXT: addi 1, 1, 32
|
|
|
|
; GLOBAL-NEXT: ld 0, 16(1)
|
|
|
|
; GLOBAL-NEXT: mtlr 0
|
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%r = call afn double @log2(double %x)
|
|
|
|
ret double %r
|
|
|
|
}
|
|
|
|
|
2018-06-06 02:12:25 +08:00
|
|
|
; -(X - Y) --> (Y - X)
|
|
|
|
|
|
|
|
; FMFDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fneg_fsub_nozeros_1:'
|
2018-06-06 02:49:47 +08:00
|
|
|
; FMFDEBUG: fsub nsz {{t[0-9]+}}, {{t[0-9]+}}
|
2018-06-06 02:12:25 +08:00
|
|
|
; FMFDEBUG: Type-legalized selection DAG: %bb.0 'fneg_fsub_nozeros_1:'
|
|
|
|
|
|
|
|
; GLOBALDEBUG-LABEL: Optimized lowered selection DAG: %bb.0 'fneg_fsub_nozeros_1:'
|
2018-06-06 02:49:47 +08:00
|
|
|
; GLOBALDEBUG: fsub nsz {{t[0-9]+}}, {{t[0-9]+}}
|
2018-06-06 02:12:25 +08:00
|
|
|
; GLOBALDEBUG: Type-legalized selection DAG: %bb.0 'fneg_fsub_nozeros_1:'
|
|
|
|
|
|
|
|
define float @fneg_fsub_nozeros_1(float %x, float %y, float %z) {
|
|
|
|
; FMF-LABEL: fneg_fsub_nozeros_1:
|
|
|
|
; FMF: # %bb.0:
|
2018-06-06 02:49:47 +08:00
|
|
|
; FMF-NEXT: xssubsp 1, 2, 1
|
2018-06-06 02:12:25 +08:00
|
|
|
; FMF-NEXT: blr
|
|
|
|
;
|
|
|
|
; GLOBAL-LABEL: fneg_fsub_nozeros_1:
|
|
|
|
; GLOBAL: # %bb.0:
|
2018-06-06 02:49:47 +08:00
|
|
|
; GLOBAL-NEXT: xssubsp 1, 2, 1
|
2018-06-06 02:12:25 +08:00
|
|
|
; GLOBAL-NEXT: blr
|
|
|
|
%neg = fsub float %x, %y
|
2018-06-06 02:49:47 +08:00
|
|
|
%add = fsub nsz float 0.0, %neg
|
2018-06-06 02:12:25 +08:00
|
|
|
ret float %add
|
|
|
|
}
|
2018-06-06 02:49:47 +08:00
|
|
|
|
2019-11-08 10:26:17 +08:00
|
|
|
attributes #0 = { "denormal-fp-math"="ieee,ieee" }
|
|
|
|
attributes #1 = { "denormal-fp-math"="preserve-sign,preserve-sign" }
|