llvm-project/llvm/test/CodeGen/SystemZ/fp-strict-alias.ll

; Verify that strict FP operations are not rescheduled
;
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s

declare float @llvm.experimental.constrained.fadd.f32(float, float, metadata, metadata)
declare float @llvm.experimental.constrained.fsub.f32(float, float, metadata, metadata)
declare float @llvm.experimental.constrained.sqrt.f32(float, metadata, metadata)
declare float @llvm.sqrt.f32(float)
declare void @llvm.s390.sfpc(i32)

; For non-strict operations, we expect the post-RA scheduler to
; separate the two square root instructions on z13.
;
; f1 computes %f1 + %f2, %f3 - %f4, sqrt(%f2) and sqrt(%f4) using ordinary
; (unconstrained) FP operations and stores the four results into four
; consecutive float slots starting at %ptr0.  The FileCheck directives below
; require an add or subtract (aebr/sebr) to show up between the two sqebr
; instructions, i.e. the output order differs from the IR order.
define void @f1(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {
; CHECK-LABEL: f1:
; CHECK: sqebr
; CHECK: {{aebr|sebr}}
; CHECK: sqebr
; CHECK: br %r14

  ; Four FP computations; none of them consumes another one's result.
  %add = fadd float %f1, %f2
  %sub = fsub float %f3, %f4
  %sqrt1 = call float @llvm.sqrt.f32(float %f2)
  %sqrt2 = call float @llvm.sqrt.f32(float %f4)

  ; Addresses of float elements 1..3 relative to %ptr0 (element 0 is %ptr0).
  %ptr1 = getelementptr float, float *%ptr0, i64 1
  %ptr2 = getelementptr float, float *%ptr0, i64 2
  %ptr3 = getelementptr float, float *%ptr0, i64 3

  ; Store every result so that all four computations are used.
  store float %add, float *%ptr0
  store float %sub, float *%ptr1
  store float %sqrt1, float *%ptr2
  store float %sqrt2, float *%ptr3

  ret void
}

; But for strict operations, this must not happen.
;
; f2 performs the same four computations as f1, but through the constrained
; FP intrinsics with "round.dynamic" rounding and "fpexcept.strict" exception
; behaviour.  The FileCheck directives below require both add/subtract
; instructions (aebr/sebr) to appear before both sqebr instructions, which
; matches the order of the calls in the IR.
define void @f2(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {
; CHECK-LABEL: f2:
; CHECK: {{aebr|sebr}}
; CHECK: {{aebr|sebr}}
; CHECK: sqebr
; CHECK: sqebr
; CHECK: br %r14

  ; Constrained add, subtract and two square roots, in this order.
  %add = call float @llvm.experimental.constrained.fadd.f32(
                        float %f1, float %f2,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.strict")
  %sub = call float @llvm.experimental.constrained.fsub.f32(
                        float %f3, float %f4,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.strict")
  %sqrt1 = call float @llvm.experimental.constrained.sqrt.f32(
                        float %f2,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.strict")
  %sqrt2 = call float @llvm.experimental.constrained.sqrt.f32(
                        float %f4,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.strict")

  ; Addresses of float elements 1..3 relative to %ptr0 (element 0 is %ptr0).
  %ptr1 = getelementptr float, float *%ptr0, i64 1
  %ptr2 = getelementptr float, float *%ptr0, i64 2
  %ptr3 = getelementptr float, float *%ptr0, i64 3

  ; Store every result so that all four computations are used.
  store float %add, float *%ptr0
  store float %sub, float *%ptr1
  store float %sqrt1, float *%ptr2
  store float %sqrt2, float *%ptr3

  ret void
}

; On the other hand, strict operations that use the fpexcept.ignore
; exception behaviour should be scheduled freely.
;
; f3 is identical to f2 except that every constrained intrinsic call passes
; "fpexcept.ignore" instead of "fpexcept.strict".  The FileCheck directives
; below expect the same instruction order as in f1: an add or subtract
; (aebr/sebr) between the two sqebr instructions.
define void @f3(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {
; CHECK-LABEL: f3:
; CHECK: sqebr
; CHECK: {{aebr|sebr}}
; CHECK: sqebr
; CHECK: br %r14

  ; Constrained add, subtract and two square roots with exceptions ignored.
  %add = call float @llvm.experimental.constrained.fadd.f32(
                        float %f1, float %f2,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.ignore")
  %sub = call float @llvm.experimental.constrained.fsub.f32(
                        float %f3, float %f4,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.ignore")
  %sqrt1 = call float @llvm.experimental.constrained.sqrt.f32(
                        float %f2,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.ignore")
  %sqrt2 = call float @llvm.experimental.constrained.sqrt.f32(
                        float %f4,
                        metadata !"round.dynamic",
                        metadata !"fpexcept.ignore")

  ; Addresses of float elements 1..3 relative to %ptr0 (element 0 is %ptr0).
  %ptr1 = getelementptr float, float *%ptr0, i64 1
  %ptr2 = getelementptr float, float *%ptr0, i64 2
  %ptr3 = getelementptr float, float *%ptr0, i64 3

  ; Store every result so that all four computations are used.
  store float %add, float *%ptr0
  store float %sub, float *%ptr1
  store float %sqrt1, float *%ptr2
  store float %sqrt2, float *%ptr3

  ret void
}

; However, even non-strict operations must not be scheduled across an SFPC.
;
; f4 uses the same unconstrained operations as f1, but calls the
; llvm.s390.sfpc intrinsic between the add/subtract pair and the two square
; roots.  The FileCheck directives below require both add/subtract
; instructions (aebr/sebr) before the sfpc instruction and both sqebr
; instructions after it.
define void @f4(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {
; CHECK-LABEL: f4:
; CHECK: {{aebr|sebr}}
; CHECK: {{aebr|sebr}}
; CHECK: sfpc
; CHECK: sqebr
; CHECK: sqebr
; CHECK: br %r14

  ; Add and subtract are issued before the sfpc call ...
  %add = fadd float %f1, %f2
  %sub = fsub float %f3, %f4
  call void @llvm.s390.sfpc(i32 0)
  ; ... and both square roots after it.
  %sqrt1 = call float @llvm.sqrt.f32(float %f2)
  %sqrt2 = call float @llvm.sqrt.f32(float %f4)

  ; Addresses of float elements 1..3 relative to %ptr0 (element 0 is %ptr0).
  %ptr1 = getelementptr float, float *%ptr0, i64 1
  %ptr2 = getelementptr float, float *%ptr0, i64 2
  %ptr3 = getelementptr float, float *%ptr0, i64 3

  ; Store every result so that all four computations are used.
  store float %add, float *%ptr0
  store float %sub, float *%ptr1
  store float %sqrt1, float *%ptr2
  store float %sqrt2, float *%ptr3

  ret void
}
Allow target to handle STRICT floating-point nodes. The ISD::STRICT_ nodes used to implement the constrained floating-point intrinsics are currently never passed to the target back-end, which makes it impossible to handle them correctly (e.g. mark instructions as depending on a floating-point status and control register, or mark instructions as possibly trapping). This patch allows the target to use setOperationAction to switch the action on ISD::STRICT_ nodes to Legal. If this is done, the SelectionDAG common code will stop converting the STRICT nodes to regular floating-point nodes, but instead pass the STRICT nodes to the target using normal SelectionDAG matching rules. To avoid having the back-end duplicate all the floating-point instruction patterns to handle both strict and non-strict variants, we make the MI codegen explicitly aware of the floating-point exceptions by introducing two new concepts: - A new MCID flag "mayRaiseFPException" that the target should set on any instruction that possibly can raise an FP exception according to the architecture definition. - A new MI flag FPExcept that CodeGen/SelectionDAG will set on any MI instruction resulting from expansion of any constrained FP intrinsic. Any MI instruction that is both marked as mayRaiseFPException and FPExcept then needs to be considered as raising exceptions by MI-level codegen (e.g. scheduling). Setting those two new flags is straightforward. The mayRaiseFPException flag is simply set via TableGen by marking all relevant instruction patterns in the .td files. The FPExcept flag is set in SDNodeFlags when creating the STRICT_ nodes in the SelectionDAG, and gets inherited in the MachineSDNode nodes created from it during instruction selection. The flag is then transferred to an MIFlag when creating the MI from the MachineSDNode. This is handled just like fast-math flags like no-nans are handled today. 
This patch includes both common code changes required to implement the new features, and the SystemZ implementation. Reviewed By: andrew.w.kaylor Differential Revision: https://reviews.llvm.org/D55506 llvm-svn: 362663 2019-06-06 06:33:10 +08:00			`; Verify that strict FP operations are not rescheduled`
			`;`
			`; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 \| FileCheck %s`

			`declare float @llvm.experimental.constrained.fadd.f32(float, float, metadata, metadata)`
			`declare float @llvm.experimental.constrained.fsub.f32(float, float, metadata, metadata)`
			`declare float @llvm.experimental.constrained.sqrt.f32(float, metadata, metadata)`
			`declare float @llvm.sqrt.f32(float)`
			`declare void @llvm.s390.sfpc(i32)`

			`; For non-strict operations, we expect the post-RA scheduler to`
			`; separate the two square root instructions on z13.`
			`define void @f1(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {`
			`; CHECK-LABEL: f1:`
			`; CHECK: sqebr`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: sqebr`
			`; CHECK: br %r14`

			`%add = fadd float %f1, %f2`
			`%sub = fsub float %f3, %f4`
			`%sqrt1 = call float @llvm.sqrt.f32(float %f2)`
			`%sqrt2 = call float @llvm.sqrt.f32(float %f4)`

			`%ptr1 = getelementptr float, float *%ptr0, i64 1`
			`%ptr2 = getelementptr float, float *%ptr0, i64 2`
			`%ptr3 = getelementptr float, float *%ptr0, i64 3`

			`store float %add, float *%ptr0`
			`store float %sub, float *%ptr1`
			`store float %sqrt1, float *%ptr2`
			`store float %sqrt2, float *%ptr3`

			`ret void`
			`}`

			`; But for strict operations, this must not happen.`
			`define void @f2(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {`
			`; CHECK-LABEL: f2:`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: sqebr`
			`; CHECK: sqebr`
			`; CHECK: br %r14`

			`%add = call float @llvm.experimental.constrained.fadd.f32(`
			`float %f1, float %f2,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.strict")`
			`%sub = call float @llvm.experimental.constrained.fsub.f32(`
			`float %f3, float %f4,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.strict")`
			`%sqrt1 = call float @llvm.experimental.constrained.sqrt.f32(`
			`float %f2,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.strict")`
			`%sqrt2 = call float @llvm.experimental.constrained.sqrt.f32(`
			`float %f4,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.strict")`

			`%ptr1 = getelementptr float, float *%ptr0, i64 1`
			`%ptr2 = getelementptr float, float *%ptr0, i64 2`
			`%ptr3 = getelementptr float, float *%ptr0, i64 3`

			`store float %add, float *%ptr0`
			`store float %sub, float *%ptr1`
			`store float %sqrt1, float *%ptr2`
			`store float %sqrt2, float *%ptr3`

			`ret void`
			`}`

			`; On the other hand, strict operations that use the fpexcept.ignore`
			`; exception behaviour should be scheduled freely.`
			`define void @f3(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {`
			`; CHECK-LABEL: f3:`
			`; CHECK: sqebr`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: sqebr`
			`; CHECK: br %r14`

			`%add = call float @llvm.experimental.constrained.fadd.f32(`
			`float %f1, float %f2,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.ignore")`
			`%sub = call float @llvm.experimental.constrained.fsub.f32(`
			`float %f3, float %f4,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.ignore")`
			`%sqrt1 = call float @llvm.experimental.constrained.sqrt.f32(`
			`float %f2,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.ignore")`
			`%sqrt2 = call float @llvm.experimental.constrained.sqrt.f32(`
			`float %f4,`
			`metadata !"round.dynamic",`
			`metadata !"fpexcept.ignore")`

			`%ptr1 = getelementptr float, float *%ptr0, i64 1`
			`%ptr2 = getelementptr float, float *%ptr0, i64 2`
			`%ptr3 = getelementptr float, float *%ptr0, i64 3`

			`store float %add, float *%ptr0`
			`store float %sub, float *%ptr1`
			`store float %sqrt1, float *%ptr2`
			`store float %sqrt2, float *%ptr3`

			`ret void`
			`}`

			`; However, even non-strict operations must not be scheduled across an SFPC.`
			`define void @f4(float %f1, float %f2, float %f3, float %f4, float *%ptr0) {`
			`; CHECK-LABEL: f4:`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: {{aebr\|sebr}}`
			`; CHECK: sfpc`
			`; CHECK: sqebr`
			`; CHECK: sqebr`
			`; CHECK: br %r14`

			`%add = fadd float %f1, %f2`
			`%sub = fsub float %f3, %f4`
			`call void @llvm.s390.sfpc(i32 0)`
			`%sqrt1 = call float @llvm.sqrt.f32(float %f2)`
			`%sqrt2 = call float @llvm.sqrt.f32(float %f4)`

			`%ptr1 = getelementptr float, float *%ptr0, i64 1`
			`%ptr2 = getelementptr float, float *%ptr0, i64 2`
			`%ptr3 = getelementptr float, float *%ptr0, i64 3`

			`store float %add, float *%ptr0`
			`store float %sub, float *%ptr1`
			`store float %sqrt1, float *%ptr2`
			`store float %sqrt2, float *%ptr3`

			`ret void`
			`}`