llvm-project/llvm/test/CodeGen/PowerPC/qpx-rounding-ops.ll

; Exercises lowering of the vector rounding intrinsics (floor, nearbyint, ceil,
; trunc) on <4 x float> and <4 x double> when compiling for -mcpu=a2q.
; The input is compiled twice: once with default options and once with
; -enable-unsafe-fp-math. Each invocation is verified under its own FileCheck
; prefix.
; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=a2q | FileCheck %s
; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=a2q -enable-unsafe-fp-math | FileCheck -check-prefix=CHECK-FM %s
target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
target triple = "powerpc64-unknown-linux-gnu"

; Floor of a <4 x float> vector: both llc invocations are expected to emit
; "qvfrim 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x float> @test1(<4 x float> %x) nounwind {
  %call = tail call <4 x float> @llvm.floor.v4f32(<4 x float> %x) nounwind readnone
  ret <4 x float> %call

; CHECK-LABEL: test1:
; CHECK: qvfrim 1, 1

; CHECK-FM-LABEL: test1:
; CHECK-FM: qvfrim 1, 1
}

declare <4 x float> @llvm.floor.v4f32(<4 x float>) nounwind readnone

; Floor of a <4 x double> vector: both llc invocations are expected to emit
; "qvfrim 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x double> @test2(<4 x double> %x) nounwind {
  %call = tail call <4 x double> @llvm.floor.v4f64(<4 x double> %x) nounwind readnone
  ret <4 x double> %call

; CHECK-LABEL: test2:
; CHECK: qvfrim 1, 1

; CHECK-FM-LABEL: test2:
; CHECK-FM: qvfrim 1, 1
}

declare <4 x double> @llvm.floor.v4f64(<4 x double>) nounwind readnone

; nearbyint of a <4 x float> vector: neither llc invocation may emit qvfrin
; for this function. The function-name anchors use the LABEL form of the check
; directive so the negative match is bounded by this function's output.
define <4 x float> @test3(<4 x float> %x) nounwind {
  %call = tail call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %x) nounwind readnone
  ret <4 x float> %call

; CHECK-LABEL: test3:
; CHECK-NOT: qvfrin

; CHECK-FM-LABEL: test3:
; CHECK-FM-NOT: qvfrin
}

declare <4 x float> @llvm.nearbyint.v4f32(<4 x float>) nounwind readnone

; nearbyint of a <4 x double> vector: neither llc invocation may emit qvfrin
; for this function. The function-name anchors use the LABEL form of the check
; directive so the negative match is bounded by this function's output.
define <4 x double> @test4(<4 x double> %x) nounwind {
  %call = tail call <4 x double> @llvm.nearbyint.v4f64(<4 x double> %x) nounwind readnone
  ret <4 x double> %call

; CHECK-LABEL: test4:
; CHECK-NOT: qvfrin

; CHECK-FM-LABEL: test4:
; CHECK-FM-NOT: qvfrin
}

declare <4 x double> @llvm.nearbyint.v4f64(<4 x double>) nounwind readnone

; Ceil of a <4 x float> vector: both llc invocations are expected to emit
; "qvfrip 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x float> @test5(<4 x float> %x) nounwind {
  %call = tail call <4 x float> @llvm.ceil.v4f32(<4 x float> %x) nounwind readnone
  ret <4 x float> %call

; CHECK-LABEL: test5:
; CHECK: qvfrip 1, 1

; CHECK-FM-LABEL: test5:
; CHECK-FM: qvfrip 1, 1
}

declare <4 x float> @llvm.ceil.v4f32(<4 x float>) nounwind readnone

; Ceil of a <4 x double> vector: both llc invocations are expected to emit
; "qvfrip 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x double> @test6(<4 x double> %x) nounwind {
  %call = tail call <4 x double> @llvm.ceil.v4f64(<4 x double> %x) nounwind readnone
  ret <4 x double> %call

; CHECK-LABEL: test6:
; CHECK: qvfrip 1, 1

; CHECK-FM-LABEL: test6:
; CHECK-FM: qvfrip 1, 1
}

declare <4 x double> @llvm.ceil.v4f64(<4 x double>) nounwind readnone

; Trunc of a <4 x float> vector: both llc invocations are expected to emit
; "qvfriz 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x float> @test9(<4 x float> %x) nounwind {
  %call = tail call <4 x float> @llvm.trunc.v4f32(<4 x float> %x) nounwind readnone
  ret <4 x float> %call

; CHECK-LABEL: test9:
; CHECK: qvfriz 1, 1

; CHECK-FM-LABEL: test9:
; CHECK-FM: qvfriz 1, 1
}

declare <4 x float> @llvm.trunc.v4f32(<4 x float>) nounwind readnone

; Trunc of a <4 x double> vector: both llc invocations are expected to emit
; "qvfriz 1, 1". The function-name anchors use the LABEL form of the check
; directive so the instruction match is confined to this function's output.
define <4 x double> @test10(<4 x double> %x) nounwind {
  %call = tail call <4 x double> @llvm.trunc.v4f64(<4 x double> %x) nounwind readnone
  ret <4 x double> %call

; CHECK-LABEL: test10:
; CHECK: qvfriz 1, 1

; CHECK-FM-LABEL: test10:
; CHECK-FM: qvfriz 1, 1
}

declare <4 x double> @llvm.trunc.v4f64(<4 x double>) nounwind readnone
Adding -verify-machineinstrs option to PowerPC tests Currently we have a number of tests that fail with -verify-machineinstrs. To detect this cases earlier we add the option to the testcases with the exception of tests that will currently fail with this option. PR 27456 keeps track of this failures. No code review, as discussed with Hal Finkel. llvm-svn: 277624 2016-08-04 02:17:35 +08:00			`; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=a2q \| FileCheck %s`
			`; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=a2q -enable-unsafe-fp-math \| FileCheck -check-prefix=CHECK-FM %s`
[PowerPC] Add support for the QPX vector instruction set This adds support for the QPX vector instruction set, which is used by the enhanced A2 cores on the IBM BG/Q supercomputers. QPX vectors are 256 bytes wide, holding 4 double-precision floating-point values. Boolean values, modeled here as <4 x i1> are actually also represented as floating-point values (essentially { -1, 1 } for { false, true }). QPX shares many features with Altivec and VSX, but is distinct from both of them. One major difference is that, instead of adding completely-separate vector registers, QPX vector registers are extensions of the scalar floating-point registers (lane 0 is the corresponding scalar floating-point value). The operations supported on QPX vectors mirrors that supported on the scalar floating-point values (with some additional ones for permutations and logical/comparison operations). I've been maintaining this support out-of-tree, as part of the bgclang project, for several years. This is not the entire bgclang patch set, but is most of the subset that can be cleanly integrated into LLVM proper at this time. Adding this to the LLVM backend is part of my efforts to rebase bgclang to the current LLVM trunk, but is independently useful (especially for codes that use LLVM as a JIT in library form). The assembler/disassembler test coverage is complete. The CodeGen test coverage is not, but I've included some tests, and more will be added as follow-up work. llvm-svn: 230413 2015-02-25 09:06:45 +08:00			`target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"`
			`target triple = "powerpc64-unknown-linux-gnu"`

			`define <4 x float> @test1(<4 x float> %x) nounwind {`
			`%call = tail call <4 x float> @llvm.floor.v4f32(<4 x float> %x) nounwind readnone`
			`ret <4 x float> %call`

			`; CHECK: test1:`
			`; CHECK: qvfrim 1, 1`

			`; CHECK-FM: test1:`
			`; CHECK-FM: qvfrim 1, 1`
			`}`

			`declare <4 x float> @llvm.floor.v4f32(<4 x float>) nounwind readnone`

			`define <4 x double> @test2(<4 x double> %x) nounwind {`
			`%call = tail call <4 x double> @llvm.floor.v4f64(<4 x double> %x) nounwind readnone`
			`ret <4 x double> %call`

			`; CHECK: test2:`
			`; CHECK: qvfrim 1, 1`

			`; CHECK-FM: test2:`
			`; CHECK-FM: qvfrim 1, 1`
			`}`

			`declare <4 x double> @llvm.floor.v4f64(<4 x double>) nounwind readnone`

			`define <4 x float> @test3(<4 x float> %x) nounwind {`
			`%call = tail call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %x) nounwind readnone`
			`ret <4 x float> %call`

			`; CHECK: test3:`
			`; CHECK-NOT: qvfrin`

			`; CHECK-FM: test3:`
			`; CHECK-FM-NOT: qvfrin`
			`}`

			`declare <4 x float> @llvm.nearbyint.v4f32(<4 x float>) nounwind readnone`

			`define <4 x double> @test4(<4 x double> %x) nounwind {`
			`%call = tail call <4 x double> @llvm.nearbyint.v4f64(<4 x double> %x) nounwind readnone`
			`ret <4 x double> %call`

			`; CHECK: test4:`
			`; CHECK-NOT: qvfrin`

			`; CHECK-FM: test4:`
			`; CHECK-FM-NOT: qvfrin`
			`}`

			`declare <4 x double> @llvm.nearbyint.v4f64(<4 x double>) nounwind readnone`

			`define <4 x float> @test5(<4 x float> %x) nounwind {`
			`%call = tail call <4 x float> @llvm.ceil.v4f32(<4 x float> %x) nounwind readnone`
			`ret <4 x float> %call`

			`; CHECK: test5:`
			`; CHECK: qvfrip 1, 1`

			`; CHECK-FM: test5:`
			`; CHECK-FM: qvfrip 1, 1`
			`}`

			`declare <4 x float> @llvm.ceil.v4f32(<4 x float>) nounwind readnone`

			`define <4 x double> @test6(<4 x double> %x) nounwind {`
			`%call = tail call <4 x double> @llvm.ceil.v4f64(<4 x double> %x) nounwind readnone`
			`ret <4 x double> %call`

			`; CHECK: test6:`
			`; CHECK: qvfrip 1, 1`

			`; CHECK-FM: test6:`
			`; CHECK-FM: qvfrip 1, 1`
			`}`

			`declare <4 x double> @llvm.ceil.v4f64(<4 x double>) nounwind readnone`

			`define <4 x float> @test9(<4 x float> %x) nounwind {`
			`%call = tail call <4 x float> @llvm.trunc.v4f32(<4 x float> %x) nounwind readnone`
			`ret <4 x float> %call`

			`; CHECK: test9:`
			`; CHECK: qvfriz 1, 1`

			`; CHECK-FM: test9:`
			`; CHECK-FM: qvfriz 1, 1`
			`}`

			`declare <4 x float> @llvm.trunc.v4f32(<4 x float>) nounwind readnone`

			`define <4 x double> @test10(<4 x double> %x) nounwind {`
			`%call = tail call <4 x double> @llvm.trunc.v4f64(<4 x double> %x) nounwind readnone`
			`ret <4 x double> %call`

			`; CHECK: test10:`
			`; CHECK: qvfriz 1, 1`

			`; CHECK-FM: test10:`
			`; CHECK-FM: qvfriz 1, 1`
			`}`

			`declare <4 x double> @llvm.trunc.v4f64(<4 x double>) nounwind readnone`