From 78309ebef4a35700597bde2cca3052f9c600a0bb Mon Sep 17 00:00:00 2001 From: David Green Date: Fri, 2 Jul 2021 17:03:49 +0100 Subject: [PATCH] [AArch64] Neon saturated truncate tests. NFC --- llvm/test/CodeGen/AArch64/qmovn.ll | 162 +++++++++++++++++++++++++++++ 1 file changed, 162 insertions(+) create mode 100644 llvm/test/CodeGen/AArch64/qmovn.ll diff --git a/llvm/test/CodeGen/AArch64/qmovn.ll b/llvm/test/CodeGen/AArch64/qmovn.ll new file mode 100644 index 000000000000..515f4d5bd114 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/qmovn.ll @@ -0,0 +1,162 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=aarch64-none-none-eabi -verify-machineinstrs %s -o - | FileCheck %s + +define <4 x i16> @vqmovni32_smaxmin(<4 x i32> %s0) { +; CHECK-LABEL: vqmovni32_smaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: movi v1.4s, #127, msl #8 +; CHECK-NEXT: smin v0.4s, v0.4s, v1.4s +; CHECK-NEXT: mvni v1.4s, #127, msl #8 +; CHECK-NEXT: smax v0.4s, v0.4s, v1.4s +; CHECK-NEXT: xtn v0.4h, v0.4s +; CHECK-NEXT: ret +entry: + %c1 = icmp slt <4 x i32> %s0, + %s1 = select <4 x i1> %c1, <4 x i32> %s0, <4 x i32> + %c2 = icmp sgt <4 x i32> %s1, + %s2 = select <4 x i1> %c2, <4 x i32> %s1, <4 x i32> + %t = trunc <4 x i32> %s2 to <4 x i16> + ret <4 x i16> %t +} + +define <4 x i16> @vqmovni32_sminmax(<4 x i32> %s0) { +; CHECK-LABEL: vqmovni32_sminmax: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mvni v1.4s, #127, msl #8 +; CHECK-NEXT: smax v0.4s, v0.4s, v1.4s +; CHECK-NEXT: movi v1.4s, #127, msl #8 +; CHECK-NEXT: smin v0.4s, v0.4s, v1.4s +; CHECK-NEXT: xtn v0.4h, v0.4s +; CHECK-NEXT: ret +entry: + %c1 = icmp sgt <4 x i32> %s0, + %s1 = select <4 x i1> %c1, <4 x i32> %s0, <4 x i32> + %c2 = icmp slt <4 x i32> %s1, + %s2 = select <4 x i1> %c2, <4 x i32> %s1, <4 x i32> + %t = trunc <4 x i32> %s2 to <4 x i16> + ret <4 x i16> %t +} + +define <4 x i16> @vqmovni32_umaxmin(<4 x i32> %s0) { +; CHECK-LABEL: vqmovni32_umaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: movi v1.2d, #0x00ffff0000ffff +; CHECK-NEXT: umin v0.4s, v0.4s, v1.4s +; CHECK-NEXT: xtn v0.4h, v0.4s +; CHECK-NEXT: ret +entry: + %c1 = icmp ult <4 x i32> %s0, + %s1 = select <4 x i1> %c1, <4 x i32> %s0, <4 x i32> + %t = trunc <4 x i32> %s1 to <4 x i16> + ret <4 x i16> %t +} + +define <8 x i8> @vqmovni16_smaxmin(<8 x i16> %s0) { +; CHECK-LABEL: vqmovni16_smaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: movi v1.8h, #127 +; CHECK-NEXT: smin v0.8h, v0.8h, v1.8h +; CHECK-NEXT: mvni v1.8h, #127 +; CHECK-NEXT: smax v0.8h, v0.8h, v1.8h +; CHECK-NEXT: xtn v0.8b, v0.8h +; CHECK-NEXT: ret +entry: + %c1 = icmp slt <8 x i16> %s0, + %s1 = select <8 x i1> %c1, <8 x i16> %s0, <8 x i16> + %c2 = icmp sgt <8 x i16> %s1, + %s2 = select <8 x i1> %c2, <8 x i16> %s1, <8 x i16> + %t = trunc <8 x i16> %s2 to <8 x i8> + ret <8 x i8> %t +} + +define <8 x i8> @vqmovni16_sminmax(<8 x i16> %s0) { +; CHECK-LABEL: vqmovni16_sminmax: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mvni v1.8h, #127 +; CHECK-NEXT: smax v0.8h, v0.8h, v1.8h +; CHECK-NEXT: movi v1.8h, #127 +; CHECK-NEXT: smin v0.8h, v0.8h, v1.8h +; CHECK-NEXT: xtn v0.8b, v0.8h +; CHECK-NEXT: ret +entry: + %c1 = icmp sgt <8 x i16> %s0, + %s1 = select <8 x i1> %c1, <8 x i16> %s0, <8 x i16> + %c2 = icmp slt <8 x i16> %s1, + %s2 = select <8 x i1> %c2, <8 x i16> %s1, <8 x i16> + %t = trunc <8 x i16> %s2 to <8 x i8> + ret <8 x i8> %t +} + +define <8 x i8> @vqmovni16_umaxmin(<8 x i16> %s0) { +; CHECK-LABEL: vqmovni16_umaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: movi v1.2d, #0xff00ff00ff00ff +; CHECK-NEXT: umin v0.8h, v0.8h, v1.8h +; CHECK-NEXT: xtn v0.8b, v0.8h +; CHECK-NEXT: ret +entry: + %c1 = icmp ult <8 x i16> %s0, + %s1 = select <8 x i1> %c1, <8 x i16> %s0, <8 x i16> + %t = trunc <8 x i16> %s1 to <8 x i8> + ret <8 x i8> %t +} + +define <2 x i32> @vqmovni64_smaxmin(<2 x i64> %s0) { +; CHECK-LABEL: vqmovni64_smaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mov w8, #2147483647 +; CHECK-NEXT: dup v1.2d, x8 +; CHECK-NEXT: mov x9, #-2147483648 +; CHECK-NEXT: cmgt v2.2d, v1.2d, v0.2d +; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b +; CHECK-NEXT: dup v1.2d, x9 +; CHECK-NEXT: cmgt v2.2d, v0.2d, v1.2d +; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b +; CHECK-NEXT: xtn v0.2s, v0.2d +; CHECK-NEXT: ret +entry: + %c1 = icmp slt <2 x i64> %s0, + %s1 = select <2 x i1> %c1, <2 x i64> %s0, <2 x i64> + %c2 = icmp sgt <2 x i64> %s1, + %s2 = select <2 x i1> %c2, <2 x i64> %s1, <2 x i64> + %t = trunc <2 x i64> %s2 to <2 x i32> + ret <2 x i32> %t +} + +define <2 x i32> @vqmovni64_sminmax(<2 x i64> %s0) { +; CHECK-LABEL: vqmovni64_sminmax: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mov x8, #-2147483648 +; CHECK-NEXT: dup v1.2d, x8 +; CHECK-NEXT: mov w9, #2147483647 +; CHECK-NEXT: cmgt v2.2d, v0.2d, v1.2d +; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b +; CHECK-NEXT: dup v1.2d, x9 +; CHECK-NEXT: cmgt v2.2d, v1.2d, v0.2d +; CHECK-NEXT: bif v0.16b, v1.16b, v2.16b +; CHECK-NEXT: xtn v0.2s, v0.2d +; CHECK-NEXT: ret +entry: + %c1 = icmp sgt <2 x i64> %s0, + %s1 = select <2 x i1> %c1, <2 x i64> %s0, <2 x i64> + %c2 = icmp slt <2 x i64> %s1, + %s2 = select <2 x i1> %c2, <2 x i64> %s1, <2 x i64> + %t = trunc <2 x i64> %s2 to <2 x i32> + ret <2 x i32> %t +} + +define <2 x i32> @vqmovni64_umaxmin(<2 x i64> %s0) { +; CHECK-LABEL: vqmovni64_umaxmin: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: movi v1.2d, #0x000000ffffffff +; CHECK-NEXT: cmhi v1.2d, v1.2d, v0.2d +; CHECK-NEXT: and v0.16b, v0.16b, v1.16b +; CHECK-NEXT: orn v0.16b, v0.16b, v1.16b +; CHECK-NEXT: xtn v0.2s, v0.2d +; CHECK-NEXT: ret +entry: + %c1 = icmp ult <2 x i64> %s0, + %s1 = select <2 x i1> %c1, <2 x i64> %s0, <2 x i64> + %t = trunc <2 x i64> %s1 to <2 x i32> + ret <2 x i32> %t +}