forked from OSchip/llvm-project
110 lines
3.1 KiB
LLVM
110 lines
3.1 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefixes=ALL,SSE
|
|
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx | FileCheck %s --check-prefixes=ALL,AVX,AVX1
|
|
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx2 | FileCheck %s --check-prefixes=ALL,AVX,AVX2
|
|
|
|
define <8 x i32> @a(<8 x i32> %a) nounwind {
|
|
; SSE-LABEL: a:
|
|
; SSE: # %bb.0:
|
|
; SSE-NEXT: pslld $16, %xmm0
|
|
; SSE-NEXT: psrad $16, %xmm0
|
|
; SSE-NEXT: pslld $16, %xmm1
|
|
; SSE-NEXT: psrad $16, %xmm1
|
|
; SSE-NEXT: retq
|
|
;
|
|
; AVX1-LABEL: a:
|
|
; AVX1: # %bb.0:
|
|
; AVX1-NEXT: vpslld $16, %xmm0, %xmm1
|
|
; AVX1-NEXT: vpsrad $16, %xmm1, %xmm1
|
|
; AVX1-NEXT: vextractf128 $1, %ymm0, %xmm0
|
|
; AVX1-NEXT: vpslld $16, %xmm0, %xmm0
|
|
; AVX1-NEXT: vpsrad $16, %xmm0, %xmm0
|
|
; AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm1, %ymm0
|
|
; AVX1-NEXT: retq
|
|
;
|
|
; AVX2-LABEL: a:
|
|
; AVX2: # %bb.0:
|
|
; AVX2-NEXT: vpslld $16, %ymm0, %ymm0
|
|
; AVX2-NEXT: vpsrad $16, %ymm0, %ymm0
|
|
; AVX2-NEXT: retq
|
|
%b = trunc <8 x i32> %a to <8 x i16>
|
|
%c = sext <8 x i16> %b to <8 x i32>
|
|
ret <8 x i32> %c
|
|
}
|
|
|
|
define <3 x i32> @b(<3 x i32> %a) nounwind {
|
|
; SSE-LABEL: b:
|
|
; SSE: # %bb.0:
|
|
; SSE-NEXT: pslld $16, %xmm0
|
|
; SSE-NEXT: psrad $16, %xmm0
|
|
; SSE-NEXT: retq
|
|
;
|
|
; AVX-LABEL: b:
|
|
; AVX: # %bb.0:
|
|
; AVX-NEXT: vpslld $16, %xmm0, %xmm0
|
|
; AVX-NEXT: vpsrad $16, %xmm0, %xmm0
|
|
; AVX-NEXT: retq
|
|
%b = trunc <3 x i32> %a to <3 x i16>
|
|
%c = sext <3 x i16> %b to <3 x i32>
|
|
ret <3 x i32> %c
|
|
}
|
|
|
|
define <1 x i32> @c(<1 x i32> %a) nounwind {
|
|
; ALL-LABEL: c:
|
|
; ALL: # %bb.0:
|
|
; ALL-NEXT: movswl %di, %eax
|
|
; ALL-NEXT: retq
|
|
%b = trunc <1 x i32> %a to <1 x i16>
|
|
%c = sext <1 x i16> %b to <1 x i32>
|
|
ret <1 x i32> %c
|
|
}
|
|
|
|
define <8 x i32> @d(<8 x i32> %a) nounwind {
|
|
; SSE-LABEL: d:
|
|
; SSE: # %bb.0:
|
|
; SSE-NEXT: movaps {{.*#+}} xmm2 = [65535,0,65535,0,65535,0,65535,0]
|
|
; SSE-NEXT: andps %xmm2, %xmm0
|
|
; SSE-NEXT: andps %xmm2, %xmm1
|
|
; SSE-NEXT: retq
|
|
;
|
|
; AVX1-LABEL: d:
|
|
; AVX1: # %bb.0:
|
|
; AVX1-NEXT: vandps {{.*}}(%rip), %ymm0, %ymm0
|
|
; AVX1-NEXT: retq
|
|
;
|
|
; AVX2-LABEL: d:
|
|
; AVX2: # %bb.0:
|
|
; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1
|
|
; AVX2-NEXT: vpblendw {{.*#+}} ymm0 = ymm0[0],ymm1[1],ymm0[2],ymm1[3],ymm0[4],ymm1[5],ymm0[6],ymm1[7],ymm0[8],ymm1[9],ymm0[10],ymm1[11],ymm0[12],ymm1[13],ymm0[14],ymm1[15]
|
|
; AVX2-NEXT: retq
|
|
%b = trunc <8 x i32> %a to <8 x i16>
|
|
%c = zext <8 x i16> %b to <8 x i32>
|
|
ret <8 x i32> %c
|
|
}
|
|
|
|
define <3 x i32> @e(<3 x i32> %a) nounwind {
|
|
; SSE-LABEL: e:
|
|
; SSE: # %bb.0:
|
|
; SSE-NEXT: andps {{.*}}(%rip), %xmm0
|
|
; SSE-NEXT: retq
|
|
;
|
|
; AVX-LABEL: e:
|
|
; AVX: # %bb.0:
|
|
; AVX-NEXT: vpxor %xmm1, %xmm1, %xmm1
|
|
; AVX-NEXT: vpblendw {{.*#+}} xmm0 = xmm0[0],xmm1[1],xmm0[2],xmm1[3],xmm0[4],xmm1[5],xmm0[6,7]
|
|
; AVX-NEXT: retq
|
|
%b = trunc <3 x i32> %a to <3 x i16>
|
|
%c = zext <3 x i16> %b to <3 x i32>
|
|
ret <3 x i32> %c
|
|
}
|
|
|
|
define <1 x i32> @f(<1 x i32> %a) nounwind {
|
|
; ALL-LABEL: f:
|
|
; ALL: # %bb.0:
|
|
; ALL-NEXT: movzwl %di, %eax
|
|
; ALL-NEXT: retq
|
|
%b = trunc <1 x i32> %a to <1 x i16>
|
|
%c = zext <1 x i16> %b to <1 x i32>
|
|
ret <1 x i32> %c
|
|
}
|