2016-07-09 08:19:07 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
2015-10-08 20:55:01 +08:00
|
|
|
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=skx | FileCheck --check-prefix=SKX %s
|
|
|
|
|
|
|
|
|
|
|
|
define <8 x i16> @extract_subvector128_v32i16(<32 x i16> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector128_v32i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $2, %zmm0, %xmm0
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <32 x i16> %x, <32 x i16> undef, <8 x i32> <i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23>
|
|
|
|
ret <8 x i16> %r1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <8 x i16> @extract_subvector128_v32i16_first_element(<32 x i16> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector128_v32i16_first_element:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-12-07 18:40:31 +08:00
|
|
|
; SKX-NEXT: ## kill: def %xmm0 killed %xmm0 killed %zmm0
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <32 x i16> %x, <32 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
ret <8 x i16> %r1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <16 x i8> @extract_subvector128_v64i8(<64 x i8> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector128_v64i8:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $2, %zmm0, %xmm0
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <64 x i8> %x, <64 x i8> undef, <16 x i32> <i32 32, i32 33, i32 34, i32 35, i32 36, i32 37, i32 38,i32 39, i32 40, i32 41, i32 42, i32 43, i32 44, i32 45, i32 46, i32 47>
|
|
|
|
ret <16 x i8> %r1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <16 x i8> @extract_subvector128_v64i8_first_element(<64 x i8> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector128_v64i8_first_element:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-12-07 18:40:31 +08:00
|
|
|
; SKX-NEXT: ## kill: def %xmm0 killed %xmm0 killed %zmm0
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <64 x i8> %x, <64 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
ret <16 x i8> %r1
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
define <16 x i16> @extract_subvector256_v32i16(<32 x i16> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector256_v32i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf64x4 $1, %zmm0, %ymm0
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <32 x i16> %x, <32 x i16> undef, <16 x i32> <i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31>
|
|
|
|
ret <16 x i16> %r1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <32 x i8> @extract_subvector256_v64i8(<64 x i8> %x) nounwind {
|
|
|
|
; SKX-LABEL: extract_subvector256_v64i8:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0:
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf64x4 $1, %zmm0, %ymm0
|
2015-10-08 20:55:01 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
%r1 = shufflevector <64 x i8> %x, <64 x i8> undef, <32 x i32> <i32 32, i32 33, i32 34, i32 35, i32 36, i32 37, i32 38, i32 39, i32 40, i32 41, i32 42, i32 43, i32 44, i32 45, i32 46, i32 47, i32 48, i32 49, i32 50, i32 51, i32 52, i32 53, i32 54, i32 55, i32 56, i32 57, i32 58, i32 59, i32 60, i32 61, i32 62, i32 63>
|
|
|
|
ret <32 x i8> %r1
|
|
|
|
}
|
2016-05-22 06:50:14 +08:00
|
|
|
|
|
|
|
define void @extract_subvector256_v8f64_store(double* nocapture %addr, <4 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v8f64_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-01-03 13:46:18 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x double> %a, <4 x double> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%1 = bitcast double* %addr to <2 x double>*
|
|
|
|
store <2 x double> %0, <2 x double>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector256_v8f32_store(float* nocapture %addr, <8 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v8f32_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-01-03 13:46:18 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x float> %a, <8 x float> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast float* %addr to <4 x float>*
|
|
|
|
store <4 x float> %0, <4 x float>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector256_v4i64_store(i64* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4i64_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x i64> %a, <4 x i64> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%1 = bitcast i64* %addr to <2 x i64>*
|
|
|
|
store <2 x i64> %0, <2 x i64>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector256_v8i32_store(i32* nocapture %addr, <8 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v8i32_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i32> %a, <8 x i32> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i32* %addr to <4 x i32>*
|
|
|
|
store <4 x i32> %0, <4 x i32>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector256_v16i16_store(i16* nocapture %addr, <16 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v16i16_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i16> %a, <16 x i16> undef, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i16* %addr to <8 x i16>*
|
|
|
|
store <8 x i16> %0, <8 x i16>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector256_v32i8_store(i8* nocapture %addr, <32 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v32i8_store:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-08-01 06:07:29 +08:00
|
|
|
; SKX-NEXT: vextractf128 $1, %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-22 06:50:14 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i8> %a, <32 x i8> undef, <16 x i32> <i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31>
|
|
|
|
%1 = bitcast i8* %addr to <16 x i8>*
|
|
|
|
store <16 x i8> %0, <16 x i8>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
2016-05-23 07:44:33 +08:00
|
|
|
|
|
|
|
define void @extract_subvector256_v4f64_store_lo(double* nocapture %addr, <4 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4f64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 04:20:01 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x double> %a, <4 x double> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast double* %addr to <2 x double>*
|
|
|
|
store <2 x double> %0, <2 x double>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v4f64_store_lo_align_16(double* nocapture %addr, <4 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4f64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x double> %a, <4 x double> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast double* %addr to <2 x double>*
|
|
|
|
store <2 x double> %0, <2 x double>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector256_v4f32_store_lo(float* nocapture %addr, <8 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4f32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x float> %a, <8 x float> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast float* %addr to <4 x float>*
|
|
|
|
store <4 x float> %0, <4 x float>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v4f32_store_lo_align_16(float* nocapture %addr, <8 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4f32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x float> %a, <8 x float> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast float* %addr to <4 x float>*
|
|
|
|
store <4 x float> %0, <4 x float>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector256_v2i64_store_lo(i64* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v2i64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x i64> %a, <4 x i64> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast i64* %addr to <2 x i64>*
|
|
|
|
store <2 x i64> %0, <2 x i64>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v2i64_store_lo_align_16(i64* nocapture %addr, <4 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v2i64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <4 x i64> %a, <4 x i64> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast i64* %addr to <2 x i64>*
|
|
|
|
store <2 x i64> %0, <2 x i64>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector256_v4i32_store_lo(i32* nocapture %addr, <8 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4i32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i32> %a, <8 x i32> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i32* %addr to <4 x i32>*
|
|
|
|
store <4 x i32> %0, <4 x i32>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v4i32_store_lo_align_16(i32* nocapture %addr, <8 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v4i32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i32> %a, <8 x i32> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i32* %addr to <4 x i32>*
|
|
|
|
store <4 x i32> %0, <4 x i32>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector256_v8i16_store_lo(i16* nocapture %addr, <16 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v8i16_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i16> %a, <16 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i16* %addr to <8 x i16>*
|
|
|
|
store <8 x i16> %0, <8 x i16>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v8i16_store_lo_align_16(i16* nocapture %addr, <16 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v8i16_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i16> %a, <16 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i16* %addr to <8 x i16>*
|
|
|
|
store <8 x i16> %0, <8 x i16>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector256_v16i8_store_lo(i8* nocapture %addr, <32 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v16i8_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i8> %a, <32 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i8* %addr to <16 x i8>*
|
|
|
|
store <16 x i8> %0, <16 x i8>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector256_v16i8_store_lo_align_16(i8* nocapture %addr, <32 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector256_v16i8_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i8> %a, <32 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i8* %addr to <16 x i8>*
|
|
|
|
store <16 x i8> %0, <16 x i8>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v2f64_store_lo(double* nocapture %addr, <8 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v2f64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 04:20:01 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x double> %a, <8 x double> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast double* %addr to <2 x double>*
|
|
|
|
store <2 x double> %0, <2 x double>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector512_v2f64_store_lo_align_16(double* nocapture %addr, <8 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v2f64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x double> %a, <8 x double> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast double* %addr to <2 x double>*
|
|
|
|
store <2 x double> %0, <2 x double>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v4f32_store_lo(float* nocapture %addr, <16 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4f32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x float> %a, <16 x float> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast float* %addr to <4 x float>*
|
|
|
|
store <4 x float> %0, <4 x float>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector512_v4f32_store_lo_align_16(float* nocapture %addr, <16 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4f32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x float> %a, <16 x float> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast float* %addr to <4 x float>*
|
|
|
|
store <4 x float> %0, <4 x float>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v2i64_store_lo(i64* nocapture %addr, <8 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v2i64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i64> %a, <8 x i64> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast i64* %addr to <2 x i64>*
|
|
|
|
store <2 x i64> %0, <2 x i64>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector512_v2i64_store_lo_align_16(i64* nocapture %addr, <8 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v2i64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i64> %a, <8 x i64> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = bitcast i64* %addr to <2 x i64>*
|
|
|
|
store <2 x i64> %0, <2 x i64>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v4i32_store_lo(i32* nocapture %addr, <16 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4i32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i32> %a, <16 x i32> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i32* %addr to <4 x i32>*
|
|
|
|
store <4 x i32> %0, <4 x i32>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector512_v4i32_store_lo_align_16(i32* nocapture %addr, <16 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4i32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i32> %a, <16 x i32> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i32* %addr to <4 x i32>*
|
|
|
|
store <4 x i32> %0, <4 x i32>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v8i16_store_lo(i16* nocapture %addr, <32 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8i16_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i16> %a, <32 x i16> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i16* %addr to <8 x i16>*
|
|
|
|
store <8 x i16> %0, <8 x i16>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v16i8_store_lo(i8* nocapture %addr, <64 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v16i8_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <64 x i8> %a, <64 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i8* %addr to <16 x i8>*
|
|
|
|
store <16 x i8> %0, <16 x i8>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:38:47 +08:00
|
|
|
define void @extract_subvector512_v16i8_store_lo_align_16(i8* nocapture %addr, <64 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v16i8_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: vmovaps %xmm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:38:47 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <64 x i8> %a, <64 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i8* %addr to <16 x i8>*
|
|
|
|
store <16 x i8> %0, <16 x i8>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v4f64_store_lo(double* nocapture %addr, <8 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4f64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 04:20:01 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x double> %a, <8 x double> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast double* %addr to <4 x double>*
|
|
|
|
store <4 x double> %0, <4 x double>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v4f64_store_lo_align_16(double* nocapture %addr, <8 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4f64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:57 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x double> %a, <8 x double> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast double* %addr to <4 x double>*
|
|
|
|
store <4 x double> %0, <4 x double>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v4f64_store_lo_align_32(double* nocapture %addr, <8 x double> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4f64_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x double> %a, <8 x double> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast double* %addr to <4 x double>*
|
|
|
|
store <4 x double> %0, <4 x double>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v8f32_store_lo(float* nocapture %addr, <16 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8f32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x float> %a, <16 x float> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast float* %addr to <8 x float>*
|
|
|
|
store <8 x float> %0, <8 x float>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v8f32_store_lo_align_16(float* nocapture %addr, <16 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8f32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-08-20 06:02:02 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x float> %a, <16 x float> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast float* %addr to <8 x float>*
|
|
|
|
store <8 x float> %0, <8 x float>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v8f32_store_lo_align_32(float* nocapture %addr, <16 x float> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8f32_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x float> %a, <16 x float> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast float* %addr to <8 x float>*
|
|
|
|
store <8 x float> %0, <8 x float>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v4i64_store_lo(i64* nocapture %addr, <8 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4i64_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i64> %a, <8 x i64> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i64* %addr to <4 x i64>*
|
|
|
|
store <4 x i64> %0, <4 x i64>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v4i64_store_lo_align_16(i64* nocapture %addr, <8 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4i64_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:57 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i64> %a, <8 x i64> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i64* %addr to <4 x i64>*
|
|
|
|
store <4 x i64> %0, <4 x i64>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v4i64_store_lo_align_32(i64* nocapture %addr, <8 x i64> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v4i64_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <8 x i64> %a, <8 x i64> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = bitcast i64* %addr to <4 x i64>*
|
|
|
|
store <4 x i64> %0, <4 x i64>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v8i32_store_lo(i32* nocapture %addr, <16 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8i32_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i32> %a, <16 x i32> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i32* %addr to <8 x i32>*
|
|
|
|
store <8 x i32> %0, <8 x i32>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v8i32_store_lo_align_16(i32* nocapture %addr, <16 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8i32_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:57 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i32> %a, <16 x i32> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i32* %addr to <8 x i32>*
|
|
|
|
store <8 x i32> %0, <8 x i32>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v8i32_store_lo_align_32(i32* nocapture %addr, <16 x i32> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v8i32_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <16 x i32> %a, <16 x i32> undef, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i32* %addr to <8 x i32>*
|
|
|
|
store <8 x i32> %0, <8 x i32>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v16i16_store_lo(i16* nocapture %addr, <32 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v16i16_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i16> %a, <32 x i16> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i16* %addr to <16 x i16>*
|
|
|
|
store <16 x i16> %0, <16 x i16>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v16i16_store_lo_align_16(i16* nocapture %addr, <32 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v16i16_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:57 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i16> %a, <32 x i16> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i16* %addr to <16 x i16>*
|
|
|
|
store <16 x i16> %0, <16 x i16>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v16i16_store_lo_align_32(i16* nocapture %addr, <32 x i16> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v16i16_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <32 x i16> %a, <32 x i16> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%1 = bitcast i16* %addr to <16 x i16>*
|
|
|
|
store <16 x i16> %0, <16 x i16>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-05-23 07:44:33 +08:00
|
|
|
define void @extract_subvector512_v32i8_store_lo(i8* nocapture %addr, <64 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v32i8_store_lo:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-08-01 15:55:33 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-05-23 07:44:33 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <64 x i8> %a, <64 x i8> undef, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31>
|
|
|
|
%1 = bitcast i8* %addr to <32 x i8>*
|
|
|
|
store <32 x i8> %0, <32 x i8>* %1, align 1
|
|
|
|
ret void
|
|
|
|
}
|
2016-10-31 13:55:57 +08:00
|
|
|
|
2016-11-09 13:31:53 +08:00
|
|
|
define void @extract_subvector512_v32i8_store_lo_align_16(i8* nocapture %addr, <64 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v32i8_store_lo_align_16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:57 +08:00
|
|
|
; SKX-NEXT: vmovups %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <64 x i8> %a, <64 x i8> undef, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31>
|
|
|
|
%1 = bitcast i8* %addr to <32 x i8>*
|
|
|
|
store <32 x i8> %0, <32 x i8>* %1, align 16
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
define void @extract_subvector512_v32i8_store_lo_align_32(i8* nocapture %addr, <64 x i8> %a) nounwind uwtable ssp {
|
|
|
|
; SKX-LABEL: extract_subvector512_v32i8_store_lo_align_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: vmovaps %ymm0, (%rdi)
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-11-09 13:31:53 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = shufflevector <64 x i8> %a, <64 x i8> undef, <32 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31>
|
|
|
|
%1 = bitcast i8* %addr to <32 x i8>*
|
|
|
|
store <32 x i8> %0, <32 x i8>* %1, align 32
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-10-31 13:55:57 +08:00
|
|
|
define <4 x double> @test_mm512_mask_extractf64x4_pd(<4 x double> %__W, i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_mask_extractf64x4_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x4 $1, %zmm1, %ymm0 {%k1}
|
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x double> %__A, <8 x double> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = select <4 x i1> %extract, <4 x double> %shuffle, <4 x double> %__W
|
|
|
|
ret <4 x double> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <4 x double> @test_mm512_maskz_extractf64x4_pd(i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_maskz_extractf64x4_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x4 $1, %zmm0, %ymm0 {%k1} {z}
|
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x double> %__A, <8 x double> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = select <4 x i1> %extract, <4 x double> %shuffle, <4 x double> zeroinitializer
|
|
|
|
ret <4 x double> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <4 x float> @test_mm512_mask_extractf32x4_ps(<4 x float> %__W, i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_mask_extractf32x4_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $1, %zmm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = bitcast <8 x double> %__A to <16 x float>
|
|
|
|
%shuffle = shufflevector <16 x float> %0, <16 x float> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %1, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%2 = select <4 x i1> %extract, <4 x float> %shuffle, <4 x float> %__W
|
|
|
|
ret <4 x float> %2
|
|
|
|
}
|
|
|
|
|
|
|
|
define <4 x float> @test_mm512_maskz_extractf32x4_ps(i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_maskz_extractf32x4_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $1, %zmm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = bitcast <8 x double> %__A to <16 x float>
|
|
|
|
%shuffle = shufflevector <16 x float> %0, <16 x float> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %1, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%2 = select <4 x i1> %extract, <4 x float> %shuffle, <4 x float> zeroinitializer
|
|
|
|
ret <4 x float> %2
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x double> @test_mm256_mask_extractf64x2_pd(<2 x double> %__W, i8 %__U, <4 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_mask_extractf64x2_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x2 $1, %ymm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <4 x double> %__A, <4 x double> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x double> %shuffle, <2 x double> %__W
|
|
|
|
ret <2 x double> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x double> @test_mm256_maskz_extractf64x2_pd(i8 %__U, <4 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_maskz_extractf64x2_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x2 $1, %ymm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <4 x double> %__A, <4 x double> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x double> %shuffle, <2 x double> zeroinitializer
|
|
|
|
ret <2 x double> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x i64> @test_mm256_mask_extracti64x2_epi64(<2 x i64> %__W, i8 %__U, <4 x i64> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_mask_extracti64x2_epi64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextracti64x2 $1, %ymm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <4 x i64> %__A, <4 x i64> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x i64> %shuffle, <2 x i64> %__W
|
|
|
|
ret <2 x i64> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x i64> @test_mm256_maskz_extracti64x2_epi64(i8 %__U, <4 x i64> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_maskz_extracti64x2_epi64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextracti64x2 $1, %ymm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <4 x i64> %__A, <4 x i64> undef, <2 x i32> <i32 2, i32 3>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x i64> %shuffle, <2 x i64> zeroinitializer
|
|
|
|
ret <2 x i64> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <4 x float> @test_mm256_mask_extractf32x4_ps(<4 x float> %__W, i8 %__U, <8 x float> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_mask_extractf32x4_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $1, %ymm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x float> %__A, <8 x float> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = select <4 x i1> %extract, <4 x float> %shuffle, <4 x float> %__W
|
|
|
|
ret <4 x float> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <4 x float> @test_mm256_maskz_extractf32x4_ps(i8 %__U, <8 x float> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_maskz_extractf32x4_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x4 $1, %ymm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x float> %__A, <8 x float> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%1 = select <4 x i1> %extract, <4 x float> %shuffle, <4 x float> zeroinitializer
|
|
|
|
ret <4 x float> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x i64> @test_mm256_mask_extracti32x4_epi32(<2 x i64> %__W, i8 %__U, <4 x i64> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_mask_extracti32x4_epi32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextracti32x4 $1, %ymm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = bitcast <4 x i64> %__A to <8 x i32>
|
|
|
|
%shuffle = shufflevector <8 x i32> %0, <8 x i32> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast <2 x i64> %__W to <4 x i32>
|
|
|
|
%2 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %2, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%3 = select <4 x i1> %extract, <4 x i32> %shuffle, <4 x i32> %1
|
|
|
|
%4 = bitcast <4 x i32> %3 to <2 x i64>
|
|
|
|
ret <2 x i64> %4
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x i64> @test_mm256_maskz_extracti32x4_epi32(i8 %__U, <4 x i64> %__A) {
|
|
|
|
; SKX-LABEL: test_mm256_maskz_extracti32x4_epi32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextracti32x4 $1, %ymm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = bitcast <4 x i64> %__A to <8 x i32>
|
|
|
|
%shuffle = shufflevector <8 x i32> %0, <8 x i32> undef, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
|
|
|
|
%1 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %1, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
|
|
|
|
%2 = select <4 x i1> %extract, <4 x i32> %shuffle, <4 x i32> zeroinitializer
|
|
|
|
%3 = bitcast <4 x i32> %2 to <2 x i64>
|
|
|
|
ret <2 x i64> %3
|
|
|
|
}
|
|
|
|
|
|
|
|
define <8 x float> @test_mm512_mask_extractf32x8_ps(<8 x float> %__W, i8 %__U, <16 x float> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_mask_extractf32x8_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x8 $1, %zmm1, %ymm0 {%k1}
|
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <16 x float> %__A, <16 x float> undef, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%1 = select <8 x i1> %0, <8 x float> %shuffle, <8 x float> %__W
|
|
|
|
ret <8 x float> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <8 x float> @test_mm512_maskz_extractf32x8_ps(i8 %__U, <16 x float> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_maskz_extractf32x8_ps:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf32x8 $1, %zmm0, %ymm0 {%k1} {z}
|
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <16 x float> %__A, <16 x float> undef, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%1 = select <8 x i1> %0, <8 x float> %shuffle, <8 x float> zeroinitializer
|
|
|
|
ret <8 x float> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x double> @test_mm512_mask_extractf64x2_pd(<2 x double> %__W, i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_mask_extractf64x2_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x2 $3, %zmm1, %xmm0 {%k1}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x double> %__A, <8 x double> undef, <2 x i32> <i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x double> %shuffle, <2 x double> %__W
|
|
|
|
ret <2 x double> %1
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x double> @test_mm512_maskz_extractf64x2_pd(i8 %__U, <8 x double> %__A) {
|
|
|
|
; SKX-LABEL: test_mm512_maskz_extractf64x2_pd:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKX: ## %bb.0: ## %entry
|
2017-03-29 00:35:29 +08:00
|
|
|
; SKX-NEXT: kmovd %edi, %k1
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: vextractf64x2 $3, %zmm0, %xmm0 {%k1} {z}
|
2017-03-03 17:03:24 +08:00
|
|
|
; SKX-NEXT: vzeroupper
|
2016-10-31 13:55:57 +08:00
|
|
|
; SKX-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%shuffle = shufflevector <8 x double> %__A, <8 x double> undef, <2 x i32> <i32 6, i32 7>
|
|
|
|
%0 = bitcast i8 %__U to <8 x i1>
|
|
|
|
%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <2 x i32> <i32 0, i32 1>
|
|
|
|
%1 = select <2 x i1> %extract, <2 x double> %shuffle, <2 x double> zeroinitializer
|
|
|
|
ret <2 x double> %1
|
|
|
|
}
|