2015-11-24 05:33:58 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
2017-06-21 22:23:02 +08:00
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX1
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx2 | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX2
|
|
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512vl | FileCheck %s --check-prefix=ALL --check-prefix=AVX --check-prefix=AVX512VL
|
2014-06-27 19:23:44 +08:00
|
|
|
|
|
|
|
define <2 x i64> @shuffle_v2i64_00(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX1-LABEL: shuffle_v2i64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX1: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX1-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[0,1,0,1]
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX1-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX2-LABEL: shuffle_v2i64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX2: # %bb.0:
|
2019-02-02 05:41:30 +08:00
|
|
|
; AVX2-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0]
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX2-NEXT: retq
|
2015-10-25 23:39:22 +08:00
|
|
|
;
|
|
|
|
; AVX512VL-LABEL: shuffle_v2i64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX512VL: # %bb.0:
|
2019-02-02 05:41:30 +08:00
|
|
|
; AVX512VL-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0]
|
2015-10-25 23:39:22 +08:00
|
|
|
; AVX512VL-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 0>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_10(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[2,3,0,1]
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 0>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_11(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_11:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,2,3]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_11:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[2,3,2,3]
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 1>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_22(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm1[0,1,0,1]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX1-LABEL: shuffle_v2i64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX1: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX1-NEXT: vpermilps {{.*#+}} xmm0 = xmm1[0,1,0,1]
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX1-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX2-LABEL: shuffle_v2i64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX2: # %bb.0:
|
2019-02-02 05:41:30 +08:00
|
|
|
; AVX2-NEXT: vmovddup {{.*#+}} xmm0 = xmm1[0,0]
|
2014-10-01 08:41:21 +08:00
|
|
|
; AVX2-NEXT: retq
|
2015-10-25 23:39:22 +08:00
|
|
|
;
|
|
|
|
; AVX512VL-LABEL: shuffle_v2i64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX512VL: # %bb.0:
|
2019-02-02 05:41:30 +08:00
|
|
|
; AVX512VL-NEXT: vmovddup {{.*#+}} xmm0 = xmm1[0,0]
|
2015-10-25 23:39:22 +08:00
|
|
|
; AVX512VL-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_32(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm1[2,3,0,1]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX-NEXT: vpermilps {{.*#+}} xmm0 = xmm1[2,3,0,1]
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_33(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_33:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm1[2,3,2,3]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_33:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:47 +08:00
|
|
|
; AVX-NEXT: vpermilps {{.*#+}} xmm0 = xmm1[2,3,2,3]
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 3>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
|
|
|
|
define <2 x double> @shuffle_v2f64_00(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2f64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0,0]
|
2014-09-15 07:19:37 +08:00
|
|
|
; SSE2-NEXT: retq
|
2015-01-27 05:15:42 +08:00
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_v2f64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSE3-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
|
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_v2f64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
|
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_v2f64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
|
|
|
|
; SSE41-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2f64_00:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 0>
|
|
|
|
ret <2 x double> %shuffle
|
2014-06-27 19:23:44 +08:00
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_10(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2f64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3,0,1]
|
2014-09-21 06:09:27 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = xmm0[1,0]
|
|
|
|
; AVX-NEXT: retq
|
2015-10-25 23:32:04 +08:00
|
|
|
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 0>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_11(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2f64_11:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2018-08-03 00:48:01 +08:00
|
|
|
; SSE-NEXT: movhlps {{.*#+}} xmm0 = xmm0[1,1]
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-21 21:04:42 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_11:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2016-06-28 16:08:15 +08:00
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = xmm0[1,1]
|
2015-11-21 21:04:42 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 1>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_22(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2f64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2014-09-15 07:19:37 +08:00
|
|
|
; SSE2-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
|
2014-09-15 07:19:37 +08:00
|
|
|
; SSE2-NEXT: retq
|
2015-01-27 05:15:42 +08:00
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_v2f64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSE3-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_v2f64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_v2f64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSE41-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2f64_22:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-01-27 05:15:42 +08:00
|
|
|
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 2, i32 2>
|
|
|
|
ret <2 x double> %shuffle
|
2014-06-27 19:23:44 +08:00
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_32(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2f64_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm1[0,1]
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = xmm1[1,0]
|
|
|
|
; AVX-NEXT: retq
|
2015-10-25 23:32:04 +08:00
|
|
|
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 3, i32 2>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_33(<2 x double> %a, <2 x double> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2f64_33:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-21 21:04:42 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_33:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2016-06-28 16:08:15 +08:00
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = xmm1[1,1]
|
2015-11-21 21:04:42 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 3, i32 3>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
2014-09-15 07:15:52 +08:00
|
|
|
define <2 x double> @shuffle_v2f64_03(<2 x double> %a, <2 x double> %b) {
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2f64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_v2f64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_v2f64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_v2f64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2018-01-16 06:18:45 +08:00
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
2018-07-14 10:05:08 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_03:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
|
|
|
; AVX-NEXT: retq
|
2014-09-15 07:15:52 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 3>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x double> @shuffle_v2f64_21(<2 x double> %a, <2 x double> %b) {
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2f64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSE2-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_v2f64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_v2f64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_v2f64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2018-01-16 06:18:45 +08:00
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
|
2014-10-04 06:43:17 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
2018-07-14 10:05:08 +08:00
|
|
|
; AVX-LABEL: shuffle_v2f64_21:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
|
|
|
|
; AVX-NEXT: retq
|
2014-09-15 07:15:52 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 2, i32 1>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
2018-01-10 20:23:39 +08:00
|
|
|
define <2 x double> @shuffle_v2f64_u2(<2 x double> %a, <2 x double> %b) {
|
|
|
|
; SSE2-LABEL: shuffle_v2f64_u2:
|
|
|
|
; SSE2: # %bb.0:
|
2018-01-15 02:50:34 +08:00
|
|
|
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
|
2018-01-10 20:23:39 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_v2f64_u2:
|
|
|
|
; SSE3: # %bb.0:
|
|
|
|
; SSE3-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_v2f64_u2:
|
|
|
|
; SSSE3: # %bb.0:
|
|
|
|
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_v2f64_u2:
|
|
|
|
; SSE41: # %bb.0:
|
|
|
|
; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; SSE41-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2f64_u2:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = xmm1[0,0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 undef, i32 2>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
2018-01-15 02:38:21 +08:00
|
|
|
define <2 x double> @shuffle_v2f64_3u(<2 x double> %a, <2 x double> %b) {
|
|
|
|
; SSE-LABEL: shuffle_v2f64_3u:
|
|
|
|
; SSE: # %bb.0:
|
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
|
2018-01-15 02:38:21 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2f64_3u:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = xmm1[1,0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 3, i32 undef>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
2014-06-27 19:23:44 +08:00
|
|
|
|
|
|
|
define <2 x i64> @shuffle_v2i64_02(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_02:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; SSE-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_02:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_02_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_02_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm2[0]
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_02_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm2[0]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_03(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2i64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE3-LABEL: shuffle_v2i64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-LABEL: shuffle_v2i64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-09-18 16:33:04 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-LABEL: shuffle_v2i64_03:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2018-01-16 06:18:45 +08:00
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
2018-01-16 06:18:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_03:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
|
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_03_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2i64_03_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE2-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE3-LABEL: shuffle_v2i64_03_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE3-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-LABEL: shuffle_v2i64_03_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSSE3-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3]
|
2014-09-18 16:33:04 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-LABEL: shuffle_v2i64_03_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2018-01-16 06:18:45 +08:00
|
|
|
; SSE41-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
2018-01-16 06:18:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_03_copy:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0,1],xmm2[2,3]
|
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_12(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2i64_12:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm1[0,1]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE3-LABEL: shuffle_v2i64_12:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm1[0,1]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-LABEL: shuffle_v2i64_12:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-NEXT: palignr {{.*#+}} xmm1 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSSE3-NEXT: movdqa %xmm1, %xmm0
|
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-LABEL: shuffle_v2i64_12:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-NEXT: palignr {{.*#+}} xmm1 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE41-NEXT: movdqa %xmm1, %xmm0
|
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_12:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: vpalignr {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
|
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_12_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2i64_12_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE2-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm2[0,1]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE3-LABEL: shuffle_v2i64_12_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE3-NEXT: movaps %xmm1, %xmm0
|
|
|
|
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm2[0,1]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-LABEL: shuffle_v2i64_12_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSSE3-NEXT: movdqa %xmm2, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSSE3-NEXT: palignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-LABEL: shuffle_v2i64_12_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE41-NEXT: movdqa %xmm2, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE41-NEXT: palignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
|
2014-09-18 17:00:25 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_v2i64_12_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2014-10-01 05:44:34 +08:00
|
|
|
; AVX-NEXT: vpalignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm2[0,1,2,3,4,5,6,7]
|
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 2>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_13(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_13:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_13:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 3>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_13_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_13_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm2[1]
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_13_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm1[1],xmm2[1]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 3>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_20(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_20:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; SSE-NEXT: movlhps {{.*#+}} xmm1 = xmm1[0],xmm0[0]
|
2017-09-18 11:29:54 +08:00
|
|
|
; SSE-NEXT: movaps %xmm1, %xmm0
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_20:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm0[0]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_20_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_v2i64_20_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2017-09-18 11:29:54 +08:00
|
|
|
; SSE-NEXT: movaps %xmm2, %xmm0
|
2018-09-20 02:59:08 +08:00
|
|
|
; SSE-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
|
2014-09-21 05:26:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_20_copy:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2017-09-18 12:40:58 +08:00
|
|
|
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm2[0],xmm1[0]
|
2015-11-18 06:35:45 +08:00
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
define <2 x i64> @shuffle_v2i64_21(<2 x i64> %a, <2 x i64> %b) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE2-LABEL: shuffle_v2i64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSE2-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE3-LABEL: shuffle_v2i64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSSE3-LABEL: shuffle_v2i64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2015-01-31 22:09:36 +08:00
|
|
|
; SSSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
|
2014-09-18 16:33:04 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE41-LABEL: shuffle_v2i64_21:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2018-01-16 06:18:45 +08:00
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
|
2014-09-15 07:43:33 +08:00
|
|
|
; SSE41-NEXT: retq
|
2014-10-01 05:44:34 +08:00
|
|
|
;
|
2018-01-16 06:18:45 +08:00
|
|
|
; AVX-LABEL: shuffle_v2i64_21:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
|
|
|
|
; AVX-NEXT: retq
|
2014-06-27 19:23:44 +08:00
|
|
|
%shuffle = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 1>
|
|
|
|
ret <2 x i64> %shuffle
|
|
|
|
}
|
|
|
|
; Two-input v2i64 shuffle, mask <2, 1>: lane 0 is %b[0], lane 1 is %a[1].
; %nonce is never read in the body; with it occupying the first argument the
; assertions below see the live inputs in xmm1 and xmm2 rather than xmm0.
define <2 x i64> @shuffle_v2i64_21_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
; SSE2-LABEL: shuffle_v2i64_21_copy:
; SSE2: # %bb.0:
; SSE2-NEXT: movapd %xmm1, %xmm0
; SSE2-NEXT: movsd {{.*#+}} xmm0 = xmm2[0],xmm0[1]
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2i64_21_copy:
; SSE3: # %bb.0:
; SSE3-NEXT: movapd %xmm1, %xmm0
; SSE3-NEXT: movsd {{.*#+}} xmm0 = xmm2[0],xmm0[1]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2i64_21_copy:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movapd %xmm1, %xmm0
; SSSE3-NEXT: movsd {{.*#+}} xmm0 = xmm2[0],xmm0[1]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2i64_21_copy:
; SSE41: # %bb.0:
; SSE41-NEXT: movaps %xmm1, %xmm0
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm2[0,1],xmm0[2,3]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_21_copy:
; AVX: # %bb.0:
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm2[0,1],xmm1[2,3]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 2, i32 1>
  ret <2 x i64> %res
}
|
|
|
|
; Two-input v2i64 shuffle, mask <3, 0>: lane 0 is %b[1], lane 1 is %a[0].
define <2 x i64> @shuffle_v2i64_30(<2 x i64> %a, <2 x i64> %b) {
; SSE2-LABEL: shuffle_v2i64_30:
; SSE2: # %bb.0:
; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,3],xmm0[0,1]
; SSE2-NEXT: movaps %xmm1, %xmm0
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2i64_30:
; SSE3: # %bb.0:
; SSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,3],xmm0[0,1]
; SSE3-NEXT: movaps %xmm1, %xmm0
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2i64_30:
; SSSE3: # %bb.0:
; SSSE3-NEXT: palignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2i64_30:
; SSE41: # %bb.0:
; SSE41-NEXT: palignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_30:
; AVX: # %bb.0:
; AVX-NEXT: vpalignr {{.*#+}} xmm0 = xmm1[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 0>
  ret <2 x i64> %res
}
|
|
|
|
; Same <3, 0> shuffle as the non-copy variant (lane 0 = %b[1], lane 1 = %a[0]),
; but with an unread leading %nonce argument so the assertions below see the
; live inputs in xmm1 and xmm2.
define <2 x i64> @shuffle_v2i64_30_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
; SSE2-LABEL: shuffle_v2i64_30_copy:
; SSE2: # %bb.0:
; SSE2-NEXT: movaps %xmm2, %xmm0
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm1[0,1]
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2i64_30_copy:
; SSE3: # %bb.0:
; SSE3-NEXT: movaps %xmm2, %xmm0
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3],xmm1[0,1]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2i64_30_copy:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movdqa %xmm1, %xmm0
; SSSE3-NEXT: palignr {{.*#+}} xmm0 = xmm2[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2i64_30_copy:
; SSE41: # %bb.0:
; SSE41-NEXT: movdqa %xmm1, %xmm0
; SSE41-NEXT: palignr {{.*#+}} xmm0 = xmm2[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_30_copy:
; AVX: # %bb.0:
; AVX-NEXT: vpalignr {{.*#+}} xmm0 = xmm2[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 0>
  ret <2 x i64> %res
}
|
|
|
|
; Two-input v2i64 shuffle, mask <3, 1>: lane 0 is %b[1], lane 1 is %a[1]
; (the high elements of both inputs, second operand first).
define <2 x i64> @shuffle_v2i64_31(<2 x i64> %a, <2 x i64> %b) {
; SSE-LABEL: shuffle_v2i64_31:
; SSE: # %bb.0:
; SSE-NEXT: unpckhpd {{.*#+}} xmm1 = xmm1[1],xmm0[1]
; SSE-NEXT: movaps %xmm1, %xmm0
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_31:
; AVX: # %bb.0:
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm1[1],xmm0[1]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 1>
  ret <2 x i64> %res
}
|
|
|
|
; Same <3, 1> shuffle as the non-copy variant (lane 0 = %b[1], lane 1 = %a[1]),
; but with an unread leading %nonce argument so the assertions below see the
; live inputs in xmm1 and xmm2.
define <2 x i64> @shuffle_v2i64_31_copy(<2 x i64> %nonce, <2 x i64> %a, <2 x i64> %b) {
; SSE-LABEL: shuffle_v2i64_31_copy:
; SSE: # %bb.0:
; SSE-NEXT: movaps %xmm2, %xmm0
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_31_copy:
; AVX: # %bb.0:
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm2[1],xmm1[1]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 1>
  ret <2 x i64> %res
}
|
2014-09-15 06:41:37 +08:00
|
|
|
|
2014-10-03 19:16:45 +08:00
|
|
|
; Shuffle of %a against an all-zero vector, mask <0, 3>: lane 0 keeps %a[0],
; lane 1 is zero.
define <2 x i64> @shuffle_v2i64_0z(<2 x i64> %a) {
; SSE-LABEL: shuffle_v2i64_0z:
; SSE: # %bb.0:
; SSE-NEXT: movq {{.*#+}} xmm0 = xmm0[0],zero
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_0z:
; AVX: # %bb.0:
; AVX-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Shuffle of %a against an all-zero vector, mask <1, 3>: lane 0 is %a[1],
; lane 1 is zero.
define <2 x i64> @shuffle_v2i64_1z(<2 x i64> %a) {
; SSE-LABEL: shuffle_v2i64_1z:
; SSE: # %bb.0:
; SSE-NEXT: psrldq {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero,zero
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_1z:
; AVX: # %bb.0:
; AVX-NEXT: vpsrldq {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero,zero
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> zeroinitializer, <2 x i32> <i32 1, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Shuffle of %a against an all-zero vector, mask <2, 0>: lane 0 is zero,
; lane 1 is %a[0].
define <2 x i64> @shuffle_v2i64_z0(<2 x i64> %a) {
; SSE-LABEL: shuffle_v2i64_z0:
; SSE: # %bb.0:
; SSE-NEXT: pslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7]
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_z0:
; AVX: # %bb.0:
; AVX-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> zeroinitializer, <2 x i32> <i32 2, i32 0>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Shuffle of %a against an all-zero vector, mask <2, 1>: lane 0 is zero,
; lane 1 keeps %a[1].
define <2 x i64> @shuffle_v2i64_z1(<2 x i64> %a) {
; SSE2-LABEL: shuffle_v2i64_z1:
; SSE2: # %bb.0:
; SSE2-NEXT: xorps %xmm1, %xmm1
; SSE2-NEXT: unpckhpd {{.*#+}} xmm1 = xmm1[1],xmm0[1]
; SSE2-NEXT: movaps %xmm1, %xmm0
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2i64_z1:
; SSE3: # %bb.0:
; SSE3-NEXT: xorps %xmm1, %xmm1
; SSE3-NEXT: unpckhpd {{.*#+}} xmm1 = xmm1[1],xmm0[1]
; SSE3-NEXT: movaps %xmm1, %xmm0
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2i64_z1:
; SSSE3: # %bb.0:
; SSSE3-NEXT: xorps %xmm1, %xmm1
; SSSE3-NEXT: unpckhpd {{.*#+}} xmm1 = xmm1[1],xmm0[1]
; SSSE3-NEXT: movaps %xmm1, %xmm0
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2i64_z1:
; SSE41: # %bb.0:
; SSE41-NEXT: xorps %xmm1, %xmm1
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_z1:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
; AVX-NEXT: retq
  %res = shufflevector <2 x i64> %a, <2 x i64> zeroinitializer, <2 x i32> <i32 2, i32 1>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Floating-point counterpart of the 0z case: mask <0, 3> against an all-zero
; vector keeps %a[0] in lane 0 and puts zero in lane 1.
define <2 x double> @shuffle_v2f64_0z(<2 x double> %a) {
; SSE-LABEL: shuffle_v2f64_0z:
; SSE: # %bb.0:
; SSE-NEXT: movq {{.*#+}} xmm0 = xmm0[0],zero
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2f64_0z:
; AVX: # %bb.0:
; AVX-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
; AVX-NEXT: retq
  %res = shufflevector <2 x double> %a, <2 x double> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; v2f64 shuffle against an all-zero vector, mask <1, 3>: lane 0 is %a[1],
; lane 1 is zero.
define <2 x double> @shuffle_v2f64_1z(<2 x double> %a) {
; SSE-LABEL: shuffle_v2f64_1z:
; SSE: # %bb.0:
; SSE-NEXT: xorps %xmm1, %xmm1
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2f64_1z:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
; AVX-NEXT: retq
  %res = shufflevector <2 x double> %a, <2 x double> zeroinitializer, <2 x i32> <i32 1, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; v2f64 shuffle against an all-zero vector, mask <2, 0>: lane 0 is zero,
; lane 1 is %a[0].
define <2 x double> @shuffle_v2f64_z0(<2 x double> %a) {
; SSE-LABEL: shuffle_v2f64_z0:
; SSE: # %bb.0:
; SSE-NEXT: xorps %xmm1, %xmm1
; SSE-NEXT: movlhps {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE-NEXT: movaps %xmm1, %xmm0
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2f64_z0:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm0[0]
; AVX-NEXT: retq
  %res = shufflevector <2 x double> %a, <2 x double> zeroinitializer, <2 x i32> <i32 2, i32 0>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; v2f64 shuffle against an all-zero vector, mask <2, 1>: lane 0 is zero,
; lane 1 keeps %a[1].
define <2 x double> @shuffle_v2f64_z1(<2 x double> %a) {
; SSE2-LABEL: shuffle_v2f64_z1:
; SSE2: # %bb.0:
; SSE2-NEXT: xorpd %xmm1, %xmm1
; SSE2-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2f64_z1:
; SSE3: # %bb.0:
; SSE3-NEXT: xorpd %xmm1, %xmm1
; SSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2f64_z1:
; SSSE3: # %bb.0:
; SSSE3-NEXT: xorpd %xmm1, %xmm1
; SSSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2f64_z1:
; SSE41: # %bb.0:
; SSE41-NEXT: xorps %xmm1, %xmm1
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2f64_z1:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
; AVX-NEXT: retq
  %res = shufflevector <2 x double> %a, <2 x double> zeroinitializer, <2 x i32> <i32 2, i32 1>
  ret <2 x double> %res
}
|
2014-09-15 06:41:37 +08:00
|
|
|
|
2015-03-06 01:14:04 +08:00
|
|
|
; Two chained shuffles separated by bitcasts. First %a is combined with zero
; using mask <2, 1> (zero, %a[1]); the result is viewed as <4 x float> and its
; two 64-bit halves are swapped with mask <2, 3, 0, 1>; finally it is viewed as
; <2 x double> again. The net effect is (%a[1], zero), which the assertions
; below match with a single unpack of the high element against zero.
define <2 x double> @shuffle_v2f64_bitcast_1z(<2 x double> %a) {
; SSE-LABEL: shuffle_v2f64_bitcast_1z:
; SSE: # %bb.0:
; SSE-NEXT: xorps %xmm1, %xmm1
; SSE-NEXT: unpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
; SSE-NEXT: retq
;
; AVX-LABEL: shuffle_v2f64_bitcast_1z:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vunpckhpd {{.*#+}} xmm0 = xmm0[1],xmm1[1]
; AVX-NEXT: retq
  %zero.hi = shufflevector <2 x double> %a, <2 x double> zeroinitializer, <2 x i32> <i32 2, i32 1>
  %as.f32 = bitcast <2 x double> %zero.hi to <4 x float>
  %swapped = shufflevector <4 x float> %as.f32, <4 x float> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  %as.f64 = bitcast <4 x float> %swapped to <2 x double>
  ret <2 x double> %as.f64
}
|
|
|
|
|
2015-10-25 23:32:04 +08:00
|
|
|
; Views %x as <4 x float>, replaces float lane 0 with the constant 1.0 via mask
; <4, 1, 2, 3>, views the result as <2 x i64> again and ANDs it with
; <-4294967296, -1>, i.e. clears the low 32 bits of 64-bit lane 0. The
; assertions below expect this to fold to zeroing the first 32-bit lane of %x
; (a constant-pool AND before SSE4.1, a blend with zero from SSE4.1 onwards).
define <2 x i64> @shuffle_v2i64_bitcast_z123(<2 x i64> %x) {
; SSE2-LABEL: shuffle_v2i64_bitcast_z123:
; SSE2: # %bb.0:
; SSE2-NEXT: andps {{.*}}(%rip), %xmm0
; SSE2-NEXT: retq
;
; SSE3-LABEL: shuffle_v2i64_bitcast_z123:
; SSE3: # %bb.0:
; SSE3-NEXT: andps {{.*}}(%rip), %xmm0
; SSE3-NEXT: retq
;
; SSSE3-LABEL: shuffle_v2i64_bitcast_z123:
; SSSE3: # %bb.0:
; SSSE3-NEXT: andps {{.*}}(%rip), %xmm0
; SSSE3-NEXT: retq
;
; SSE41-LABEL: shuffle_v2i64_bitcast_z123:
; SSE41: # %bb.0:
; SSE41-NEXT: xorps %xmm1, %xmm1
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0],xmm0[1,2,3]
; SSE41-NEXT: retq
;
; AVX-LABEL: shuffle_v2i64_bitcast_z123:
; AVX: # %bb.0:
; AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm1[0],xmm0[1,2,3]
; AVX-NEXT: retq
  %as.f32 = bitcast <2 x i64> %x to <4 x float>
  %with.one = shufflevector <4 x float> %as.f32, <4 x float> <float 1.000000e+00, float undef, float undef, float undef>, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  %as.i64 = bitcast <4 x float> %with.one to <2 x i64>
  %masked = and <2 x i64> %as.i64, <i64 -4294967296, i64 -1>
  ret <2 x i64> %masked
}
|
|
|
|
|
2014-09-20 11:32:25 +08:00
|
|
|
; Places the scalar %a in lane 0 of a vector and shuffles it against zero with
; mask <0, 3>, giving (%a, 0).
define <2 x i64> @insert_reg_and_zero_v2i64(i64 %a) {
; SSE-LABEL: insert_reg_and_zero_v2i64:
; SSE: # %bb.0:
; SSE-NEXT: movq %rdi, %xmm0
; SSE-NEXT: retq
;
; AVX-LABEL: insert_reg_and_zero_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vmovq %rdi, %xmm0
; AVX-NEXT: retq
  %vec = insertelement <2 x i64> undef, i64 %a, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Loads an i64 from %ptr, places it in lane 0 of a vector and shuffles it
; against zero with mask <0, 3>, giving (loaded value, 0).
define <2 x i64> @insert_mem_and_zero_v2i64(i64* %ptr) {
; SSE-LABEL: insert_mem_and_zero_v2i64:
; SSE: # %bb.0:
; SSE-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero
; SSE-NEXT: retq
;
; AVX-LABEL: insert_mem_and_zero_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero
; AVX-NEXT: retq
  %elt = load i64, i64* %ptr
  %vec = insertelement <2 x i64> undef, i64 %elt, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Places the scalar double %a in lane 0 of a vector and shuffles it against
; zero with mask <0, 3>, giving (%a, 0.0).
define <2 x double> @insert_reg_and_zero_v2f64(double %a) {
; SSE-LABEL: insert_reg_and_zero_v2f64:
; SSE: # %bb.0:
; SSE-NEXT: movq {{.*#+}} xmm0 = xmm0[0],zero
; SSE-NEXT: retq
;
; AVX-LABEL: insert_reg_and_zero_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
; AVX-NEXT: retq
  %vec = insertelement <2 x double> undef, double %a, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; Loads a double from %ptr, places it in lane 0 of a vector and shuffles it
; against zero with mask <0, 3>, giving (loaded value, 0.0).
define <2 x double> @insert_mem_and_zero_v2f64(double* %ptr) {
; SSE-LABEL: insert_mem_and_zero_v2f64:
; SSE: # %bb.0:
; SSE-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero
; SSE-NEXT: retq
;
; AVX-LABEL: insert_mem_and_zero_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero
; AVX-NEXT: retq
  %elt = load double, double* %ptr
  %vec = insertelement <2 x double> undef, double %elt, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> zeroinitializer, <2 x i32> <i32 0, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
2014-10-01 19:14:02 +08:00
|
|
|
; Replaces the low lane of %b with the scalar %a: %a is inserted into lane 0 of
; a fresh vector, then mask <0, 3> picks that lane and %b[1].
define <2 x i64> @insert_reg_lo_v2i64(i64 %a, <2 x i64> %b) {
; SSE2-LABEL: insert_reg_lo_v2i64:
; SSE2: # %bb.0:
; SSE2-NEXT: movq %rdi, %xmm1
; SSE2-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_reg_lo_v2i64:
; SSE3: # %bb.0:
; SSE3-NEXT: movq %rdi, %xmm1
; SSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_reg_lo_v2i64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movq %rdi, %xmm1
; SSSE3-NEXT: movsd {{.*#+}} xmm0 = xmm1[0],xmm0[1]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_reg_lo_v2i64:
; SSE41: # %bb.0:
; SSE41-NEXT: pinsrq $0, %rdi, %xmm0
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_reg_lo_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vpinsrq $0, %rdi, %xmm0, %xmm0
; AVX-NEXT: retq
  %vec = insertelement <2 x i64> undef, i64 %a, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Replaces the low lane of %b with an i64 loaded from %ptr: the loaded value is
; inserted into lane 0 of a fresh vector, then mask <0, 3> picks that lane and
; %b[1].
define <2 x i64> @insert_mem_lo_v2i64(i64* %ptr, <2 x i64> %b) {
; SSE2-LABEL: insert_mem_lo_v2i64:
; SSE2: # %bb.0:
; SSE2-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_mem_lo_v2i64:
; SSE3: # %bb.0:
; SSE3-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_mem_lo_v2i64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_mem_lo_v2i64:
; SSE41: # %bb.0:
; SSE41-NEXT: pinsrq $0, (%rdi), %xmm0
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_mem_lo_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vpinsrq $0, (%rdi), %xmm0, %xmm0
; AVX-NEXT: retq
  %elt = load i64, i64* %ptr
  %vec = insertelement <2 x i64> undef, i64 %elt, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> %b, <2 x i32> <i32 0, i32 3>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Replaces the high lane of %b with the scalar %a: %a is inserted into lane 0
; of a fresh vector, then mask <2, 0> yields (%b[0], %a).
define <2 x i64> @insert_reg_hi_v2i64(i64 %a, <2 x i64> %b) {
; SSE2-LABEL: insert_reg_hi_v2i64:
; SSE2: # %bb.0:
; SSE2-NEXT: movq %rdi, %xmm1
; SSE2-NEXT: punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_reg_hi_v2i64:
; SSE3: # %bb.0:
; SSE3-NEXT: movq %rdi, %xmm1
; SSE3-NEXT: punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_reg_hi_v2i64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movq %rdi, %xmm1
; SSSE3-NEXT: punpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_reg_hi_v2i64:
; SSE41: # %bb.0:
; SSE41-NEXT: pinsrq $1, %rdi, %xmm0
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_reg_hi_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vpinsrq $1, %rdi, %xmm0, %xmm0
; AVX-NEXT: retq
  %vec = insertelement <2 x i64> undef, i64 %a, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Replaces the high lane of %b with an i64 loaded from %ptr: the loaded value
; is inserted into lane 0 of a fresh vector, then mask <2, 0> yields
; (%b[0], loaded value).
define <2 x i64> @insert_mem_hi_v2i64(i64* %ptr, <2 x i64> %b) {
; SSE2-LABEL: insert_mem_hi_v2i64:
; SSE2: # %bb.0:
; SSE2-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_mem_hi_v2i64:
; SSE3: # %bb.0:
; SSE3-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
; SSE3-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_mem_hi_v2i64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
; SSSE3-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_mem_hi_v2i64:
; SSE41: # %bb.0:
; SSE41-NEXT: pinsrq $1, (%rdi), %xmm0
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_mem_hi_v2i64:
; AVX: # %bb.0:
; AVX-NEXT: vpinsrq $1, (%rdi), %xmm0, %xmm0
; AVX-NEXT: retq
  %elt = load i64, i64* %ptr
  %vec = insertelement <2 x i64> undef, i64 %elt, i32 0
  %res = shufflevector <2 x i64> %vec, <2 x i64> %b, <2 x i32> <i32 2, i32 0>
  ret <2 x i64> %res
}
|
|
|
|
|
|
|
|
; Replaces the low lane of %b with the scalar double %a: %a is inserted into
; lane 0 of a fresh vector, then mask <0, 3> picks that lane and %b[1].
define <2 x double> @insert_reg_lo_v2f64(double %a, <2 x double> %b) {
; SSE2-LABEL: insert_reg_lo_v2f64:
; SSE2: # %bb.0:
; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_reg_lo_v2f64:
; SSE3: # %bb.0:
; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_reg_lo_v2f64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_reg_lo_v2f64:
; SSE41: # %bb.0:
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_reg_lo_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vblendps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,3]
; AVX-NEXT: retq
  %vec = insertelement <2 x double> undef, double %a, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> %b, <2 x i32> <i32 0, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; Replaces the low lane of %b with a double loaded from %ptr: the loaded value
; is inserted into lane 0 of a fresh vector, then mask <0, 3> picks that lane
; and %b[1].
define <2 x double> @insert_mem_lo_v2f64(double* %ptr, <2 x double> %b) {
; SSE-LABEL: insert_mem_lo_v2f64:
; SSE: # %bb.0:
; SSE-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
; SSE-NEXT: retq
;
; AVX-LABEL: insert_mem_lo_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
; AVX-NEXT: retq
  %elt = load double, double* %ptr
  %vec = insertelement <2 x double> undef, double %elt, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> %b, <2 x i32> <i32 0, i32 3>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; Replaces the high lane of %b with the scalar double %a: %a is inserted into
; lane 0 of a fresh vector, then mask <2, 0> yields (%b[0], %a).
define <2 x double> @insert_reg_hi_v2f64(double %a, <2 x double> %b) {
; SSE-LABEL: insert_reg_hi_v2f64:
; SSE: # %bb.0:
; SSE-NEXT: movlhps {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; SSE-NEXT: movaps %xmm1, %xmm0
; SSE-NEXT: retq
;
; AVX-LABEL: insert_reg_hi_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovlhps {{.*#+}} xmm0 = xmm1[0],xmm0[0]
; AVX-NEXT: retq
  %vec = insertelement <2 x double> undef, double %a, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> %b, <2 x i32> <i32 2, i32 0>
  ret <2 x double> %res
}
|
|
|
|
|
|
|
|
; Replaces the high lane of %b with a double loaded from %ptr: the loaded value
; is inserted into lane 0 of a fresh vector, then mask <2, 0> yields
; (%b[0], loaded value).
define <2 x double> @insert_mem_hi_v2f64(double* %ptr, <2 x double> %b) {
; SSE-LABEL: insert_mem_hi_v2f64:
; SSE: # %bb.0:
; SSE-NEXT: movhps {{.*#+}} xmm0 = xmm0[0,1],mem[0,1]
; SSE-NEXT: retq
;
; AVX-LABEL: insert_mem_hi_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovhps {{.*#+}} xmm0 = xmm0[0,1],mem[0,1]
; AVX-NEXT: retq
  %elt = load double, double* %ptr
  %vec = insertelement <2 x double> undef, double %elt, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> %b, <2 x i32> <i32 2, i32 0>
  ret <2 x double> %res
}
|
|
|
|
|
2014-09-15 06:41:37 +08:00
|
|
|
; Broadcasts the scalar double %a to both lanes: %a is inserted into lane 0 of
; a fresh vector, then mask <0, 0> duplicates that lane.
define <2 x double> @insert_dup_reg_v2f64(double %a) {
; SSE2-LABEL: insert_dup_reg_v2f64:
; SSE2: # %bb.0:
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0,0]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_dup_reg_v2f64:
; SSE3: # %bb.0:
; SSE3-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_dup_reg_v2f64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_dup_reg_v2f64:
; SSE41: # %bb.0:
; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_dup_reg_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0]
; AVX-NEXT: retq
  %vec = insertelement <2 x double> undef, double %a, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> undef, <2 x i32> <i32 0, i32 0>
  ret <2 x double> %res
}
|
2015-10-25 04:15:43 +08:00
|
|
|
|
2014-09-15 06:41:37 +08:00
|
|
|
; Broadcasts a double loaded from %ptr to both lanes: the loaded value is
; inserted into lane 0 of a fresh vector, then mask <0, 0> duplicates it.
define <2 x double> @insert_dup_mem_v2f64(double* %ptr) {
; SSE2-LABEL: insert_dup_mem_v2f64:
; SSE2: # %bb.0:
; SSE2-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0,0]
; SSE2-NEXT: retq
;
; SSE3-LABEL: insert_dup_mem_v2f64:
; SSE3: # %bb.0:
; SSE3-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
; SSE3-NEXT: retq
;
; SSSE3-LABEL: insert_dup_mem_v2f64:
; SSSE3: # %bb.0:
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
; SSSE3-NEXT: retq
;
; SSE41-LABEL: insert_dup_mem_v2f64:
; SSE41: # %bb.0:
; SSE41-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
; SSE41-NEXT: retq
;
; AVX-LABEL: insert_dup_mem_v2f64:
; AVX: # %bb.0:
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = mem[0,0]
; AVX-NEXT: retq
  %elt = load double, double* %ptr
  %vec = insertelement <2 x double> undef, double %elt, i32 0
  %res = shufflevector <2 x double> %vec, <2 x double> undef, <2 x i32> <i32 0, i32 0>
  ret <2 x double> %res
}
|
2014-09-21 06:09:27 +08:00
|
|
|
|
2015-11-19 16:26:56 +08:00
|
|
|
; Test: splat lane 0 of a full <2 x double> vector loaded from memory (shuffle
; mask <0, 0>). Unlike the scalar-load variant, the IR loads the whole 128-bit
; vector before shuffling.
; Expected lowering per the checks below: the SSE2 prefix uses a movaps load
; followed by movlhps; SSE3/SSSE3/SSE41 expect a single movddup with a memory
; operand and the AVX prefix a single vmovddup with a memory operand.
define <2 x double> @insert_dup_mem128_v2f64(<2 x double>* %ptr) nounwind {
|
|
|
|
; SSE2-LABEL: insert_dup_mem128_v2f64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE2: # %bb.0:
|
2015-11-19 16:26:56 +08:00
|
|
|
; SSE2-NEXT: movaps (%rdi), %xmm0
|
|
|
|
; SSE2-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0,0]
|
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE3-LABEL: insert_dup_mem128_v2f64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE3: # %bb.0:
|
2015-11-19 16:26:56 +08:00
|
|
|
; SSE3-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
|
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: insert_dup_mem128_v2f64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSSE3: # %bb.0:
|
2015-11-19 16:26:56 +08:00
|
|
|
; SSSE3-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
|
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: insert_dup_mem128_v2f64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE41: # %bb.0:
|
2015-11-19 16:26:56 +08:00
|
|
|
; SSE41-NEXT: movddup {{.*#+}} xmm0 = mem[0,0]
|
|
|
|
; SSE41-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: insert_dup_mem128_v2f64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-11-19 16:26:56 +08:00
|
|
|
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = mem[0,0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%v = load <2 x double>, <2 x double>* %ptr
|
|
|
|
%shuffle = shufflevector <2 x double> %v, <2 x double> undef, <2 x i32> <i32 0, i32 0>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2015-08-21 04:59:41 +08:00
|
|
|
; Test: broadcast an i64 loaded from memory (the load is marked align 1) to
; both lanes of a <2 x i64>. The value is inserted into lane 0 of an undef
; vector and the zeroinitializer shuffle mask selects lane 0 for every result
; lane.
; Expected lowering per the checks below: the SSE prefix uses a movq load
; followed by pshufd [0,1,0,1]; the AVX prefix expects a single vmovddup with a
; memory operand.
define <2 x i64> @insert_dup_mem_v2i64(i64* %ptr) {
|
|
|
|
; SSE-LABEL: insert_dup_mem_v2i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2015-08-21 04:59:41 +08:00
|
|
|
; SSE-NEXT: movq {{.*#+}} xmm0 = mem[0],zero
|
|
|
|
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2019-02-02 05:41:30 +08:00
|
|
|
; AVX-LABEL: insert_dup_mem_v2i64:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vmovddup {{.*#+}} xmm0 = mem[0,0]
|
|
|
|
; AVX-NEXT: retq
|
2015-08-21 04:59:41 +08:00
|
|
|
%tmp = load i64, i64* %ptr, align 1
|
|
|
|
%tmp1 = insertelement <2 x i64> undef, i64 %tmp, i32 0
|
|
|
|
%tmp2 = shufflevector <2 x i64> %tmp1, <2 x i64> undef, <2 x i32> zeroinitializer
|
|
|
|
ret <2 x i64> %tmp2
|
|
|
|
}
|
|
|
|
|
2014-09-21 06:09:27 +08:00
|
|
|
; Test: swap the two lanes of a <2 x double> loaded from memory (shuffle mask
; <1, 0>).
; Expected lowering per the checks below: the SSE prefix uses a movaps load
; followed by shufps [2,3,0,1]; the AVX prefix expects a single vpermilpd with a
; memory operand.
define <2 x double> @shuffle_mem_v2f64_10(<2 x double>* %ptr) {
|
2014-10-01 05:44:34 +08:00
|
|
|
; SSE-LABEL: shuffle_mem_v2f64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SSE: # %bb.0:
|
2019-07-08 14:52:49 +08:00
|
|
|
; SSE-NEXT: movaps (%rdi), %xmm0
|
|
|
|
; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,3,0,1]
|
2014-09-21 06:09:27 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-LABEL: shuffle_mem_v2f64_10:
|
2017-12-05 01:18:51 +08:00
|
|
|
; AVX: # %bb.0:
|
2015-11-18 07:29:49 +08:00
|
|
|
; AVX-NEXT: vpermilpd {{.*#+}} xmm0 = mem[1,0]
|
|
|
|
; AVX-NEXT: retq
|
2015-10-25 23:32:04 +08:00
|
|
|
|
|
2015-02-28 05:17:42 +08:00
|
|
|
%a = load <2 x double>, <2 x double>* %ptr
|
2014-09-21 06:09:27 +08:00
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> undef, <2 x i32> <i32 1, i32 0>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
2018-07-18 15:31:30 +08:00
|
|
|
|
|
|
|
; Test: two-input shuffle where the second operand %c is loaded from memory.
; Mask <3, 1> builds the result from lane 1 of %c (result lane 0) and lane 1 of
; %a (result lane 1).
; Expected lowering per the checks below: a single movlps (SSE prefix) or
; vmovlps (AVX prefix) with a memory operand that replaces the low half of xmm0.
define <2 x double> @shuffle_mem_v2f64_31(<2 x double> %a, <2 x double>* %b) {
|
|
|
|
; SSE-LABEL: shuffle_mem_v2f64_31:
|
|
|
|
; SSE: # %bb.0:
|
|
|
|
; SSE-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_mem_v2f64_31:
|
|
|
|
; AVX: # %bb.0:
|
2018-07-18 15:31:32 +08:00
|
|
|
; AVX-NEXT: vmovlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
2018-07-18 15:31:30 +08:00
|
|
|
; AVX-NEXT: retq
|
|
|
|
%c = load <2 x double>, <2 x double>* %b
|
|
|
|
%f = shufflevector <2 x double> %a, <2 x double> %c, <2 x i32> <i32 3, i32 1>
|
|
|
|
ret <2 x double> %f
|
|
|
|
}
|
2019-07-07 01:59:41 +08:00
|
|
|
|
|
|
|
; Test: two-input shuffle where the second operand %b is loaded from memory
; with align 1. Mask <0, 2> builds the result from lane 0 of %a (result lane 0)
; and lane 0 of %b (result lane 1).
; Expected lowering per the checks below: a single movhps with a memory operand
; for the SSE prefix, and a single vunpcklpd with a memory operand for the AVX
; prefix.
define <2 x double> @shuffle_mem_v2f64_02(<2 x double> %a, <2 x double>* %pb) {
|
|
|
|
; SSE-LABEL: shuffle_mem_v2f64_02:
|
|
|
|
; SSE: # %bb.0:
|
2019-07-07 01:59:57 +08:00
|
|
|
; SSE-NEXT: movhps {{.*#+}} xmm0 = xmm0[0,1],mem[0,1]
|
2019-07-07 01:59:41 +08:00
|
|
|
; SSE-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_mem_v2f64_02:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vunpcklpd {{.*#+}} xmm0 = xmm0[0],mem[0]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%b = load <2 x double>, <2 x double>* %pb, align 1
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 2>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|
|
|
|
|
|
|
|
; Test: two-input shuffle where the second operand %b is loaded from memory
; with align 1. Mask <2, 1> builds the result from lane 0 of %b (result lane 0)
; and lane 1 of %a (result lane 1).
; Expected lowering per the checks below: SSE2/SSE3/SSSE3 use a single movlps
; with a memory operand; SSE41 uses a separate movups load into xmm1 followed by
; blendps; the AVX prefix expects a single vblendps with a memory operand.
define <2 x double> @shuffle_mem_v2f64_21(<2 x double> %a, <2 x double>* %pb) {
|
|
|
|
; SSE2-LABEL: shuffle_mem_v2f64_21:
|
|
|
|
; SSE2: # %bb.0:
|
2019-07-07 01:59:57 +08:00
|
|
|
; SSE2-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
2019-07-07 01:59:41 +08:00
|
|
|
; SSE2-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE3-LABEL: shuffle_mem_v2f64_21:
|
|
|
|
; SSE3: # %bb.0:
|
2019-07-07 01:59:57 +08:00
|
|
|
; SSE3-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
2019-07-07 01:59:41 +08:00
|
|
|
; SSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSSE3-LABEL: shuffle_mem_v2f64_21:
|
|
|
|
; SSSE3: # %bb.0:
|
2019-07-07 01:59:57 +08:00
|
|
|
; SSSE3-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
2019-07-07 01:59:41 +08:00
|
|
|
; SSSE3-NEXT: retq
|
|
|
|
;
|
|
|
|
; SSE41-LABEL: shuffle_mem_v2f64_21:
|
|
|
|
; SSE41: # %bb.0:
|
|
|
|
; SSE41-NEXT: movups (%rdi), %xmm1
|
|
|
|
; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm1[0,1],xmm0[2,3]
|
|
|
|
; SSE41-NEXT: retq
|
|
|
|
;
|
|
|
|
; AVX-LABEL: shuffle_mem_v2f64_21:
|
|
|
|
; AVX: # %bb.0:
|
|
|
|
; AVX-NEXT: vblendps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
|
|
|
|
; AVX-NEXT: retq
|
|
|
|
%b = load <2 x double>, <2 x double>* %pb, align 1
|
|
|
|
%shuffle = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 2, i32 1>
|
|
|
|
ret <2 x double> %shuffle
|
|
|
|
}
|