forked from OSchip/llvm-project
40 lines
1.4 KiB
LLVM
40 lines
1.4 KiB
LLVM
; RUN: llc -mtriple=x86_64-apple-darwin -mattr=+sse2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
; RUN: opt -mtriple=x86_64-apple-darwin -mattr=+sse2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s

; Left shift of a <4 x i32> by one scalar amount broadcast to every lane.
; With +sse2 the checks below require the cost model to report a cost of 1
; for the vector shift, and the generated code to move the amount into an
; XMM register (movd) and apply a single pslld.
define <4 x i32> @shl(<4 x i32> %vector, i32 %scalar) {
; The -LABEL directives pin the following checks to this function's output,
; so they cannot be satisfied by lines emitted for a neighbouring function.
; SSE2-LABEL: 'shl'
; SSE2: cost of 1 {{.*}} shl
; SSE2-CODEGEN-LABEL: shl:
; SSE2-CODEGEN: movd %edi, %xmm1
; SSE2-CODEGEN: pslld %xmm1, %xmm0
entry:
  ; Place the amount in lane 0, then replicate lane 0 with an all-zero mask.
  %insert = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %splat = shufflevector <4 x i32> %insert, <4 x i32> undef, <4 x i32> zeroinitializer
  %ret = shl <4 x i32> %vector, %splat
  ret <4 x i32> %ret
}
|
|
|
|
; Arithmetic right shift of a <4 x i32> by one scalar amount broadcast to
; every lane. With +sse2 the checks below require the cost model to report a
; cost of 1 for the vector shift, and the generated code to move the amount
; into an XMM register (movd) and apply a single psrad.
define <4 x i32> @ashr(<4 x i32> %vector, i32 %scalar) {
; The -LABEL directives pin the following checks to this function's output,
; so they cannot be satisfied by lines emitted for a neighbouring function.
; SSE2-LABEL: 'ashr'
; SSE2: cost of 1 {{.*}} ashr
; SSE2-CODEGEN-LABEL: ashr:
; SSE2-CODEGEN: movd %edi, %xmm1
; SSE2-CODEGEN: psrad %xmm1, %xmm0
entry:
  ; Place the amount in lane 0, then replicate lane 0 with an all-zero mask.
  %insert = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %splat = shufflevector <4 x i32> %insert, <4 x i32> undef, <4 x i32> zeroinitializer
  %ret = ashr <4 x i32> %vector, %splat
  ret <4 x i32> %ret
}
|
|
|
|
; Logical right shift of a <4 x i32> by one scalar amount broadcast to every
; lane. With +sse2 the checks below require the cost model to report a cost
; of 1 for the vector shift, and the generated code to move the amount into
; an XMM register (movd) and apply a single psrld.
define <4 x i32> @lshr(<4 x i32> %vector, i32 %scalar) {
; The -LABEL directives pin the following checks to this function's output,
; so they cannot be satisfied by lines emitted for a neighbouring function.
; SSE2-LABEL: 'lshr'
; SSE2: cost of 1 {{.*}} lshr
; SSE2-CODEGEN-LABEL: lshr:
; SSE2-CODEGEN: movd %edi, %xmm1
; SSE2-CODEGEN: psrld %xmm1, %xmm0
entry:
  ; Place the amount in lane 0, then replicate lane 0 with an all-zero mask.
  %insert = insertelement <4 x i32> undef, i32 %scalar, i32 0
  %splat = shufflevector <4 x i32> %insert, <4 x i32> undef, <4 x i32> zeroinitializer
  %ret = lshr <4 x i32> %vector, %splat
  ret <4 x i32> %ret
}
|
|
|