; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+sse2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE2
; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+sse4.1 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE41

; Make sure that the conversion from v4i8 to v2i16 is not a simple bitcast.
;
; @prom_bug reinterprets its <4 x i8> argument %t as <2 x i16>, extracts
; element 0 and stores that i16 through %p. The expected code below must
; compact the four byte elements before the 16-bit extract: with +sse2 this is
; a pand with a constant-pool mask followed by two packuswb; with +sse4.1 it is
; a single pshufb that gathers bytes 0, 4, 8 and 12 of xmm0. Extracting word 0
; of xmm0 directly, without that compaction, is the miscompile being guarded
; against.
define void @prom_bug(<4 x i8> %t, i16* %p) {
; SSE2-LABEL: prom_bug:
; SSE2:       ## %bb.0:
; SSE2-NEXT:    pand {{.*}}(%rip), %xmm0
; SSE2-NEXT:    packuswb %xmm0, %xmm0
; SSE2-NEXT:    packuswb %xmm0, %xmm0
; SSE2-NEXT:    pextrw $0, %xmm0, %eax
; SSE2-NEXT:    movw %ax, (%rdi)
; SSE2-NEXT:    retq
;
; SSE41-LABEL: prom_bug:
; SSE41:       ## %bb.0:
; SSE41-NEXT:    pshufb {{.*#+}} xmm0 = xmm0[0,4,8,12,u,u,u,u,u,u,u,u,u,u,u,u]
; SSE41-NEXT:    pextrw $0, %xmm0, (%rdi)
; SSE41-NEXT:    retq
  %r = bitcast <4 x i8> %t to <2 x i16>      ; same 32 bits, viewed as two i16 elements
  %o = extractelement <2 x i16> %r, i32 0    ; keep only element 0
  store i16 %o, i16* %p                      ; the only observable effect of the function
  ret void
}