llvm-project/llvm/test/CodeGen/X86/avx-cvt-2.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx | FileCheck %s

; Check that we generate vector conversions from <8 x float> to vectors with
; narrower integer elements (i16 and i8), for both fptoui and fptosi.

; Named vector types shared by the test functions in this file.
; Source operand: eight single-precision floats (256 bits in total).
%f32vec_t = type <8 x float>
; Destination with eight 16-bit integer elements (128 bits in total).
%i16vec_t = type <8 x i16>
; Destination with eight 8-bit integer elements (64 bits in total).
%i8vec_t =  type <8 x i8>

; fptoui16: convert the eight floats in %a to unsigned 16-bit integers with a
; single vector fptoui and store the <8 x i16> result through %p.
;
; The autogenerated assertions below expect one ymm-wide vcvttps2dq. The two
; 128-bit halves are then narrowed with the same vpshufb mask (bytes 0,1,4,5,
; 8,9,12,13, i.e. the low two bytes of every 32-bit element), recombined with
; vpunpcklqdq and written with a 128-bit vmovdqa. The expected sequence is
; identical to the one asserted for fptosi16.
define void @fptoui16(%f32vec_t %a, %i16vec_t *%p) {
; CHECK-LABEL: fptoui16:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttps2dq %ymm0, %ymm0
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm1
; CHECK-NEXT:    vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]
; CHECK-NEXT:    vpshufb %xmm2, %xmm1, %xmm1
; CHECK-NEXT:    vpshufb %xmm2, %xmm0, %xmm0
; CHECK-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; CHECK-NEXT:    vmovdqa %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  ; Conversion under test: <8 x float> -> <8 x i16>, unsigned.
  %b = fptoui %f32vec_t %a to %i16vec_t
  ; The store carries no explicit alignment; the assertions above expect an
  ; aligned 128-bit vmovdqa for it.
  store %i16vec_t %b, %i16vec_t * %p
  ret void
}

; fptosi16: convert the eight floats in %a to signed 16-bit integers with a
; single vector fptosi and store the <8 x i16> result through %p.
;
; The autogenerated assertions below expect one ymm-wide vcvttps2dq. The two
; 128-bit halves are then narrowed with the same vpshufb mask (bytes 0,1,4,5,
; 8,9,12,13, i.e. the low two bytes of every 32-bit element), recombined with
; vpunpcklqdq and written with a 128-bit vmovdqa. The expected sequence is
; identical to the one asserted for fptoui16.
define void @fptosi16(%f32vec_t %a, %i16vec_t *%p) {
; CHECK-LABEL: fptosi16:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttps2dq %ymm0, %ymm0
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm1
; CHECK-NEXT:    vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]
; CHECK-NEXT:    vpshufb %xmm2, %xmm1, %xmm1
; CHECK-NEXT:    vpshufb %xmm2, %xmm0, %xmm0
; CHECK-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; CHECK-NEXT:    vmovdqa %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  ; Conversion under test: <8 x float> -> <8 x i16>, signed.
  %b = fptosi %f32vec_t %a to %i16vec_t
  ; The store carries no explicit alignment; the assertions above expect an
  ; aligned 128-bit vmovdqa for it.
  store %i16vec_t %b, %i16vec_t * %p
  ret void
}

; fptoui8: convert the eight floats in %a to unsigned 8-bit integers with a
; single vector fptoui and store the <8 x i8> result through %p.
;
; The autogenerated assertions below expect the same opening as the 16-bit
; tests (one ymm-wide vcvttps2dq, a vpshufb of each 128-bit half with a shared
; mask, then vpunpcklqdq), followed by a vpackuswb of the register with itself
; and a 64-bit vmovq store. The signed counterpart, fptosi8, differs only in
; expecting vpacksswb instead of vpackuswb.
define void @fptoui8(%f32vec_t %a, %i8vec_t *%p) {
; CHECK-LABEL: fptoui8:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttps2dq %ymm0, %ymm0
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm1
; CHECK-NEXT:    vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]
; CHECK-NEXT:    vpshufb %xmm2, %xmm1, %xmm1
; CHECK-NEXT:    vpshufb %xmm2, %xmm0, %xmm0
; CHECK-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; CHECK-NEXT:    vpackuswb %xmm0, %xmm0, %xmm0
; CHECK-NEXT:    vmovq %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  ; Conversion under test: <8 x float> -> <8 x i8>, unsigned.
  %b = fptoui %f32vec_t %a to %i8vec_t
  ; The result is 64 bits wide, which the assertions above expect to be
  ; written with a single vmovq.
  store %i8vec_t %b, %i8vec_t * %p
  ret void
}

; fptosi8: convert the eight floats in %a to signed 8-bit integers with a
; single vector fptosi and store the <8 x i8> result through %p.
;
; The autogenerated assertions below expect the same opening as the 16-bit
; tests (one ymm-wide vcvttps2dq, a vpshufb of each 128-bit half with a shared
; mask, then vpunpcklqdq), followed by a vpacksswb of the register with itself
; and a 64-bit vmovq store. The unsigned counterpart, fptoui8, differs only in
; expecting vpackuswb instead of vpacksswb.
define void @fptosi8(%f32vec_t %a, %i8vec_t *%p) {
; CHECK-LABEL: fptosi8:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttps2dq %ymm0, %ymm0
; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm1
; CHECK-NEXT:    vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]
; CHECK-NEXT:    vpshufb %xmm2, %xmm1, %xmm1
; CHECK-NEXT:    vpshufb %xmm2, %xmm0, %xmm0
; CHECK-NEXT:    vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]
; CHECK-NEXT:    vpacksswb %xmm0, %xmm0, %xmm0
; CHECK-NEXT:    vmovq %xmm0, (%rdi)
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  ; Conversion under test: <8 x float> -> <8 x i8>, signed.
  %b = fptosi %f32vec_t %a to %i8vec_t
  ; The result is 64 bits wide, which the assertions above expect to be
  ; written with a single vmovq.
  store %i8vec_t %b, %i8vec_t * %p
  ret void
}
Make utils/update_llc_test_checks.py note that the assertions are autogenerated. Also update existing test cases which appear to be generated by it and weren't modified (other than addition of the header) by rerunning it. llvm-svn: 253917 2015-11-24 05:33:58 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx \| FileCheck %s`
[VectorLegalizer/X86] Don't unvectorize fp_to_uint for v8f32->v8i16 Rather than LegalizeAction::Expand, this needs LegalizeAction::Promote to get promoted to fp_to_sint v8f32->v8i32. This is a legal operation on AVX. For that to work properly, we also need to teach the legalizer about the specific promotion required here. The default vector promotion uses bitcasting to a vector type of the same total size. We want to promote the vector element type, effectively widening the operation and then truncating the result. This is analogous to the current logic of how int_to_fp is promoted. The change also factors out some code from the int_to_fp promotion code to ValueType::widenIntegerVectorElementType. This is now shared between int_to_fp and fp_to_int. There is no longer need for the custom lowering of fp_to_sint f32->v8i16 in X86. It can now go through the new target-independent fp_to_*int promotion logic. I also checked that no other target uses Promote for these ops yet, so there shouldn't be any unexpected change in behavior. Fixes <rdar://problem/16202247> llvm-svn: 204058 2014-03-18 01:06:14 +08:00
			`; Check that we generate vector conversion from float to narrower int types`

			`%f32vec_t = type <8 x float>`
			`%i16vec_t = type <8 x i16>`
			`%i8vec_t = type <8 x i8>`

			`define void @fptoui16(%f32vec_t %a, %i16vec_t *%p) {`
			`; CHECK-LABEL: fptoui16:`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttps2dq %ymm0, %ymm0`
			`; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm1`
			`; CHECK-NEXT: vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm1, %xmm1`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm0, %xmm0`
			`; CHECK-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]`
			`; CHECK-NEXT: vmovdqa %xmm0, (%rdi)`
			`; CHECK-NEXT: vzeroupper`
			`; CHECK-NEXT: retq`
[VectorLegalizer/X86] Don't unvectorize fp_to_uint for v8f32->v8i16 Rather than LegalizeAction::Expand, this needs LegalizeAction::Promote to get promoted to fp_to_sint v8f32->v8i32. This is a legal operation on AVX. For that to work properly, we also need to teach the legalizer about the specific promotion required here. The default vector promotion uses bitcasting to a vector type of the same total size. We want to promote the vector element type, effectively widening the operation and then truncating the result. This is analogous to the current logic of how int_to_fp is promoted. The change also factors out some code from the int_to_fp promotion code to ValueType::widenIntegerVectorElementType. This is now shared between int_to_fp and fp_to_int. There is no longer need for the custom lowering of fp_to_sint f32->v8i16 in X86. It can now go through the new target-independent fp_to_*int promotion logic. I also checked that no other target uses Promote for these ops yet, so there shouldn't be any unexpected change in behavior. Fixes <rdar://problem/16202247> llvm-svn: 204058 2014-03-18 01:06:14 +08:00			`%b = fptoui %f32vec_t %a to %i16vec_t`
			`store %i16vec_t %b, %i16vec_t * %p`
			`ret void`
			`}`

			`define void @fptosi16(%f32vec_t %a, %i16vec_t *%p) {`
			`; CHECK-LABEL: fptosi16:`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttps2dq %ymm0, %ymm0`
			`; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm1`
			`; CHECK-NEXT: vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm1, %xmm1`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm0, %xmm0`
			`; CHECK-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]`
			`; CHECK-NEXT: vmovdqa %xmm0, (%rdi)`
			`; CHECK-NEXT: vzeroupper`
			`; CHECK-NEXT: retq`
[VectorLegalizer/X86] Don't unvectorize fp_to_uint for v8f32->v8i16 Rather than LegalizeAction::Expand, this needs LegalizeAction::Promote to get promoted to fp_to_sint v8f32->v8i32. This is a legal operation on AVX. For that to work properly, we also need to teach the legalizer about the specific promotion required here. The default vector promotion uses bitcasting to a vector type of the same total size. We want to promote the vector element type, effectively widening the operation and then truncating the result. This is analogous to the current logic of how int_to_fp is promoted. The change also factors out some code from the int_to_fp promotion code to ValueType::widenIntegerVectorElementType. This is now shared between int_to_fp and fp_to_int. There is no longer need for the custom lowering of fp_to_sint f32->v8i16 in X86. It can now go through the new target-independent fp_to_*int promotion logic. I also checked that no other target uses Promote for these ops yet, so there shouldn't be any unexpected change in behavior. Fixes <rdar://problem/16202247> llvm-svn: 204058 2014-03-18 01:06:14 +08:00			`%b = fptosi %f32vec_t %a to %i16vec_t`
			`store %i16vec_t %b, %i16vec_t * %p`
			`ret void`
			`}`

			`define void @fptoui8(%f32vec_t %a, %i8vec_t *%p) {`
			`; CHECK-LABEL: fptoui8:`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttps2dq %ymm0, %ymm0`
			`; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm1`
			`; CHECK-NEXT: vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm1, %xmm1`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm0, %xmm0`
			`; CHECK-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]`
[X86][SSE] Add support for lowering shuffles to PACKSS/PACKUS If the upper bits of a truncation shuffle patterns have at least the minimum number of sign/zero bits on their inputs then we can safely use PACKSS/PACKUS as shuffles. Partial fix for https://bugs.llvm.org/show_bug.cgi?id=34773 Differential Revision: https://reviews.llvm.org/D38472 llvm-svn: 314788 2017-10-03 20:01:31 +08:00			`; CHECK-NEXT: vpackuswb %xmm0, %xmm0, %xmm0`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK-NEXT: vmovq %xmm0, (%rdi)`
			`; CHECK-NEXT: vzeroupper`
			`; CHECK-NEXT: retq`
[VectorLegalizer/X86] Don't unvectorize fp_to_uint for v8f32->v8i16 Rather than LegalizeAction::Expand, this needs LegalizeAction::Promote to get promoted to fp_to_sint v8f32->v8i32. This is a legal operation on AVX. For that to work properly, we also need to teach the legalizer about the specific promotion required here. The default vector promotion uses bitcasting to a vector type of the same total size. We want to promote the vector element type, effectively widening the operation and then truncating the result. This is analogous to the current logic of how int_to_fp is promoted. The change also factors out some code from the int_to_fp promotion code to ValueType::widenIntegerVectorElementType. This is now shared between int_to_fp and fp_to_int. There is no longer need for the custom lowering of fp_to_sint f32->v8i16 in X86. It can now go through the new target-independent fp_to_*int promotion logic. I also checked that no other target uses Promote for these ops yet, so there shouldn't be any unexpected change in behavior. Fixes <rdar://problem/16202247> llvm-svn: 204058 2014-03-18 01:06:14 +08:00			`%b = fptoui %f32vec_t %a to %i8vec_t`
			`store %i8vec_t %b, %i8vec_t * %p`
			`ret void`
			`}`

			`define void @fptosi8(%f32vec_t %a, %i8vec_t *%p) {`
			`; CHECK-LABEL: fptosi8:`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttps2dq %ymm0, %ymm0`
			`; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm1`
			`; CHECK-NEXT: vmovdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm1, %xmm1`
			`; CHECK-NEXT: vpshufb %xmm2, %xmm0, %xmm0`
			`; CHECK-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm1[0]`
[X86][SSE] Add support for lowering shuffles to PACKSS/PACKUS If the upper bits of a truncation shuffle patterns have at least the minimum number of sign/zero bits on their inputs then we can safely use PACKSS/PACKUS as shuffles. Partial fix for https://bugs.llvm.org/show_bug.cgi?id=34773 Differential Revision: https://reviews.llvm.org/D38472 llvm-svn: 314788 2017-10-03 20:01:31 +08:00			`; CHECK-NEXT: vpacksswb %xmm0, %xmm0, %xmm0`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234029 2015-04-04 01:17:50 +08:00			`; CHECK-NEXT: vmovq %xmm0, (%rdi)`
			`; CHECK-NEXT: vzeroupper`
			`; CHECK-NEXT: retq`
[VectorLegalizer/X86] Don't unvectorize fp_to_uint for v8f32->v8i16 Rather than LegalizeAction::Expand, this needs LegalizeAction::Promote to get promoted to fp_to_sint v8f32->v8i32. This is a legal operation on AVX. For that to work properly, we also need to teach the legalizer about the specific promotion required here. The default vector promotion uses bitcasting to a vector type of the same total size. We want to promote the vector element type, effectively widening the operation and then truncating the result. This is analogous to the current logic of how int_to_fp is promoted. The change also factors out some code from the int_to_fp promotion code to ValueType::widenIntegerVectorElementType. This is now shared between int_to_fp and fp_to_int. There is no longer need for the custom lowering of fp_to_sint f32->v8i16 in X86. It can now go through the new target-independent fp_to_*int promotion logic. I also checked that no other target uses Promote for these ops yet, so there shouldn't be any unexpected change in behavior. Fixes <rdar://problem/16202247> llvm-svn: 204058 2014-03-18 01:06:14 +08:00			`%b = fptosi %f32vec_t %a to %i8vec_t`
			`store %i8vec_t %b, %i8vec_t * %p`
			`ret void`
			`}`