llvm-project/llvm/test/CodeGen/Mips/v2i16tof32.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -O2 -mtriple mipsel--linux-android -mattr=+dsp -verify-machineinstrs | FileCheck %s

; Function below generates a v2i16 to f32 bitcast.
; Test that we are able to match it.

; @f: loads an <8 x i16> vector from %a, stores a copy of it to a stack slot,
; and returns lane 0 of the <4 x float> view of the loaded value.
; The two shuffles and the trailing bitcast/extract chain reduce to that single
; lane; the expected assembly below reflects this by moving the word loaded
; from 0($4) into $f0 with mtc1. The remaining lw/sw pairs copy the vector to
; the stack slot, and the "addiu $1, $zero, -16" / "and $sp, $sp, $1" pair
; rounds $sp down to a 16-byte boundary before that slot is used.
define float @f(<8 x i16>* %a) {
; CHECK-LABEL: f:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    addiu $sp, $sp, -32
; CHECK-NEXT:    .cfi_def_cfa_offset 32
; CHECK-NEXT:    sw $ra, 28($sp) # 4-byte Folded Spill
; CHECK-NEXT:    sw $fp, 24($sp) # 4-byte Folded Spill
; CHECK-NEXT:    .cfi_offset 31, -4
; CHECK-NEXT:    .cfi_offset 30, -8
; CHECK-NEXT:    move $fp, $sp
; CHECK-NEXT:    .cfi_def_cfa_register 30
; CHECK-NEXT:    addiu $1, $zero, -16
; CHECK-NEXT:    and $sp, $sp, $1
; CHECK-NEXT:    lw $1, 12($4)
; CHECK-NEXT:    lw $2, 0($4)
; CHECK-NEXT:    lw $3, 8($4)
; CHECK-NEXT:    sw $3, 8($sp)
; CHECK-NEXT:    sw $1, 12($sp)
; CHECK-NEXT:    sw $2, 0($sp)
; CHECK-NEXT:    lw $1, 4($4)
; CHECK-NEXT:    sw $1, 4($sp)
; CHECK-NEXT:    mtc1 $2, $f0
; CHECK-NEXT:    move $sp, $fp
; CHECK-NEXT:    lw $fp, 24($sp) # 4-byte Folded Reload
; CHECK-NEXT:    lw $ra, 28($sp) # 4-byte Folded Reload
; CHECK-NEXT:    jr $ra
; CHECK-NEXT:    addiu $sp, $sp, 32
entry:
  ; Stack copy of the input vector. %m is only written here; nothing in this
  ; function reads it back.
  %m = alloca <8 x i16>
  %0 = load <8 x i16>, <8 x i16>* %a
  store <8 x i16> %0, <8 x i16>* %m
  ; Reinterpret the eight i16 lanes as four float lanes.
  %1 = bitcast <8 x i16> %0 to <4 x float>
  ; Widen to eight lanes: lanes 0-3 take elements 0, 3, 2, 3 of %1, and
  ; lanes 4-7 are undef.
  %2 = shufflevector <4 x float> %1, <4 x float> undef, <8 x i32> <i32 0, i32 3, i32 2, i32 3, i32 undef, i32 undef, i32 undef, i32 undef>
  ; Mask indices 8-11 select lanes 0-3 of the second operand (%2); indices 4-7
  ; select lanes 4-7 of the first operand (the zero vector).
  %3 = shufflevector <8 x float> zeroinitializer, <8 x float> %2, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 4, i32 5, i32 6, i32 7>
  ; Pull lane 0 out as an i32 and hand the same bits back as the float result.
  %4 = bitcast <8 x float> %3 to <8 x i32>
  %5 = extractelement <8 x i32> %4, i32 0
  %6 = bitcast i32 %5 to float
  ret float %6
}
[mips] Provide additional DSP bitconvert patterns Previously, v2i16 -> f32 bitcast could not be matched. Add patterns to support matching this and similar types of bitcasts. Differential revision: https://reviews.llvm.org/D40959 llvm-svn: 320562 2017-12-13 18:13:35 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
			`; RUN: llc < %s -O2 -mtriple mipsel--linux-android -mattr=+dsp -verify-machineinstrs \| FileCheck %s`

			`; Function below generates a v2i16 to f32 bitcast.`
			`; Test that we are able to match it.`

			`define float @f(<8 x i16>* %a) {`
			`; CHECK-LABEL: f:`
			`; CHECK: # %bb.0: # %entry`
			`; CHECK-NEXT: addiu $sp, $sp, -32`
			`; CHECK-NEXT: .cfi_def_cfa_offset 32`
[Mips] Always save RA when disabling frame pointer elimination This ensures that frame-based unwinding will continue to work when calling a noreturn function; there is not much use having the caller's frame pointer saved if you don't also have the caller's program counter. Patch by James Clarke. Differential Revision: https://reviews.llvm.org/D68542 llvm-svn: 373907 2019-10-07 22:01:37 +08:00			`; CHECK-NEXT: sw $ra, 28($sp) # 4-byte Folded Spill`
			`; CHECK-NEXT: sw $fp, 24($sp) # 4-byte Folded Spill`
			`; CHECK-NEXT: .cfi_offset 31, -4`
			`; CHECK-NEXT: .cfi_offset 30, -8`
[mips] Provide additional DSP bitconvert patterns Previously, v2i16 -> f32 bitcast could not be matched. Add patterns to support matching this and similar types of bitcasts. Differential revision: https://reviews.llvm.org/D40959 llvm-svn: 320562 2017-12-13 18:13:35 +08:00			`; CHECK-NEXT: move $fp, $sp`
			`; CHECK-NEXT: .cfi_def_cfa_register 30`
			`; CHECK-NEXT: addiu $1, $zero, -16`
			`; CHECK-NEXT: and $sp, $sp, $1`
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later. Summary: A number of optimizations are inhibited by single-use TokenFactors not being merged into the TokenFactor using it. This makes we consider if we can do the merge immediately. Most tests changes here are due to the change in visitation causing minor reorderings and associated reassociation of paired memory operations. CodeGen tests with non-reordering changes: X86/aligned-variadic.ll -- memory-based add folded into stored leaq value. X86/constant-combiners.ll -- Optimizes out overlap between stores. X86/pr40631_deadstore_elision -- folds constant byte store into preceding quad word constant store. Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet Reviewed By: courbet Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D59260 llvm-svn: 356068 2019-03-14 01:07:09 +08:00			`; CHECK-NEXT: lw $1, 12($4)`
			`; CHECK-NEXT: lw $2, 0($4)`
			`; CHECK-NEXT: lw $3, 8($4)`
			`; CHECK-NEXT: sw $3, 8($sp)`
			`; CHECK-NEXT: sw $1, 12($sp)`
			`; CHECK-NEXT: sw $2, 0($sp)`
			`; CHECK-NEXT: lw $1, 4($4)`
			`; CHECK-NEXT: sw $1, 4($sp)`
			`; CHECK-NEXT: mtc1 $2, $f0`
[mips] Provide additional DSP bitconvert patterns Previously, v2i16 -> f32 bitcast could not be matched. Add patterns to support matching this and similar types of bitcasts. Differential revision: https://reviews.llvm.org/D40959 llvm-svn: 320562 2017-12-13 18:13:35 +08:00			`; CHECK-NEXT: move $sp, $fp`
[Mips] Always save RA when disabling frame pointer elimination This ensures that frame-based unwinding will continue to work when calling a noreturn function; there is not much use having the caller's frame pointer saved if you don't also have the caller's program counter. Patch by James Clarke. Differential Revision: https://reviews.llvm.org/D68542 llvm-svn: 373907 2019-10-07 22:01:37 +08:00			`; CHECK-NEXT: lw $fp, 24($sp) # 4-byte Folded Reload`
			`; CHECK-NEXT: lw $ra, 28($sp) # 4-byte Folded Reload`
[mips] Provide additional DSP bitconvert patterns Previously, v2i16 -> f32 bitcast could not be matched. Add patterns to support matching this and similar types of bitcasts. Differential revision: https://reviews.llvm.org/D40959 llvm-svn: 320562 2017-12-13 18:13:35 +08:00			`; CHECK-NEXT: jr $ra`
			`; CHECK-NEXT: addiu $sp, $sp, 32`
			`entry:`
			`%m = alloca <8 x i16>`
			`%0 = load <8 x i16>, <8 x i16>* %a`
			`store <8 x i16> %0, <8 x i16>* %m`
			`%1 = bitcast <8 x i16> %0 to <4 x float>`
			`%2 = shufflevector <4 x float> %1, <4 x float> undef, <8 x i32> <i32 0, i32 3, i32 2, i32 3, i32 undef, i32 undef, i32 undef, i32 undef>`
			`%3 = shufflevector <8 x float> zeroinitializer, <8 x float> %2, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 4, i32 5, i32 6, i32 7>`
			`%4 = bitcast <8 x float> %3 to <8 x i32>`
			`%5 = extractelement <8 x i32> %4, i32 0`
			`%6 = bitcast i32 %5 to float`
			`ret float %6`
			`}`