llvm-project/llvm/test/CodeGen/AMDGPU/fast-ra-kills-vcc.mir

63 lines
2.3 KiB
YAML

# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -verify-machineinstrs -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -run-pass=regallocfast -o - %s | FileCheck %s
# Make sure incorrect kills aren't emitted on vcc.
#
# In the input below, $vcc is written by V_CMP_NE_U32_e32 and then read twice:
# first by a copy into the physical pair $sgpr4_sgpr5, then by a copy into the
# virtual register %1, which feeds V_CNDMASK_B32_e64. The expected output has
# V_CNDMASK_B32_e64 reading $vcc directly, so the kill flag on $vcc belongs on
# that final read and must not appear on the earlier copy into $sgpr4_sgpr5.
---
name: foo
tracksRegLiveness: true
machineFunctionInfo:
isEntryFunction: true
scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3'
stackPtrOffsetReg: '$sgpr32'
body: |
bb.0:
liveins: $vgpr0
; Expected output after regallocfast (autogenerated; regenerate with
; utils/update_mir_test_checks.py instead of editing by hand).
; CHECK-LABEL: name: foo
; CHECK: liveins: $vgpr0
; CHECK: V_CMP_NE_U32_e32 0, killed $vgpr0, implicit-def $vcc, implicit $exec
; CHECK: $sgpr4_sgpr5 = COPY $vcc
; CHECK: renamable $vgpr0 = V_CNDMASK_B32_e64 0, -1, 0, 3, killed $vcc, implicit $exec
; CHECK: S_ENDPGM 0, implicit killed $vgpr0, implicit killed $sgpr4_sgpr5
; Input: the compare defines $vcc, which is then copied to a physical
; register pair and to the virtual register %1.
%0:vgpr_32 = COPY $vgpr0
V_CMP_NE_U32_e32 0, %0, implicit-def $vcc, implicit $exec
$sgpr4_sgpr5 = COPY $vcc
%1:sreg_64_xexec = COPY $vcc
%2:vgpr_32 = V_CNDMASK_B32_e64 0, -1, 0, 3, %1, implicit $exec
$vgpr0 = COPY %2
; Both $vgpr0 and $sgpr4_sgpr5 are read here, so they stay live to the end
; of the block.
S_ENDPGM 0, implicit $vgpr0, implicit $sgpr4_sgpr5
...
# This would hit "Unexpected reg unit state" assert.
#
# Variant of the case above in which both copies of $vcc go to virtual
# registers (%3 and %1), and %3 is still read by S_ENDPGM at the end. In the
# expected output the first copy lands in $sgpr4_sgpr5 and is saved to
# %stack.0, the second copy reuses $sgpr4_sgpr5, and the saved value is
# restored into $vcc before the final instructions.
---
name: bar
tracksRegLiveness: true
machineFunctionInfo:
isEntryFunction: true
scratchRSrcReg: '$sgpr0_sgpr1_sgpr2_sgpr3'
stackPtrOffsetReg: '$sgpr32'
body: |
bb.0:
liveins: $vgpr0
; Expected output after regallocfast (autogenerated; regenerate with
; utils/update_mir_test_checks.py instead of editing by hand). The spill
; and restore pseudos carry an implicit use of $sgpr32, the register named
; by stackPtrOffsetReg above.
; CHECK-LABEL: name: bar
; CHECK: liveins: $vgpr0
; CHECK: V_CMP_NE_U32_e32 0, killed $vgpr0, implicit-def $vcc, implicit $exec
; CHECK: renamable $sgpr4_sgpr5 = COPY $vcc
; CHECK: SI_SPILL_S64_SAVE $sgpr4_sgpr5, %stack.0, implicit $exec, implicit $sgpr32 :: (store 8 into %stack.0, align 4, addrspace 5)
; CHECK: renamable $sgpr4_sgpr5 = COPY $vcc
; CHECK: $vcc = SI_SPILL_S64_RESTORE %stack.0, implicit $exec, implicit $sgpr32 :: (load 8 from %stack.0, align 4, addrspace 5)
; CHECK: renamable $vgpr0 = V_CNDMASK_B32_e64 0, -1, 0, 3, killed $sgpr4_sgpr5, implicit $exec
; CHECK: S_ENDPGM 0, implicit killed $vgpr0, implicit killed renamable $vcc
; Input: the compare defines $vcc, which is copied into two virtual
; registers of class sreg_64_xexec.
%0:vgpr_32 = COPY $vgpr0
V_CMP_NE_U32_e32 0, %0, implicit-def $vcc, implicit $exec
%3:sreg_64_xexec = COPY $vcc
%1:sreg_64_xexec = COPY $vcc
%2:vgpr_32 = V_CNDMASK_B32_e64 0, -1, 0, 3, %1, implicit $exec
$vgpr0 = COPY %2
; %3 is read only here, after %1 has already been consumed by
; V_CNDMASK_B32_e64.
S_ENDPGM 0, implicit $vgpr0, implicit %3
...