forked from OSchip/llvm-project
AMDGPU: Fix assert on inline asm on gfx90a
This was assuming all mayLoad instructions have one def.
This commit is contained in:
parent
e60d6e91e1
commit
b58332774f
|
@ -1655,7 +1655,7 @@ bool SIFoldOperands::tryFoldLCSSAPhi(MachineInstr &PHI) {
|
|||
// Attempt to convert VGPR load to an AGPR load.
|
||||
bool SIFoldOperands::tryFoldLoad(MachineInstr &MI) {
|
||||
assert(MI.mayLoad());
|
||||
if (!ST->hasGFX90AInsts() || !MI.getNumOperands())
|
||||
if (!ST->hasGFX90AInsts() || MI.getNumExplicitDefs() != 1)
|
||||
return false;
|
||||
|
||||
MachineOperand &Def = MI.getOperand(0);
|
||||
|
|
|
@ -0,0 +1,13 @@
|
|||
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a < %s
|
||||
|
||||
define protected amdgpu_kernel void @foo(i64 addrspace(1)* %arg, i64 addrspace(1)* %arg1) {
|
||||
bb:
|
||||
%tmp = addrspacecast i64* addrspace(5)* null to i64**
|
||||
%tmp2 = call i64 @eggs(i64* undef) #1
|
||||
%tmp3 = load i64*, i64** %tmp, align 8
|
||||
%tmp4 = getelementptr inbounds i64, i64* %tmp3, i64 undef
|
||||
store i64 %tmp2, i64* %tmp4, align 8
|
||||
ret void
|
||||
}
|
||||
|
||||
declare hidden i64 @eggs(i64*)
|
|
@ -100,3 +100,18 @@ body: |
|
|||
S_ENDPGM 0
|
||||
|
||||
...
|
||||
|
||||
# This would crash looking for a def in any mayLoad instruction
|
||||
---
|
||||
name: fold_inlineasm_def
|
||||
tracksRegLiveness: true
|
||||
body: |
|
||||
bb.0:
|
||||
|
||||
; CHECK-LABEL: name: fold_inlineasm_def
|
||||
; CHECK: INLINEASM &"s_waitcnt vmcnt($0)", 41 /* sideeffect mayload isconvergent attdialect */, 13 /* imm */, 0
|
||||
; CHECK: S_ENDPGM 0
|
||||
INLINEASM &"s_waitcnt vmcnt($0)", 41 /* sideeffect mayload isconvergent attdialect */, 13 /* imm */, 0
|
||||
S_ENDPGM 0
|
||||
|
||||
...
|
||||
|
|
Loading…
Reference in New Issue