[AMDGPU] Remove -amdgpu-spill-sgpr-to-smem.
Summary: The implementation was never completed and never used except in tests.
Reviewers: arsenm, mareko
Subscribers: qcolombet, kzhuravl, jvesely, wdng, nhaehnle, yaxunl, dstuttard, tpr, t-tye, hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D69163
llvm-svn: 375293
2019-10-19 05:48:22 +08:00
|
|
|
; RUN: llc -O0 -march=amdgcn -mcpu=fiji -verify-machineinstrs < %s | FileCheck -check-prefix=ALL -check-prefix=VGPR %s
|
|
|
|
; RUN: llc -O0 -march=amdgcn -mcpu=fiji -amdgpu-spill-sgpr-to-vgpr=0 -verify-machineinstrs < %s | FileCheck -check-prefix=ALL -check-prefix=VMEM %s
|
2016-12-02 08:54:45 +08:00
|
|
|
|
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x2:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
|
[AMDGPU] Remove -amdgpu-spill-sgpr-to-smem.
Summary: The implementation was never completed and never used except in tests.
Reviewers: arsenm, mareko
Subscribers: qcolombet, kzhuravl, jvesely, wdng, nhaehnle, yaxunl, dstuttard, tpr, t-tye, hiraditya, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D69163
llvm-svn: 375293
2019-10-19 05:48:22 +08:00
|
|
|
|
2016-12-02 08:54:45 +08:00
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x2(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <2 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<2 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2019-03-21 20:01:21 +08:00
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x3:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x3(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <3 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<3 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-12-02 08:54:45 +08:00
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x4:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 3
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 3
|
|
|
|
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x4(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <4 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<4 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2019-03-22 18:11:21 +08:00
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x5:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 4
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 4
|
|
|
|
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x5(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <5 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<5 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
2016-12-02 08:54:45 +08:00
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x8:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 7
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 7
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x8(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <8 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<8 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
[AMDGPU] Remove assertion on S1024 SGPR to VGPR spill
Summary:
Replace an assertion that blocks S1024 SGPR to VGPR spill.
The assertion pre-dates S1024 and is not wave size dependent.
Reviewers: arsenm, sameerds, rampitec
Reviewed By: arsenm
Subscribers: qcolombet, kzhuravl, jvesely, wdng, nhaehnle, yaxunl, dstuttard, tpr, t-tye, hiraditya, kerbowa, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D80783
2020-05-30 10:15:39 +08:00
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x16:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 7
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 8
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 9
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 10
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 11
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 12
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 13
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 14
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 15
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 7
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 8
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 9
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 10
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 11
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 12
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 13
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 14
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 15
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x16(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <16 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<16 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; ALL-LABEL: {{^}}spill_sgpr_x32:
|
|
|
|
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 7
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 8
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 9
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 10
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 11
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 12
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 13
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 14
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 15
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 16
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 17
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 18
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 19
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 20
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 21
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 22
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 23
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 24
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 25
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 26
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 27
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 28
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 29
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 30
|
|
|
|
; VGPR: v_writelane_b32 v{{[0-9]+}}, s{{[0-9]+}}, 31
|
|
|
|
; VGPR: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 0
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 1
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 2
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 3
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 4
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 5
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 6
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 7
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 8
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 9
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 10
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 11
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 12
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 13
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 14
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 15
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 16
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 17
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 18
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 19
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 20
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 21
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 22
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 23
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 24
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 25
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 26
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 27
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 28
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 29
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 30
|
|
|
|
; VGPR: v_readlane_b32 s{{[0-9]+}}, v{{[0-9]+}}, 31
|
|
|
|
|
|
|
|
; VMEM: buffer_store_dword
|
|
|
|
; VMEM: s_cbranch_scc1
|
|
|
|
|
|
|
|
; VMEM: buffer_load_dword
|
|
|
|
define amdgpu_kernel void @spill_sgpr_x32(i32 addrspace(1)* %out, i32 %in) #0 {
|
|
|
|
%wide.sgpr = call <32 x i32> asm sideeffect "; def $0", "=s" () #0
|
|
|
|
%cmp = icmp eq i32 %in, 0
|
|
|
|
br i1 %cmp, label %bb0, label %ret
|
|
|
|
|
|
|
|
bb0:
|
|
|
|
call void asm sideeffect "; use $0", "s"(<32 x i32> %wide.sgpr) #0
|
|
|
|
br label %ret
|
|
|
|
|
|
|
|
ret:
|
|
|
|
ret void
|
|
|
|
}
|
2016-12-02 08:54:45 +08:00
|
|
|
|
|
|
|
attributes #0 = { nounwind }
|