llvm-project/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.sendmsg.ll

; The test is compiled for three targets; each run enables its own set of
; FileCheck prefixes:
;   verde  -> GCN, SI, SIVI
;   tonga  -> GCN, VIPLUS, SIVI
;   gfx900 -> GCN, VIPLUS, GFX9
; NOTE(review): no check line visible in this file uses the bare SI prefix;
; confirm whether it is still needed.
;RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s
;RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=VIPLUS -check-prefix=SIVI %s
;RUN: llc -march=amdgcn -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=VIPLUS -check-prefix=GFX9 %s

; s_sendmsg with message immediate 1 and a constant 0 for the m0 operand.
; Expected on every run: m0 is written with 0, no further write to m0 appears
; before the message, and the immediate is printed symbolically as
; MSG_INTERRUPT.
; GCN-LABEL: {{^}}test_interrupt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsg sendmsg(MSG_INTERRUPT)
define amdgpu_kernel void @test_interrupt() {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 1, i32 0)
  ret void
}

; s_sendmsg with message immediate 34 (0x22) and a constant 0 for m0.
; The immediate is expected to print as MSG_GS with GS_OP_EMIT on stream 0.
; NOTE(review): presumably the message id sits in bits [3:0], the GS op in
; bits [5:4] and the stream id in bits [9:8] - confirm against the ISA docs.
; GCN-LABEL: {{^}}test_gs_emit:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT, 0)
define amdgpu_kernel void @test_gs_emit() {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 34, i32 0)
  ret void
}

; s_sendmsg with message immediate 274 (0x112) and a constant 0 for m0.
; The immediate is expected to print as MSG_GS with GS_OP_CUT on stream 1.
; As in the other constant-m0 tests, only one write to m0 may precede the
; message.
; GCN-LABEL: {{^}}test_gs_cut:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_CUT, 1)
define amdgpu_kernel void @test_gs_cut() {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 274, i32 0)
  ret void
}

; s_sendmsg with message immediate 562 (0x232) and a constant 0 for m0.
; The immediate is expected to print as MSG_GS with GS_OP_EMIT_CUT on
; stream 2, preceded by a single write of 0 to m0.
; GCN-LABEL: {{^}}test_gs_emit_cut:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT_CUT, 2)
define amdgpu_kernel void @test_gs_emit_cut() {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 562, i32 0)
  ret void
}

; s_sendmsg with message immediate 3 and a constant 0 for m0.
; The immediate is expected to print as MSG_GS_DONE with GS_OP_NOP (no
; stream operand is printed), preceded by a single write of 0 to m0.
; GCN-LABEL: {{^}}test_gs_done:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_NOP)
define amdgpu_kernel void @test_gs_done() {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 3, i32 0)
  ret void
}

; s_sendmsg with message immediate 9 and the m0 operand taken from the inreg
; argument %a (expected to arrive in s0).
; The printed form of the message differs per target: the verde and tonga
; runs expect the raw numeric form sendmsg(9, 0, 0), while the gfx900 run
; expects the symbolic name MSG_GS_ALLOC_REQ.
; The tonga and gfx900 runs additionally expect an s_nop 0 on the line right
; after the m0 write.
; GCN-LABEL: {{^}}test_gs_alloc_req:
; GCN: s_mov_b32 m0, s0
; GCN-NOT: s_mov_b32 m0
; VIPLUS-NEXT: s_nop 0
; SIVI: s_sendmsg sendmsg(9, 0, 0)
; GFX9: s_sendmsg sendmsg(MSG_GS_ALLOC_REQ)
define amdgpu_kernel void @test_gs_alloc_req(i32 inreg %a) {
body:
  call void @llvm.amdgcn.s.sendmsg(i32 9, i32 %a)
  ret void
}

; s_sendmsg from a geometry-shader entry point with the m0 operand taken from
; the inreg argument %a (expected in s0).
; The NEXT checks pin the exact instruction sequence from the m0 write to
; s_endpgm; the tonga and gfx900 runs expect one s_nop 0 between the m0 write
; and the message.
; The message check spells out the s_sendmsg mnemonic so that an
; s_sendmsghalt with the same operand cannot satisfy it.
; GCN-LABEL: {{^}}sendmsg:
; GCN: s_mov_b32 m0, s0
; VIPLUS-NEXT: s_nop 0
; GCN-NEXT: s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_NOP)
; GCN-NEXT: s_endpgm
define amdgpu_gs void @sendmsg(i32 inreg %a) #0 {
  call void @llvm.amdgcn.s.sendmsg(i32 3, i32 %a)
  ret void
}

; s_sendmsghalt with message immediate 1 and the m0 operand taken from the
; inreg argument %a (expected in s0).
; The NEXT checks pin the exact instruction sequence from the m0 write to
; s_endpgm; the tonga and gfx900 runs expect one s_nop 0 between the m0 write
; and the message.
; GCN-LABEL: {{^}}sendmsghalt:
; GCN: s_mov_b32 m0, s0
; VIPLUS-NEXT: s_nop 0
; GCN-NEXT: s_sendmsghalt sendmsg(MSG_INTERRUPT)
; GCN-NEXT: s_endpgm
define amdgpu_kernel void @sendmsghalt(i32 inreg %a) #0 {
  call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 %a)
  ret void
}

; Halt variant of test_interrupt: s_sendmsghalt with message immediate 1 and
; a constant 0 for m0. Expects a single write of 0 to m0 followed by the
; message printed as MSG_INTERRUPT.
; GCN-LABEL: {{^}}test_interrupt_halt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsghalt sendmsg(MSG_INTERRUPT)
define amdgpu_kernel void @test_interrupt_halt() {
body:
  call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 0)
  ret void
}

; Halt variant of test_gs_emit: s_sendmsghalt with message immediate 34
; (0x22) and a constant 0 for m0. The immediate is expected to print as
; MSG_GS with GS_OP_EMIT on stream 0.
; GCN-LABEL: {{^}}test_gs_emit_halt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_EMIT, 0)
define amdgpu_kernel void @test_gs_emit_halt() {
body:
  call void @llvm.amdgcn.s.sendmsghalt(i32 34, i32 0)
  ret void
}

; Halt variant of test_gs_cut: s_sendmsghalt with message immediate 274
; (0x112) and a constant 0 for m0. The immediate is expected to print as
; MSG_GS with GS_OP_CUT on stream 1.
; GCN-LABEL: {{^}}test_gs_cut_halt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_CUT, 1)
define amdgpu_kernel void @test_gs_cut_halt() {
body:
  call void @llvm.amdgcn.s.sendmsghalt(i32 274, i32 0)
  ret void
}

; Halt variant of test_gs_emit_cut: s_sendmsghalt with message immediate 562
; (0x232) and a constant 0 for m0. The immediate is expected to print as
; MSG_GS with GS_OP_EMIT_CUT on stream 2.
; GCN-LABEL: {{^}}test_gs_emit_cut_halt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_EMIT_CUT, 2)
define amdgpu_kernel void @test_gs_emit_cut_halt() {
body:
  call void @llvm.amdgcn.s.sendmsghalt(i32 562, i32 0)
  ret void
}

; Halt variant of test_gs_done: s_sendmsghalt with message immediate 3 and a
; constant 0 for m0. The immediate is expected to print as MSG_GS_DONE with
; GS_OP_NOP.
; GCN-LABEL: {{^}}test_gs_done_halt:
; GCN: s_mov_b32 m0, 0
; GCN-NOT: s_mov_b32 m0
; GCN: s_sendmsghalt sendmsg(MSG_GS_DONE, GS_OP_NOP)
define amdgpu_kernel void @test_gs_done_halt() {
body:
  call void @llvm.amdgcn.s.sendmsghalt(i32 3, i32 0)
  ret void
}

; The m0 operand here is computed rather than constant:
; (%arg & 511) * 12288. The mask limits the first factor to 9 bits.
; The checks pin the lowering as it currently is: a 24-bit VALU multiply,
; then v_readfirstlane_b32, then the m0 write (any source operand is
; accepted) and finally the message.
;
; TODO: This should use s_mul_i32 instead of v_mul_u32_u24 + v_readfirstlane!
;
; GCN-LABEL: {{^}}test_mul24:
; GCN: v_mul_u32_u24_e32
; GCN: v_readfirstlane_b32
; GCN: s_mov_b32 m0,
; GCN: s_sendmsg sendmsg(MSG_INTERRUPT)
define amdgpu_gs void @test_mul24(i32 inreg %arg) {
body:
  %tmp1 = and i32 %arg, 511
  %tmp2 = mul nuw nsw i32 %tmp1, 12288
  call void @llvm.amdgcn.s.sendmsg(i32 1, i32 %tmp2)
  ret void
}

; The message is sent only on the path taken when %flag == 0; both paths
; join at %end.
; The checks require an s_cbranch_execz to appear before the s_sendmsg, i.e.
; the conditional block holding the message must be guarded by a skip branch.
; NOTE(review): %flag is not marked inreg, so the condition is presumably
; per-lane (divergent) - confirm against the calling convention.
; GCN-LABEL: {{^}}if_sendmsg:
; GCN: s_cbranch_execz
; GCN: s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_NOP)
define amdgpu_gs void @if_sendmsg(i32 %flag) #0 {
  %cc = icmp eq i32 %flag, 0
  br i1 %cc, label %sendmsg, label %end

sendmsg:
  call void @llvm.amdgcn.s.sendmsg(i32 3, i32 0)
  br label %end

end:
  ret void
}

; Intrinsics under test. As used by the functions in this file, the first
; operand is the constant message immediate and the second operand is the
; value the checks expect to be moved into m0.
declare void @llvm.amdgcn.s.sendmsg(i32, i32) #0
declare void @llvm.amdgcn.s.sendmsghalt(i32, i32) #0

; Attribute group #0 is attached to both declarations and to the sendmsg,
; sendmsghalt and if_sendmsg definitions.
attributes #0 = { nounwind }
[AMDGPU] gfx1010 tests. NFC. llvm-svn: 360615 2019-05-14 03:30:06 +08:00			`;RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s \| FileCheck -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s`
			`;RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s \| FileCheck -check-prefix=GCN -check-prefix=VIPLUS -check-prefix=SIVI %s`
			`;RUN: llc -march=amdgcn -mcpu=gfx900 -verify-machineinstrs < %s \| FileCheck -check-prefix=GCN -check-prefix=VIPLUS -check-prefix=GFX9 %s`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00
			`; GCN-LABEL: {{^}}test_interrupt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsg sendmsg(MSG_INTERRUPT)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_interrupt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 1, i32 0);`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_emit:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT, 0)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_emit() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 34, i32 0);`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_cut:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_CUT, 1)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_cut() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 274, i32 0);`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_emit_cut:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT_CUT, 2)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_emit_cut() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 562, i32 0)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_done:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_NOP)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_done() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 3, i32 0)`
			`ret void`
			`}`

[AMDGPU] gfx1010 tests. NFC. llvm-svn: 360615 2019-05-14 03:30:06 +08:00			`; GCN-LABEL: {{^}}test_gs_alloc_req:`
			`; GCN: s_mov_b32 m0, s0`
			`; GCN-NOT: s_mov_b32 m0`
			`; VIPLUS-NEXT: s_nop 0`
[AMDGPU][MC] Enabled constant expressions as operands of sendmsg See bug 40820: https://bugs.llvm.org/show_bug.cgi?id=40820 Reviewers: artem.tamazov, arsenm Differential Revision: https://reviews.llvm.org/D62735 llvm-svn: 364645 2019-06-28 22:14:02 +08:00			`; SIVI: s_sendmsg sendmsg(9, 0, 0)`
[AMDGPU] gfx1010 tests. NFC. llvm-svn: 360615 2019-05-14 03:30:06 +08:00			`; GFX9: s_sendmsg sendmsg(MSG_GS_ALLOC_REQ)`
			`define amdgpu_kernel void @test_gs_alloc_req(i32 inreg %a) {`
			`body:`
			`call void @llvm.amdgcn.s.sendmsg(i32 9, i32 %a)`
			`ret void`
			`}`

AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`; GCN-LABEL: {{^}}sendmsg:`
			`; GCN: s_mov_b32 m0, s0`
[AMDGPU] gfx1010 tests. NFC. llvm-svn: 360615 2019-05-14 03:30:06 +08:00			`; VIPLUS-NEXT: s_nop 0`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`; GCN-NEXT: sendmsg(MSG_GS_DONE, GS_OP_NOP)`
			`; GCN-NEXT: s_endpgm`
			`define amdgpu_gs void @sendmsg(i32 inreg %a) #0 {`
			`call void @llvm.amdgcn.s.sendmsg(i32 3, i32 %a)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}sendmsghalt:`
			`; GCN: s_mov_b32 m0, s0`
[AMDGPU] gfx1010 tests. NFC. llvm-svn: 360615 2019-05-14 03:30:06 +08:00			`; VIPLUS-NEXT: s_nop 0`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`; GCN-NEXT: s_sendmsghalt sendmsg(MSG_INTERRUPT)`
			`; GCN-NEXT: s_endpgm`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @sendmsghalt(i32 inreg %a) #0 {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 %a)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_interrupt_halt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsghalt sendmsg(MSG_INTERRUPT)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_interrupt_halt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsghalt(i32 1, i32 0)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_emit_halt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_EMIT, 0)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_emit_halt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsghalt(i32 34, i32 0)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_cut_halt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_CUT, 1)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_cut_halt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsghalt(i32 274, i32 0)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_emit_cut_halt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsghalt sendmsg(MSG_GS, GS_OP_EMIT_CUT, 2)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_emit_cut_halt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsghalt(i32 562, i32 0)`
			`ret void`
			`}`

			`; GCN-LABEL: {{^}}test_gs_done_halt:`
			`; GCN: s_mov_b32 m0, 0`
			`; GCN-NOT: s_mov_b32 m0`
			`; GCN: s_sendmsghalt sendmsg(MSG_GS_DONE, GS_OP_NOP)`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @test_gs_done_halt() {`
AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`body:`
			`call void @llvm.amdgcn.s.sendmsghalt(i32 3, i32 0)`
			`ret void`
			`}`

AMDGPU: Legalize the operand of SI_INIT_M0 Summary: This fixes a case where the argument to a sendmsg intrinsic ends up in a VGPR, for whatever reason. The underlying performance issue is that a multiplication that can be an s_mul_i32 is instead needlessly generated as v_mul_u32_u24, but this is not addressed by this patch. Change-Id: I61fd4034314d5acdf6074632c30b65364dfa7328 Reviewers: arsenm, rampitec Subscribers: kzhuravl, wdng, yaxunl, dstuttard, tpr, t-tye, llvm-commits Differential Revision: https://reviews.llvm.org/D45826 llvm-svn: 330393 2018-04-20 15:14:25 +08:00			`; TODO: This should use s_mul_i32 instead of v_mul_u32_u24 + v_readfirstlane!`
			`;`
			`; GCN-LABEL: {{^}}test_mul24:`
			`; GCN: v_mul_u32_u24_e32`
			`; GCN: v_readfirstlane_b32`
			`; GCN: s_mov_b32 m0,`
			`; GCN: s_sendmsg sendmsg(MSG_INTERRUPT)`
			`define amdgpu_gs void @test_mul24(i32 inreg %arg) {`
			`body:`
			`%tmp1 = and i32 %arg, 511`
			`%tmp2 = mul nuw nsw i32 %tmp1, 12288`
			`call void @llvm.amdgcn.s.sendmsg(i32 1, i32 %tmp2)`
			`ret void`
			`}`

AMDGPU: Force skip over s_sendmsg and exp instructions Summary: These instructions interact with hardware blocks outside the shader core, and they can have "scalar" side effects even when EXEC = 0. We don't want these scalar side effects to occur when all lanes want to skip these instructions, so always add the execz skip branch instruction for basic blocks that contain them. Also ensure that we skip scalar stores / atomics, though we don't code-gen those yet. Reviewers: arsenm, rampitec Subscribers: kzhuravl, wdng, yaxunl, dstuttard, tpr, t-tye, llvm-commits Differential Revision: https://reviews.llvm.org/D48431 Change-Id: Ieaeb58352e2789ffd64745603c14970c60819d44 llvm-svn: 338235 2018-07-30 17:23:59 +08:00			`; GCN-LABEL: {{^}}if_sendmsg:`
			`; GCN: s_cbranch_execz`
			`; GCN: s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_NOP)`
			`define amdgpu_gs void @if_sendmsg(i32 %flag) #0 {`
			`%cc = icmp eq i32 %flag, 0`
			`br i1 %cc, label %sendmsg, label %end`

			`sendmsg:`
			`call void @llvm.amdgcn.s.sendmsg(i32 3, i32 0)`
			`br label %end`

			`end:`
			`ret void`
			`}`

AMDGPU: Consolidate sendmsg/sendmsghalt handling and tests llvm-svn: 295244 2017-02-16 06:17:09 +08:00			`declare void @llvm.amdgcn.s.sendmsg(i32, i32) #0`
			`declare void @llvm.amdgcn.s.sendmsghalt(i32, i32) #0`

			`attributes #0 = { nounwind }`