llvm-project/llvm/test/CodeGen/AMDGPU/parallelorifcollapse.ll

; Function Attrs: nounwind
; RUN: llc < %s -march=r600 -mcpu=redwood  | FileCheck %s
;
; CFG flattening should use parallel-or to generate branch conditions and
; then merge if-regions with the same bodies.

; FIXME: For some reason, having the allocas here allowed the flatten cfg pass
; to do its transformation; however, now that we are using local memory for
; allocas, the transformation isn't happening.
; XFAIL: *
;
; CHECK: OR_INT
; CHECK-NEXT: OR_INT
; CHECK-NEXT: OR_INT
; Test kernel containing two consecutive if-regions with the same shape.
; In each region, control reaches the "then" block only when two `icmp ne`
; comparisons (evaluated in two separate blocks) are both true; if either is
; false, control goes to the "else" block, which stores 1 to %data. Both
; "then" blocks are empty and both "else" blocks contain the same store.
; Takes no arguments and returns void.
define amdgpu_kernel void @_Z9chk1D_512v() #0 {
entry:
  ; Nine i32 stack slots. %a0..%d0 feed the first region's comparisons and
  ; %a1..%d1 feed the second's; none of those eight is stored to anywhere in
  ; this function. %data is the only slot that is written.
  %a0 = alloca i32, align 4
  %b0 = alloca i32, align 4
  %c0 = alloca i32, align 4
  %d0 = alloca i32, align 4
  %a1 = alloca i32, align 4
  %b1 = alloca i32, align 4
  %c1 = alloca i32, align 4
  %d1 = alloca i32, align 4
  %data = alloca i32, align 4
  ; Region 1, first condition: a0 != b0. When false, skip the second
  ; comparison and go straight to the else block.
  %0 = load i32, i32* %a0, align 4
  %1 = load i32, i32* %b0, align 4
  %cmp = icmp ne i32 %0, %1
  br i1 %cmp, label %land.lhs.true, label %if.else

land.lhs.true:                                    ; preds = %entry
  ; Region 1, second condition: c0 != d0. Only evaluated when the first
  ; condition was true.
  %2 = load i32, i32* %c0, align 4
  %3 = load i32, i32* %d0, align 4
  %cmp1 = icmp ne i32 %2, %3
  br i1 %cmp1, label %if.then, label %if.else

if.then:                                          ; preds = %land.lhs.true
  ; Both conditions were true: empty body, fall through to the join block.
  br label %if.end

if.else:                                          ; preds = %land.lhs.true, %entry
  ; At least one condition was false.
  store i32 1, i32* %data, align 4
  br label %if.end

if.end:                                           ; preds = %if.else, %if.then
  ; Join point of region 1 and head of region 2.
  ; Region 2, first condition: a1 != b1.
  %4 = load i32, i32* %a1, align 4
  %5 = load i32, i32* %b1, align 4
  %cmp2 = icmp ne i32 %4, %5
  br i1 %cmp2, label %land.lhs.true3, label %if.else6

land.lhs.true3:                                   ; preds = %if.end
  ; Region 2, second condition: c1 != d1. Only evaluated when the first
  ; condition of this region was true.
  %6 = load i32, i32* %c1, align 4
  %7 = load i32, i32* %d1, align 4
  %cmp4 = icmp ne i32 %6, %7
  br i1 %cmp4, label %if.then5, label %if.else6

if.then5:                                         ; preds = %land.lhs.true3
  ; Both conditions were true: empty body, fall through to the exit block.
  br label %if.end7

if.else6:                                         ; preds = %land.lhs.true3, %if.end
  ; At least one condition was false; same store as in region 1's else block.
  store i32 1, i32* %data, align 4
  br label %if.end7

if.end7:                                          ; preds = %if.else6, %if.then5
  ret void
}
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`; Function Attrs: nounwind`
			`; RUN: llc < %s -march=r600 -mcpu=redwood \| FileCheck %s`
			`;`
			`; CFG flattening should use parallel-or to generate branch conditions and`
			`; then merge if-regions with the same bodies.`
R600: Use LDS and vectors for private memory llvm-svn: 211110 2014-06-18 00:53:14 +08:00
			`; FIXME: For some reason having the allocas here allowed the flatten cfg pass`
fix typos in comments; NFC llvm-svn: 308127 2017-07-16 16:11:56 +08:00			`; to do its transformation, however now that we are using local memory for`
R600: Use LDS and vectors for private memory llvm-svn: 211110 2014-06-18 00:53:14 +08:00			`; allocas, the transformation isn't happening.`
			`; XFAIL: *`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`;`
			`; CHECK: OR_INT`
			`; CHECK-NEXT: OR_INT`
			`; CHECK-NEXT: OR_INT`
AMDGPU: Mark all unspecified CC functions in tests as amdgpu_kernel Currently the default C calling convention functions are treated the same as compute kernels. Make this explicit so the default calling convention can be changed to a non-kernel. Converted with perl -pi -e 's/define void/define amdgpu_kernel void/' on the relevant test directories (and undoing in one place that actually wanted a non-kernel). llvm-svn: 298444 2017-03-22 05:39:51 +08:00			`define amdgpu_kernel void @_Z9chk1D_512v() #0 {`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`entry:`
			`%a0 = alloca i32, align 4`
			`%b0 = alloca i32, align 4`
			`%c0 = alloca i32, align 4`
			`%d0 = alloca i32, align 4`
			`%a1 = alloca i32, align 4`
			`%b1 = alloca i32, align 4`
			`%c1 = alloca i32, align 4`
			`%d1 = alloca i32, align 4`
			`%data = alloca i32, align 4`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%0 = load i32, i32* %a0, align 4`
			`%1 = load i32, i32* %b0, align 4`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`%cmp = icmp ne i32 %0, %1`
			`br i1 %cmp, label %land.lhs.true, label %if.else`

			`land.lhs.true: ; preds = %entry`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%2 = load i32, i32* %c0, align 4`
			`%3 = load i32, i32* %d0, align 4`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`%cmp1 = icmp ne i32 %2, %3`
			`br i1 %cmp1, label %if.then, label %if.else`

			`if.then: ; preds = %land.lhs.true`
			`br label %if.end`

			`if.else: ; preds = %land.lhs.true, %entry`
			`store i32 1, i32* %data, align 4`
			`br label %if.end`

			`if.end: ; preds = %if.else, %if.then`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%4 = load i32, i32* %a1, align 4`
			`%5 = load i32, i32* %b1, align 4`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`%cmp2 = icmp ne i32 %4, %5`
			`br i1 %cmp2, label %land.lhs.true3, label %if.else6`

			`land.lhs.true3: ; preds = %if.end`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%6 = load i32, i32* %c1, align 4`
			`%7 = load i32, i32* %d1, align 4`
Factor FlattenCFG out from SimplifyCFG Patch by: Mei Ye llvm-svn: 187764 2013-08-06 10:43:45 +08:00			`%cmp4 = icmp ne i32 %6, %7`
			`br i1 %cmp4, label %if.then5, label %if.else6`

			`if.then5: ; preds = %land.lhs.true3`
			`br label %if.end7`

			`if.else6: ; preds = %land.lhs.true3, %if.end`
			`store i32 1, i32* %data, align 4`
			`br label %if.end7`

			`if.end7: ; preds = %if.else6, %if.then5`
			`ret void`
			`}`