forked from OSchip/llvm-project
197 lines
4.8 KiB
LLVM
197 lines
4.8 KiB
LLVM
|
; RUN: opt -S -codegenprepare < %s | FileCheck %s

; x86-64 Linux target with 64-bit pointers (p:64:64:64); the byte offsets
; checked by the tests in this file are computed against this layout.
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128"
target triple = "x86_64-unknown-linux-gnu"
|
||
|
|
||
|
; Simplest case: one address (element 5 of an i64 array, i.e. byte offset 40)
; is computed in the entry block and loaded from in a single conditional
; block. The output is expected to contain the offset as an integer add of 40.
define void @test1(i1 %cond, i64* %base) {
; CHECK-LABEL: @test1
; CHECK: add i64 {{.+}}, 40
entry:
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
  ; Only user of the address.
  %val = load i32, i32* %addr.i32, align 4
  br label %fallthrough

fallthrough:
  ret void
}
|
||
|
|
||
|
; External callee; the tests in this file pass loaded i32 values to it.
declare void @foo(i32)
|
||
|
|
||
|
; The same address is loaded from in two different blocks (if.then and next).
; Each of those blocks is expected to receive its own copy of the address
; computation (an add of 40).
define void @test2(i1 %cond, i64* %base) {
; CHECK-LABEL: @test2
entry:
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK: add i64 {{.+}}, 40
  %val1 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val1)
  %is.zero = icmp eq i32 %val1, 0
  br i1 %is.zero, label %next, label %fallthrough

next:
; CHECK-LABEL: next:
; CHECK: add i64 {{.+}}, 40
  %val2 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val2)
  br label %fallthrough

fallthrough:
  ret void
}
|
||
|
|
||
|
; Two loads of the same address inside one block: a single copy of the
; address computation is enough there (instruction selection will duplicate
; it if needed), so a second add of 40 must not appear after the first one.
define void @test3(i1 %cond, i64* %base) {
; CHECK-LABEL: @test3
entry:
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK: add i64 {{.+}}, 40
  %val1 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val1)
; CHECK-NOT: add i64 {{.+}}, 40
  %val2 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val2)
  br label %fallthrough

fallthrough:
  ret void
}
|
||
|
|
||
|
; The address is loaded from in if.then and is also passed, as a pointer
; value, to a call marked cold in rare.1. Sinking is still expected: both
; if.then and rare.1 should contain an add of 40.
define void @test4(i1 %cond, i64* %base) {
; CHECK-LABEL: @test4
entry:
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK: add i64 {{.+}}, 40
  %val1 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val1)
  %is.zero = icmp eq i32 %val1, 0
  br i1 %is.zero, label %rare.1, label %fallthrough

fallthrough:
  ret void

rare.1:
; CHECK-LABEL: rare.1:
; CHECK: add i64 {{.+}}, 40
  ; Cold use of the address itself (not a memory access through it).
  call void @slowpath(i32 %val1, i32* %addr.i32) cold
  br label %fallthrough
}
|
||
|
|
||
|
; Negative test: same shape as the cold-call case, but the call in rare.1 is
; NOT marked cold. The address computation must not be duplicated into the
; hot path: the original GEP stays in entry and if.then gets no add of 40.
define void @test5(i1 %cond, i64* %base) {
; CHECK-LABEL: @test5
entry:
; CHECK: %addr = getelementptr
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK-NOT: add i64 {{.+}}, 40
  %val1 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val1)
  %is.zero = icmp eq i32 %val1, 0
  br i1 %is.zero, label %rare.1, label %fallthrough

fallthrough:
  ret void

rare.1:
  ; Deliberately left without the cold attribute.
  call void @slowpath(i32 %val1, i32* %addr.i32)
  br label %fallthrough
}
|
||
|
|
||
|
; Negative test: the function is marked minsize. Even though the call in
; rare.1 is cold, the address computation must not be duplicated: the
; original GEP stays in entry and if.then gets no add of 40.
define void @test6(i1 %cond, i64* %base) minsize {
; CHECK-LABEL: @test6
entry:
; CHECK: %addr = getelementptr
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %addr.i32 = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK-NOT: add i64 {{.+}}, 40
  %val1 = load i32, i32* %addr.i32, align 4
  call void @foo(i32 %val1)
  %is.zero = icmp eq i32 %val1, 0
  br i1 %is.zero, label %rare.1, label %fallthrough

fallthrough:
  ret void

rare.1:
  call void @slowpath(i32 %val1, i32* %addr.i32) cold
  br label %fallthrough
}
|
||
|
|
||
|
|
||
|
; Make sure sinking two copies of the addressing mode into different blocks
; works when there is a cold path for each of them: the load in if.then has
; the cold path rare.1, and the load in next has the cold path rare.2. All
; four blocks are expected to contain their own add of 40.
define void @test7(i1 %cond, i64* %base) {
; CHECK-LABEL: @test7
entry:
  %addr = getelementptr inbounds i64, i64* %base, i64 5
  %casted = bitcast i64* %addr to i32*
  br i1 %cond, label %if.then, label %fallthrough

if.then:
; CHECK-LABEL: if.then:
; CHECK: add i64 {{.+}}, 40
  %v1 = load i32, i32* %casted, align 4
  call void @foo(i32 %v1)
  %cmp = icmp eq i32 %v1, 0
  br i1 %cmp, label %rare.1, label %next

next:
; CHECK-LABEL: next:
; CHECK: add i64 {{.+}}, 40
  %v2 = load i32, i32* %casted, align 4
  call void @foo(i32 %v2)
  %cmp2 = icmp eq i32 %v2, 0
  ; The second load takes its own cold path. Branching to rare.1 here would
  ; leave rare.2 without any predecessor, so it would never be exercised as
  ; a reachable block.
  br i1 %cmp2, label %rare.2, label %fallthrough

fallthrough:
  ret void

rare.1:
; CHECK-LABEL: rare.1:
; CHECK: add i64 {{.+}}, 40
  ; Cold path of the first load; rejoins the main path at next.
  call void @slowpath(i32 %v1, i32* %casted) cold
  br label %next

rare.2:
; CHECK-LABEL: rare.2:
; CHECK: add i64 {{.+}}, 40
  ; Cold path of the second load.
  call void @slowpath(i32 %v2, i32* %casted) cold
  br label %fallthrough
}
|
||
|
|
||
|
|
||
|
; External callee used on the rare paths. The declaration itself carries no
; attributes; individual call sites add `cold` where a test needs a cold use.
declare void @slowpath(i32, i32*)
|