2017-07-12 06:04:36 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
|
|
; RUN: llc < %s -verify-machineinstrs -mtriple=x86_64-unknown-unknown -disable-cgp-select2branch | FileCheck %s
|
2009-09-15 10:25:21 +08:00
|
|
|
target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128"
|
2009-09-15 10:22:47 +08:00
|
|
|
|
|
|
|
define i32 @test1(i32 %x, i32 %n, i32 %w, i32* %vp) nounwind readnone {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test1:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0: # %entry
|
|
|
|
; CHECK-NEXT: btl %esi, %edi
|
|
|
|
; CHECK-NEXT: movl $12, %eax
|
|
|
|
; CHECK-NEXT: cmovael (%rcx), %eax
|
|
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = lshr i32 %x, %n
|
|
|
|
%1 = and i32 %0, 1
|
|
|
|
%toBool = icmp eq i32 %1, 0
|
2015-02-28 05:17:42 +08:00
|
|
|
%v = load i32, i32* %vp
|
2017-07-12 06:04:36 +08:00
|
|
|
%.0 = select i1 %toBool, i32 %v, i32 12
|
2009-09-15 10:22:47 +08:00
|
|
|
ret i32 %.0
|
|
|
|
}
|
2017-07-12 06:04:36 +08:00
|
|
|
|
2009-09-15 10:22:47 +08:00
|
|
|
define i32 @test2(i32 %x, i32 %n, i32 %w, i32* %vp) nounwind readnone {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test2:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0: # %entry
|
|
|
|
; CHECK-NEXT: btl %esi, %edi
|
|
|
|
; CHECK-NEXT: movl $12, %eax
|
|
|
|
; CHECK-NEXT: cmovbl (%rcx), %eax
|
|
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = lshr i32 %x, %n
|
|
|
|
%1 = and i32 %0, 1
|
|
|
|
%toBool = icmp eq i32 %1, 0
|
2015-02-28 05:17:42 +08:00
|
|
|
%v = load i32, i32* %vp
|
2017-07-12 06:04:36 +08:00
|
|
|
%.0 = select i1 %toBool, i32 12, i32 %v
|
2009-09-15 10:22:47 +08:00
|
|
|
ret i32 %.0
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2016-07-29 23:09:54 +08:00
|
|
|
; x86's 32-bit cmov zeroes the high 32 bits of the destination. Make
|
|
|
|
; sure CodeGen takes advantage of that to avoid an unnecessary
|
|
|
|
; zero-extend (movl) after the cmov.
|
2009-09-15 23:09:54 +08:00
|
|
|
|
2009-09-15 10:22:47 +08:00
|
|
|
declare void @bar(i64) nounwind
|
|
|
|
|
|
|
|
define void @test3(i64 %a, i64 %b, i1 %p) nounwind {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test3:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0:
|
|
|
|
; CHECK-NEXT: pushq %rax
|
|
|
|
; CHECK-NEXT: testb $1, %dl
|
|
|
|
; CHECK-NEXT: cmovel %esi, %edi
|
|
|
|
; CHECK-NEXT: callq bar
|
|
|
|
; CHECK-NEXT: popq %rax
|
|
|
|
; CHECK-NEXT: retq
|
2009-09-15 10:22:47 +08:00
|
|
|
%c = trunc i64 %a to i32
|
|
|
|
%d = trunc i64 %b to i32
|
|
|
|
%e = select i1 %p, i32 %c, i32 %d
|
|
|
|
%f = zext i32 %e to i64
|
|
|
|
call void @bar(i64 %f)
|
|
|
|
ret void
|
|
|
|
}
|
2009-09-15 10:25:21 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
; CodeGen shouldn't try to do a setne after an expanded 8-bit conditional
|
|
|
|
; move without recomputing EFLAGS, because the expansion of the conditional
|
|
|
|
; move with control flow may clobber EFLAGS (e.g., with xor, to set the
|
|
|
|
; register to zero).
|
|
|
|
|
|
|
|
; The test is a little awkward; the important part is that there's a test before the
|
|
|
|
; setne.
|
|
|
|
; PR4814
|
|
|
|
|
|
|
|
|
2017-07-12 06:04:36 +08:00
|
|
|
@g_3 = external global i8
|
|
|
|
@g_96 = external global i8
|
|
|
|
@g_100 = external global i8
|
|
|
|
@_2E_str = external constant [15 x i8], align 1
|
2009-09-15 10:25:21 +08:00
|
|
|
|
2017-01-25 00:36:07 +08:00
|
|
|
define i1 @test4() nounwind {
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK-LABEL: test4:
|
|
|
|
; CHECK: # BB#0: # %entry
|
|
|
|
; CHECK-NEXT: movsbl {{.*}}(%rip), %edx
|
|
|
|
; CHECK-NEXT: movl %edx, %eax
|
|
|
|
; CHECK-NEXT: shrb $7, %al
|
|
|
|
; CHECK-NEXT: movzbl %al, %ecx
|
|
|
|
; CHECK-NEXT: xorl $1, %ecx
|
|
|
|
; CHECK-NEXT: # kill: %CL<def> %CL<kill> %ECX<kill>
|
|
|
|
; CHECK-NEXT: sarl %cl, %edx
|
|
|
|
; CHECK-NEXT: movb {{.*}}(%rip), %al
|
|
|
|
; CHECK-NEXT: testb %al, %al
|
|
|
|
; CHECK-NEXT: je .LBB3_2
|
|
|
|
; CHECK-NEXT: # BB#1: # %bb.i.i.i
|
|
|
|
; CHECK-NEXT: movb {{.*}}(%rip), %cl
|
|
|
|
; CHECK-NEXT: .LBB3_2: # %func_4.exit.i
|
|
|
|
; CHECK-NEXT: pushq %rbx
|
|
|
|
; CHECK-NEXT: testb %dl, %dl
|
|
|
|
; CHECK-NEXT: setne %bl
|
|
|
|
; CHECK-NEXT: movb %al, %cl
|
|
|
|
; CHECK-NEXT: je .LBB3_4
|
|
|
|
; CHECK-NEXT: # BB#3: # %func_4.exit.i
|
|
|
|
; CHECK-NEXT: xorl %ecx, %ecx
|
|
|
|
; CHECK-NEXT: .LBB3_4: # %func_4.exit.i
|
|
|
|
; CHECK-NEXT: testb %al, %al
|
|
|
|
; CHECK-NEXT: je .LBB3_7
|
|
|
|
; CHECK-NEXT: # BB#5: # %func_4.exit.i
|
|
|
|
; CHECK-NEXT: testb %bl, %bl
|
|
|
|
; CHECK-NEXT: jne .LBB3_7
|
|
|
|
; CHECK-NEXT: # BB#6: # %bb.i.i
|
|
|
|
; CHECK-NEXT: movb {{.*}}(%rip), %cl
|
|
|
|
; CHECK-NEXT: xorl %ebx, %ebx
|
|
|
|
; CHECK-NEXT: movb %al, %cl
|
|
|
|
; CHECK-NEXT: .LBB3_7: # %func_1.exit
|
|
|
|
; CHECK-NEXT: movb %cl, {{.*}}(%rip)
|
|
|
|
; CHECK-NEXT: movzbl %cl, %esi
|
|
|
|
; CHECK-NEXT: movl $_2E_str, %edi
|
|
|
|
; CHECK-NEXT: xorl %eax, %eax
|
|
|
|
; CHECK-NEXT: callq printf
|
|
|
|
; CHECK-NEXT: movl %ebx, %eax
|
|
|
|
; CHECK-NEXT: popq %rbx
|
|
|
|
; CHECK-NEXT: retq
|
2009-09-15 10:25:21 +08:00
|
|
|
entry:
|
2017-07-12 06:04:36 +08:00
|
|
|
%0 = load i8, i8* @g_3, align 1
|
|
|
|
%1 = sext i8 %0 to i32
|
|
|
|
%.lobit.i = lshr i8 %0, 7
|
|
|
|
%tmp.i = zext i8 %.lobit.i to i32
|
|
|
|
%tmp.not.i = xor i32 %tmp.i, 1
|
|
|
|
%iftmp.17.0.i.i = ashr i32 %1, %tmp.not.i
|
|
|
|
%retval56.i.i = trunc i32 %iftmp.17.0.i.i to i8
|
|
|
|
%2 = icmp eq i8 %retval56.i.i, 0
|
|
|
|
%g_96.promoted.i = load i8, i8* @g_96
|
|
|
|
%3 = icmp eq i8 %g_96.promoted.i, 0
|
2009-09-15 10:25:21 +08:00
|
|
|
br i1 %3, label %func_4.exit.i, label %bb.i.i.i
|
|
|
|
|
2017-07-12 06:04:36 +08:00
|
|
|
bb.i.i.i:
|
|
|
|
%4 = load volatile i8, i8* @g_100, align 1
|
2009-09-15 10:25:21 +08:00
|
|
|
br label %func_4.exit.i
|
|
|
|
|
2017-07-12 06:04:36 +08:00
|
|
|
func_4.exit.i:
|
|
|
|
%.not.i = xor i1 %2, true
|
|
|
|
%brmerge.i = or i1 %3, %.not.i
|
|
|
|
%.mux.i = select i1 %2, i8 %g_96.promoted.i, i8 0
|
2009-09-15 10:25:21 +08:00
|
|
|
br i1 %brmerge.i, label %func_1.exit, label %bb.i.i
|
|
|
|
|
2017-07-12 06:04:36 +08:00
|
|
|
bb.i.i:
|
|
|
|
%5 = load volatile i8, i8* @g_100, align 1
|
2009-09-15 10:25:21 +08:00
|
|
|
br label %func_1.exit
|
|
|
|
|
2017-07-12 06:04:36 +08:00
|
|
|
func_1.exit:
|
|
|
|
%g_96.tmp.0.i = phi i8 [ %g_96.promoted.i, %bb.i.i ], [ %.mux.i, %func_4.exit.i ]
|
2017-01-25 00:36:07 +08:00
|
|
|
%ret = phi i1 [ 0, %bb.i.i ], [ %.not.i, %func_4.exit.i ]
|
2009-09-15 10:25:21 +08:00
|
|
|
store i8 %g_96.tmp.0.i, i8* @g_96
|
2017-07-12 06:04:36 +08:00
|
|
|
%6 = zext i8 %g_96.tmp.0.i to i32
|
|
|
|
%7 = tail call i32 (i8*, ...) @printf(i8* noalias getelementptr ([15 x i8], [15 x i8]* @_2E_str, i64 0, i64 0), i32 %6) nounwind
|
2017-01-25 00:36:07 +08:00
|
|
|
ret i1 %ret
|
2009-09-15 10:25:21 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
declare i32 @printf(i8* nocapture, ...) nounwind
|
|
|
|
|
|
|
|
|
|
|
|
; Should compile to setcc | -2.
|
|
|
|
; rdar://6668608
|
|
|
|
define i32 @test5(i32* nocapture %P) nounwind readonly {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test5:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0: # %entry
|
|
|
|
; CHECK-NEXT: xorl %eax, %eax
|
|
|
|
; CHECK-NEXT: cmpl $41, (%rdi)
|
|
|
|
; CHECK-NEXT: setg %al
|
|
|
|
; CHECK-NEXT: orl $-2, %eax
|
|
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = load i32, i32* %P, align 4
|
|
|
|
%1 = icmp sgt i32 %0, 41
|
|
|
|
%iftmp.0.0 = select i1 %1, i32 -1, i32 -2
|
2009-09-15 10:25:21 +08:00
|
|
|
ret i32 %iftmp.0.0
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @test6(i32* nocapture %P) nounwind readonly {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test6:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0: # %entry
|
|
|
|
; CHECK-NEXT: xorl %eax, %eax
|
|
|
|
; CHECK-NEXT: cmpl $42, (%rdi)
|
|
|
|
; CHECK-NEXT: setl %al
|
|
|
|
; CHECK-NEXT: leal 4(%rax,%rax,8), %eax
|
|
|
|
; CHECK-NEXT: retq
|
|
|
|
entry:
|
|
|
|
%0 = load i32, i32* %P, align 4
|
|
|
|
%1 = icmp sgt i32 %0, 41
|
|
|
|
%iftmp.0.0 = select i1 %1, i32 4, i32 13
|
2009-09-15 10:25:21 +08:00
|
|
|
ret i32 %iftmp.0.0
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2009-09-15 10:27:23 +08:00
|
|
|
; Don't try to use a 16-bit conditional move to do an 8-bit select,
|
|
|
|
; because it isn't worth it. Just use a branch instead.
|
|
|
|
define i8 @test7(i1 inreg %c, i8 inreg %a, i8 inreg %b) nounwind {
|
2013-07-14 04:38:47 +08:00
|
|
|
; CHECK-LABEL: test7:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0:
|
|
|
|
; CHECK-NEXT: testb $1, %dil
|
|
|
|
; CHECK-NEXT: jne .LBB6_2
|
|
|
|
; CHECK-NEXT: # BB#1:
|
|
|
|
; CHECK-NEXT: movb %dl, %sil
|
|
|
|
; CHECK-NEXT: .LBB6_2:
|
|
|
|
; CHECK-NEXT: movl %esi, %eax
|
|
|
|
; CHECK-NEXT: retq
|
2009-09-15 10:27:23 +08:00
|
|
|
%d = select i1 %c, i8 %a, i8 %b
|
|
|
|
ret i8 %d
|
|
|
|
}
|
2017-01-06 02:35:44 +08:00
|
|
|
|
|
|
|
define i32 @smin(i32 %x) {
|
|
|
|
; CHECK-LABEL: smin:
|
2017-07-12 06:04:36 +08:00
|
|
|
; CHECK: # BB#0:
|
2017-01-06 02:35:44 +08:00
|
|
|
; CHECK-NEXT: xorl $-1, %edi
|
|
|
|
; CHECK-NEXT: movl $-1, %eax
|
[x86] fix usage of stale operands when lowering select
I noticed this problem as part of the ongoing attempt to canonicalize min/max ops in IR.
The debug output shows nodes like this:
t4: i32 = xor t2, Constant:i32<-1>
t21: i8 = setcc t4, Constant:i32<0>, setlt:ch
t14: i32 = select t21, t4, Constant:i32<-1>
And because the select is holding onto the t4 (xor) node while EmitTest creates a new
x86-specific xor node, the lowering results in:
t4: i32 = xor t2, Constant:i32<-1>
t25: i32,i32 = X86ISD::XOR t2, Constant:i32<-1>
t28: i32,glue = X86ISD::CMOV Constant:i32<-1>, t4, Constant:i8<15>, t25:1
Differential Revision: https://reviews.llvm.org/D28374
llvm-svn: 291392
2017-01-08 23:53:40 +08:00
|
|
|
; CHECK-NEXT: cmovsl %edi, %eax
|
2017-01-06 02:35:44 +08:00
|
|
|
; CHECK-NEXT: retq
|
|
|
|
%not_x = xor i32 %x, -1
|
|
|
|
%1 = icmp slt i32 %not_x, -1
|
|
|
|
%sel = select i1 %1, i32 %not_x, i32 -1
|
|
|
|
ret i32 %sel
|
|
|
|
}
|
|
|
|
|