From 1cc8a74de345b66fd340ddc71580ad412e8e2abf Mon Sep 17 00:00:00 2001 From: Craig Topper Date: Tue, 31 Dec 2019 15:05:21 -0800 Subject: [PATCH] [X86] Use carry flag from add for (seteq (add X, -1), -1). If we just subtracted 1 and are checking if the result is -1. We can use the carry flag from the ADD instead of an explicit CMP. I'm using the same checks for the add users as EmitTest. Fixes one case from PR44412 Differential Revision: https://reviews.llvm.org/D72019 --- llvm/lib/Target/X86/X86ISelLowering.cpp | 41 +++++++++++++++++++------ llvm/test/CodeGen/X86/pr44412.ll | 10 +++--- 2 files changed, 35 insertions(+), 16 deletions(-) diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp index bb6e8aeb67e0..dda0b4311771 100644 --- a/llvm/lib/Target/X86/X86ISelLowering.cpp +++ b/llvm/lib/Target/X86/X86ISelLowering.cpp @@ -20551,6 +20551,19 @@ static bool hasNonFlagsUse(SDValue Op) { return false; } +// Transform to an x86-specific ALU node with flags if there is a chance of +// using an RMW op or only the flags are used. Otherwise, leave +// the node alone and emit a 'cmp' or 'test' instruction. +static bool isProfitableToUseFlagOp(SDValue Op) { + for (SDNode *U : Op->uses()) + if (U->getOpcode() != ISD::CopyToReg && + U->getOpcode() != ISD::SETCC && + U->getOpcode() != ISD::STORE) + return false; + + return true; +} + /// Emit nodes that will be selected as "test Op0,Op0", or something /// equivalent. static SDValue EmitTest(SDValue Op, unsigned X86CC, const SDLoc &dl, @@ -20614,15 +20627,8 @@ static SDValue EmitTest(SDValue Op, unsigned X86CC, const SDLoc &dl, case ISD::SUB: case ISD::OR: case ISD::XOR: - // Transform to an x86-specific ALU node with flags if there is a chance of - // using an RMW op or only the flags are used. Otherwise, leave - // the node alone and emit a 'test' instruction. - for (SDNode::use_iterator UI = Op.getNode()->use_begin(), - UE = Op.getNode()->use_end(); UI != UE; ++UI) - if (UI->getOpcode() != ISD::CopyToReg && - UI->getOpcode() != ISD::SETCC && - UI->getOpcode() != ISD::STORE) - goto default_case; + if (!isProfitableToUseFlagOp(Op)) + break; // Otherwise use a regular EFLAGS-setting instruction. switch (ArithOp.getOpcode()) { @@ -20650,7 +20656,6 @@ static SDValue EmitTest(SDValue Op, unsigned X86CC, const SDLoc &dl, Op->getOperand(1)).getValue(1); } default: - default_case: break; } @@ -21688,6 +21693,22 @@ SDValue X86TargetLowering::emitFlagsForSetcc(SDValue Op0, SDValue Op1, } } + // Try to use the carry flag from the add in place of an separate CMP for: + // (seteq (add X, -1), -1). Similar for setne. + if (isAllOnesConstant(Op1) && Op0.getOpcode() == ISD::ADD && + Op0.getOperand(1) == Op1 && (CC == ISD::SETEQ || CC == ISD::SETNE)) { + if (isProfitableToUseFlagOp(Op0)) { + SDVTList VTs = DAG.getVTList(Op0.getValueType(), MVT::i32); + + SDValue New = DAG.getNode(X86ISD::ADD, dl, VTs, Op0.getOperand(0), + Op0.getOperand(1)); + DAG.ReplaceAllUsesOfValueWith(SDValue(Op0.getNode(), 0), New); + X86::CondCode CCode = CC == ISD::SETEQ ? X86::COND_AE : X86::COND_B; + X86CC = DAG.getTargetConstant(CCode, dl, MVT::i8); + return SDValue(New.getNode(), 1); + } + } + bool IsFP = Op1.getSimpleValueType().isFloatingPoint(); X86::CondCode CondCode = TranslateX86CC(CC, dl, IsFP, Op0, Op1, DAG); if (CondCode == X86::COND_INVALID) diff --git a/llvm/test/CodeGen/X86/pr44412.ll b/llvm/test/CodeGen/X86/pr44412.ll index 38d11edbf739..dbd0a4e6ea5c 100644 --- a/llvm/test/CodeGen/X86/pr44412.ll +++ b/llvm/test/CodeGen/X86/pr44412.ll @@ -14,9 +14,8 @@ define void @bar(i32 %0, i32 %1) nounwind { ; CHECK-NEXT: .LBB0_2: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: movl %ebx, %edi ; CHECK-NEXT: callq foo -; CHECK-NEXT: decl %ebx -; CHECK-NEXT: cmpl $-1, %ebx -; CHECK-NEXT: jne .LBB0_2 +; CHECK-NEXT: addl $-1, %ebx +; CHECK-NEXT: jb .LBB0_2 ; CHECK-NEXT: .LBB0_3: ; CHECK-NEXT: popq %rbx ; CHECK-NEXT: retq @@ -47,9 +46,8 @@ define void @baz(i32 %0, i32 %1) nounwind { ; CHECK-NEXT: .LBB1_2: # =>This Inner Loop Header: Depth=1 ; CHECK-NEXT: movl %ebx, %edi ; CHECK-NEXT: callq foo -; CHECK-NEXT: decl %ebx -; CHECK-NEXT: cmpl $-1, %ebx -; CHECK-NEXT: je .LBB1_2 +; CHECK-NEXT: addl $-1, %ebx +; CHECK-NEXT: jae .LBB1_2 ; CHECK-NEXT: .LBB1_3: ; CHECK-NEXT: popq %rbx ; CHECK-NEXT: retq