From 21a1d4cf719e977b1712cb4387b0f12b5175b916 Mon Sep 17 00:00:00 2001 From: Jay Foad Date: Fri, 29 Oct 2021 13:54:35 +0100 Subject: [PATCH] [AMDGPU] Change numBitsSigned for simplicity and document it. NFC. Change numBitsSigned to return the minimum size of a signed integer that can hold the value. This is different by one from the previous result but is more consistent with numBitsUnsigned. Update all callers. All callers are now more consistent between the signed and unsigned cases, and some callers get simpler, especially the ones that deal with quantities like numBitsSigned(LHS) + numBitsSigned(RHS). Differential Revision: https://reviews.llvm.org/D112813 --- .../Target/AMDGPU/AMDGPUCodeGenPrepare.cpp | 19 ++++++++++++------- llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp | 4 ++-- llvm/lib/Target/AMDGPU/AMDGPUISelLowering.h | 7 +++++++ llvm/lib/Target/AMDGPU/SIISelLowering.cpp | 2 +- 4 files changed, 22 insertions(+), 10 deletions(-) diff --git a/llvm/lib/Target/AMDGPU/AMDGPUCodeGenPrepare.cpp b/llvm/lib/Target/AMDGPU/AMDGPUCodeGenPrepare.cpp index c8bea9b1a240..a55729586b8d 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUCodeGenPrepare.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUCodeGenPrepare.cpp @@ -148,8 +148,14 @@ class AMDGPUCodeGenPrepare : public FunctionPass, /// \returns True. bool promoteUniformBitreverseToI32(IntrinsicInst &I) const; - + /// \returns The minimum number of bits needed to store the value of \Op as an + /// unsigned integer. Truncating to this size and then zero-extending to + /// ScalarSize will not change the value. unsigned numBitsUnsigned(Value *Op, unsigned ScalarSize) const; + + /// \returns The minimum number of bits needed to store the value of \Op as a + /// signed integer. Truncating to this size and then sign-extending to + /// ScalarSize will not change the value. unsigned numBitsSigned(Value *Op, unsigned ScalarSize) const; /// Replace mul instructions with llvm.amdgcn.mul.u24 or llvm.amdgcn.mul.s24. @@ -449,7 +455,7 @@ unsigned AMDGPUCodeGenPrepare::numBitsSigned(Value *Op, unsigned ScalarSize) const { // In order for this to be a signed 24-bit value, bit 23, must // be a sign bit. - return ScalarSize - ComputeNumSignBits(Op, *DL, 0, AC); + return ScalarSize - ComputeNumSignBits(Op, *DL, 0, AC) + 1; } static void extractValues(IRBuilder<> &Builder, @@ -482,13 +488,13 @@ static Value *insertValues(IRBuilder<> &Builder, // width of the original destination. static Value *getMul24(IRBuilder<> &Builder, Value *LHS, Value *RHS, unsigned Size, unsigned NumBits, bool IsSigned) { - if (Size <= 32 || (IsSigned ? NumBits <= 30 : NumBits <= 32)) { + if (Size <= 32 || NumBits <= 32) { Intrinsic::ID ID = IsSigned ? Intrinsic::amdgcn_mul_i24 : Intrinsic::amdgcn_mul_u24; return Builder.CreateIntrinsic(ID, {}, {LHS, RHS}); } - assert(IsSigned ? NumBits <= 46 : NumBits <= 48); + assert(NumBits <= 48); Intrinsic::ID LoID = IsSigned ? Intrinsic::amdgcn_mul_i24 : Intrinsic::amdgcn_mul_u24; @@ -530,9 +536,8 @@ bool AMDGPUCodeGenPrepare::replaceMulWithMul24(BinaryOperator &I) const { (RHSBits = numBitsUnsigned(RHS, Size)) <= 24) { IsSigned = false; - } else if (ST->hasMulI24() && - (LHSBits = numBitsSigned(LHS, Size)) < 24 && - (RHSBits = numBitsSigned(RHS, Size)) < 24) { + } else if (ST->hasMulI24() && (LHSBits = numBitsSigned(LHS, Size)) <= 24 && + (RHSBits = numBitsSigned(RHS, Size)) <= 24) { IsSigned = true; } else diff --git a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp index 4d316a5869a6..16d9b302348c 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp @@ -53,7 +53,7 @@ unsigned AMDGPUTargetLowering::numBitsSigned(SDValue Op, SelectionDAG &DAG) { // In order for this to be a signed 24-bit value, bit 23, must // be a sign bit. - return VT.getSizeInBits() - DAG.ComputeNumSignBits(Op); + return VT.getSizeInBits() - DAG.ComputeNumSignBits(Op) + 1; } AMDGPUTargetLowering::AMDGPUTargetLowering(const TargetMachine &TM, @@ -2875,7 +2875,7 @@ static bool isI24(SDValue Op, SelectionDAG &DAG) { EVT VT = Op.getValueType(); return VT.getSizeInBits() >= 24 && // Types less than 24-bit should be treated // as unsigned 24-bit values. - AMDGPUTargetLowering::numBitsSigned(Op, DAG) < 24; + AMDGPUTargetLowering::numBitsSigned(Op, DAG) <= 24; } static SDValue simplifyMul24(SDNode *Node24, diff --git a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.h b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.h index 53371d03364d..6bbcef2fe721 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.h +++ b/llvm/lib/Target/AMDGPU/AMDGPUISelLowering.h @@ -35,7 +35,14 @@ private: SDValue getFFBX_U32(SelectionDAG &DAG, SDValue Op, const SDLoc &DL, unsigned Opc) const; public: + /// \returns The minimum number of bits needed to store the value of \Op as an + /// unsigned integer. Truncating to this size and then zero-extending to the + /// original size will not change the value. static unsigned numBitsUnsigned(SDValue Op, SelectionDAG &DAG); + + /// \returns The minimum number of bits needed to store the value of \Op as a + /// signed integer. Truncating to this size and then sign-extending to the + /// original size will not change the value. static unsigned numBitsSigned(SDValue Op, SelectionDAG &DAG); protected: diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp index 09f3d6752c27..a3be162432da 100644 --- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp +++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp @@ -10464,7 +10464,7 @@ SDValue SITargetLowering::performAddCombine(SDNode *N, return getMad64_32(DAG, SL, VT, MulLHS, MulRHS, AddRHS, false); } - if (numBitsSigned(MulLHS, DAG) < 32 && numBitsSigned(MulRHS, DAG) < 32) { + if (numBitsSigned(MulLHS, DAG) <= 32 && numBitsSigned(MulRHS, DAG) <= 32) { MulLHS = DAG.getSExtOrTrunc(MulLHS, SL, MVT::i32); MulRHS = DAG.getSExtOrTrunc(MulRHS, SL, MVT::i32); AddRHS = DAG.getSExtOrTrunc(AddRHS, SL, MVT::i64);