diff --git a/llvm/lib/Target/SystemZ/SystemZISelDAGToDAG.cpp b/llvm/lib/Target/SystemZ/SystemZISelDAGToDAG.cpp index 2bc186b07f99..d1bd2d647773 100644 --- a/llvm/lib/Target/SystemZ/SystemZISelDAGToDAG.cpp +++ b/llvm/lib/Target/SystemZ/SystemZISelDAGToDAG.cpp @@ -46,9 +46,10 @@ namespace { SDValue IndexReg; int64_t Disp; + bool isRI; - SystemZRRIAddressMode() - : BaseType(RegBase), IndexReg(), Disp(0) { + SystemZRRIAddressMode(bool RI = false) + : BaseType(RegBase), IndexReg(), Disp(0), isRI(RI) { } void dump() { @@ -61,9 +62,11 @@ namespace { } else { cerr << " Base.FrameIndex " << Base.FrameIndex << '\n'; } - cerr << "IndexReg "; - if (IndexReg.getNode() != 0) IndexReg.getNode()->dump(); - else cerr << "nul"; + if (!isRI) { + cerr << "IndexReg "; + if (IndexReg.getNode() != 0) IndexReg.getNode()->dump(); + else cerr << "nul"; + } cerr << " Disp " << Disp << '\n'; } }; @@ -77,6 +80,8 @@ namespace { SystemZTargetLowering &Lowering; const SystemZSubtarget &Subtarget; + void getAddressOperandsRI(const SystemZRRIAddressMode &AM, + SDValue &Base, SDValue &Disp); void getAddressOperands(const SystemZRRIAddressMode &AM, SDValue &Base, SDValue &Disp, SDValue &Index); @@ -109,9 +114,9 @@ namespace { #include "SystemZGenDAGISel.inc" private: - bool SelectAddrRI32(const SDValue& Op, SDValue& Addr, + bool SelectAddrRI12(SDValue Op, SDValue& Addr, SDValue &Base, SDValue &Disp); - bool SelectAddrRI(const SDValue& Op, SDValue& Addr, + bool SelectAddrRI(SDValue Op, SDValue& Addr, SDValue &Base, SDValue &Disp); bool SelectAddrRRI12(SDValue Op, SDValue Addr, SDValue &Base, SDValue &Disp, SDValue &Index); @@ -124,6 +129,8 @@ namespace { bool MatchAddress(SDValue N, SystemZRRIAddressMode &AM, bool is12Bit, unsigned Depth = 0); bool MatchAddressBase(SDValue N, SystemZRRIAddressMode &AM); + bool MatchAddressRI(SDValue N, SystemZRRIAddressMode &AM, + bool is12Bit); #ifndef NDEBUG unsigned Indent; @@ -151,17 +158,6 @@ static bool isImmSExt20(int64_t Val, int64_t &Imm) { return false; } -static bool isImmSExt20(SDNode *N, int64_t &Imm) { - if (N->getOpcode() != ISD::Constant) - return false; - - return isImmSExt20(cast(N)->getSExtValue(), Imm); -} - -static bool isImmSExt20(SDValue Op, int64_t &Imm) { - return isImmSExt20(Op.getNode(), Imm); -} - /// isImmZExt12 - This method tests to see if the node is either a 32-bit /// or 64-bit immediate, and if the value can be accurately represented as a /// zero extension from a 12-bit value. If so, this returns true and the @@ -174,139 +170,6 @@ static bool isImmZExt12(int64_t Val, int64_t &Imm) { return false; } -static bool isImmZExt12(SDNode *N, int64_t &Imm) { - if (N->getOpcode() != ISD::Constant) - return false; - - return isImmZExt12(cast(N)->getSExtValue(), Imm); -} - -static bool isImmZExt12(SDValue Op, int64_t &Imm) { - return isImmZExt12(Op.getNode(), Imm); -} - -/// Returns true if the address can be represented by a base register plus -/// an unsigned 12-bit displacement [r+imm]. -bool SystemZDAGToDAGISel::SelectAddrRI32(const SDValue& Op, SDValue& Addr, - SDValue &Base, SDValue &Disp) { - // FIXME dl should come from parent load or store, not from address - DebugLoc dl = Addr.getDebugLoc(); - MVT VT = Addr.getValueType(); - - if (Addr.getOpcode() == ISD::ADD) { - int64_t Imm = 0; - if (isImmZExt12(Addr.getOperand(1), Imm)) { - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - if (FrameIndexSDNode *FI = - dyn_cast(Addr.getOperand(0))) { - Base = CurDAG->getTargetFrameIndex(FI->getIndex(), VT); - } else { - Base = Addr.getOperand(0); - } - return true; // [r+i] - } - } else if (Addr.getOpcode() == ISD::OR) { - int64_t Imm = 0; - if (isImmZExt12(Addr.getOperand(1), Imm)) { - // If this is an or of disjoint bitfields, we can codegen this as an add - // (for better address arithmetic) if the LHS and RHS of the OR are - // provably disjoint. - APInt LHSKnownZero, LHSKnownOne; - CurDAG->ComputeMaskedBits(Addr.getOperand(0), - APInt::getAllOnesValue(Addr.getOperand(0) - .getValueSizeInBits()), - LHSKnownZero, LHSKnownOne); - - if ((LHSKnownZero.getZExtValue()|~(uint64_t)Imm) == ~0ULL) { - // If all of the bits are known zero on the LHS or RHS, the add won't - // carry. - Base = Addr.getOperand(0); - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - return true; - } - } - } else if (ConstantSDNode *CN = dyn_cast(Addr)) { - // Loading from a constant address. - - // If this address fits entirely in a 12-bit zext immediate field, codegen - // this as "d(r0)" - int64_t Imm; - if (isImmZExt12(CN, Imm)) { - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - Base = CurDAG->getRegister(0, VT); - return true; - } - } - - Disp = CurDAG->getTargetConstant(0, MVT::i64); - if (FrameIndexSDNode *FI = dyn_cast(Addr)) - Base = CurDAG->getTargetFrameIndex(FI->getIndex(), VT); - else - Base = Addr; - return true; // [r+0] -} - -/// Returns true if the address can be represented by a base register plus -/// a signed 20-bit displacement [r+imm]. -bool SystemZDAGToDAGISel::SelectAddrRI(const SDValue& Op, SDValue& Addr, - SDValue &Base, SDValue &Disp) { - // FIXME dl should come from parent load or store, not from address - DebugLoc dl = Addr.getDebugLoc(); - MVT VT = Addr.getValueType(); - - if (Addr.getOpcode() == ISD::ADD) { - int64_t Imm = 0; - if (isImmSExt20(Addr.getOperand(1), Imm)) { - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - if (FrameIndexSDNode *FI = - dyn_cast(Addr.getOperand(0))) { - Base = CurDAG->getTargetFrameIndex(FI->getIndex(), VT); - } else { - Base = Addr.getOperand(0); - } - return true; // [r+i] - } - } else if (Addr.getOpcode() == ISD::OR) { - int64_t Imm = 0; - if (isImmSExt20(Addr.getOperand(1), Imm)) { - // If this is an or of disjoint bitfields, we can codegen this as an add - // (for better address arithmetic) if the LHS and RHS of the OR are - // provably disjoint. - APInt LHSKnownZero, LHSKnownOne; - CurDAG->ComputeMaskedBits(Addr.getOperand(0), - APInt::getAllOnesValue(Addr.getOperand(0) - .getValueSizeInBits()), - LHSKnownZero, LHSKnownOne); - - if ((LHSKnownZero.getZExtValue()|~(uint64_t)Imm) == ~0ULL) { - // If all of the bits are known zero on the LHS or RHS, the add won't - // carry. - Base = Addr.getOperand(0); - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - return true; - } - } - } else if (ConstantSDNode *CN = dyn_cast(Addr)) { - // Loading from a constant address. - - // If this address fits entirely in a 20-bit sext immediate field, codegen - // this as "d(r0)" - int64_t Imm; - if (isImmSExt20(CN, Imm)) { - Disp = CurDAG->getTargetConstant(Imm, MVT::i64); - Base = CurDAG->getRegister(0, VT); - return true; - } - } - - Disp = CurDAG->getTargetConstant(0, MVT::i64); - if (FrameIndexSDNode *FI = dyn_cast(Addr)) - Base = CurDAG->getTargetFrameIndex(FI->getIndex(), VT); - else - Base = Addr; - return true; // [r+0] -} - /// MatchAddress - Add the specified node to the specified addressing mode, /// returning true if it cannot be done. This just pattern matches for the /// addressing mode. @@ -360,7 +223,7 @@ bool SystemZDAGToDAGISel::MatchAddress(SDValue N, SystemZRRIAddressMode &AM, break; } // Test if the index field is free for use. - if (AM.IndexReg.getNode()) { + if (AM.IndexReg.getNode() && !AM.isRI) { AM = Backup; break; } @@ -407,7 +270,8 @@ bool SystemZDAGToDAGISel::MatchAddress(SDValue N, SystemZRRIAddressMode &AM, // If we couldn't fold both operands into the address at the same time, // see if we can just put each operand into a register and fold at least // the add. - if (AM.BaseType == SystemZRRIAddressMode::RegBase && + if (!AM.isRI && + AM.BaseType == SystemZRRIAddressMode::RegBase && !AM.Base.Reg.getNode() && !AM.IndexReg.getNode()) { AM.Base.Reg = N.getNode()->getOperand(0); AM.IndexReg = N.getNode()->getOperand(1); @@ -448,8 +312,8 @@ bool SystemZDAGToDAGISel::MatchAddressBase(SDValue N, SystemZRRIAddressMode &AM) { // Is the base register already occupied? if (AM.BaseType != SystemZRRIAddressMode::RegBase || AM.Base.Reg.getNode()) { - // If so, check to see if the scale index register is set. - if (AM.IndexReg.getNode() == 0) { + // If so, check to see if the scale register is set. + if (AM.IndexReg.getNode() == 0 && !AM.isRI) { AM.IndexReg = N; return false; } @@ -464,22 +328,118 @@ bool SystemZDAGToDAGISel::MatchAddressBase(SDValue N, return false; } -void SystemZDAGToDAGISel::getAddressOperands(const SystemZRRIAddressMode &AM, - SDValue &Base, SDValue &Disp, - SDValue &Index) { +void SystemZDAGToDAGISel::getAddressOperandsRI(const SystemZRRIAddressMode &AM, + SDValue &Base, SDValue &Disp) { if (AM.BaseType == SystemZRRIAddressMode::RegBase) Base = AM.Base.Reg; else Base = CurDAG->getTargetFrameIndex(AM.Base.FrameIndex, TLI.getPointerTy()); - Index = AM.IndexReg; Disp = CurDAG->getTargetConstant(AM.Disp, MVT::i64); } +void SystemZDAGToDAGISel::getAddressOperands(const SystemZRRIAddressMode &AM, + SDValue &Base, SDValue &Disp, + SDValue &Index) { + getAddressOperandsRI(AM, Base, Disp); + Index = AM.IndexReg; +} + +/// Returns true if the address can be represented by a base register plus +/// an unsigned 12-bit displacement [r+imm]. +bool SystemZDAGToDAGISel::SelectAddrRI12(SDValue Op, SDValue& Addr, + SDValue &Base, SDValue &Disp) { + SystemZRRIAddressMode AM20(/*isRI*/true), AM12(/*isRI*/true); + bool Done = false; + + if (!Addr.hasOneUse()) { + unsigned Opcode = Addr.getOpcode(); + if (Opcode != ISD::Constant && Opcode != ISD::FrameIndex) { + // If we are able to fold N into addressing mode, then we'll allow it even + // if N has multiple uses. In general, addressing computation is used as + // addresses by all of its uses. But watch out for CopyToReg uses, that + // means the address computation is liveout. It will be computed by a LA + // so we want to avoid computing the address twice. + for (SDNode::use_iterator UI = Addr.getNode()->use_begin(), + UE = Addr.getNode()->use_end(); UI != UE; ++UI) { + if (UI->getOpcode() == ISD::CopyToReg) { + MatchAddressBase(Addr, AM12); + Done = true; + break; + } + } + } + } + if (!Done && MatchAddress(Addr, AM12, /* is12Bit */ true)) + return false; + + // Check, whether we can match stuff using 20-bit displacements + if (!Done && !MatchAddress(Addr, AM20, /* is12Bit */ false)) + if (AM12.Disp == 0 && AM20.Disp != 0) + return false; + + DOUT << "MatchAddress (final): "; DEBUG(AM12.dump()); + + MVT VT = Addr.getValueType(); + if (AM12.BaseType == SystemZRRIAddressMode::RegBase) { + if (!AM12.Base.Reg.getNode()) + AM12.Base.Reg = CurDAG->getRegister(0, VT); + } + + assert(AM12.IndexReg.getNode() == 0 && "Invalid reg-imm address mode!"); + + getAddressOperandsRI(AM12, Base, Disp); + + return true; +} + +/// Returns true if the address can be represented by a base register plus +/// a signed 20-bit displacement [r+imm]. +bool SystemZDAGToDAGISel::SelectAddrRI(SDValue Op, SDValue& Addr, + SDValue &Base, SDValue &Disp) { + SystemZRRIAddressMode AM(/*isRI*/true); + bool Done = false; + + if (!Addr.hasOneUse()) { + unsigned Opcode = Addr.getOpcode(); + if (Opcode != ISD::Constant && Opcode != ISD::FrameIndex) { + // If we are able to fold N into addressing mode, then we'll allow it even + // if N has multiple uses. In general, addressing computation is used as + // addresses by all of its uses. But watch out for CopyToReg uses, that + // means the address computation is liveout. It will be computed by a LA + // so we want to avoid computing the address twice. + for (SDNode::use_iterator UI = Addr.getNode()->use_begin(), + UE = Addr.getNode()->use_end(); UI != UE; ++UI) { + if (UI->getOpcode() == ISD::CopyToReg) { + MatchAddressBase(Addr, AM); + Done = true; + break; + } + } + } + } + if (!Done && MatchAddress(Addr, AM, /* is12Bit */ false)) + return false; + + DOUT << "MatchAddress (final): "; DEBUG(AM.dump()); + + MVT VT = Addr.getValueType(); + if (AM.BaseType == SystemZRRIAddressMode::RegBase) { + if (!AM.Base.Reg.getNode()) + AM.Base.Reg = CurDAG->getRegister(0, VT); + } + + assert(AM.IndexReg.getNode() == 0 && "Invalid reg-imm address mode!"); + + getAddressOperandsRI(AM, Base, Disp); + + return true; +} + /// Returns true if the address can be represented by a base register plus /// index register plus an unsigned 12-bit displacement [base + idx + imm]. bool SystemZDAGToDAGISel::SelectAddrRRI12(SDValue Op, SDValue Addr, SDValue &Base, SDValue &Disp, SDValue &Index) { - SystemZRRIAddressMode AM20, AM12; + SystemZRRIAddressMode AM20(/*isRI*/true), AM12(/*isRI*/true); bool Done = false; if (!Addr.hasOneUse()) { diff --git a/llvm/lib/Target/SystemZ/SystemZInstrInfo.cpp b/llvm/lib/Target/SystemZ/SystemZInstrInfo.cpp index 82018e8550cf..c82aa0b9b4a4 100644 --- a/llvm/lib/Target/SystemZ/SystemZInstrInfo.cpp +++ b/llvm/lib/Target/SystemZ/SystemZInstrInfo.cpp @@ -351,6 +351,9 @@ SystemZInstrInfo::getLongDispOpc(unsigned Opc) const { case SystemZ::MOV64m32r: Opc = SystemZ::MOV64m32ry; break; + case SystemZ::MOV8mi: + Opc = SystemZ::MOV8miy; + break; case SystemZ::MUL32rm: Opc = SystemZ::MUL32rmy; break; diff --git a/llvm/lib/Target/SystemZ/SystemZInstrInfo.td b/llvm/lib/Target/SystemZ/SystemZInstrInfo.td index 845b5f0da374..0be70077b261 100644 --- a/llvm/lib/Target/SystemZ/SystemZInstrInfo.td +++ b/llvm/lib/Target/SystemZ/SystemZInstrInfo.td @@ -244,22 +244,24 @@ def MOV64mr : Pseudo<(outs), (ins rriaddr:$dst, GR64:$src), "stg\t{$src, $dst}", [(store GR64:$src, rriaddr:$dst)]>; -// FIXME: displacements here are really 12 bit, not 20! -def MOV8mi : Pseudo<(outs), (ins riaddr:$dst, i32i8imm:$src), +def MOV8mi : Pseudo<(outs), (ins riaddr12:$dst, i32i8imm:$src), + "mvi\t{$dst, $src}", + [(truncstorei8 (i32 i32immSExt8:$src), riaddr12:$dst)]>; +def MOV8miy : Pseudo<(outs), (ins riaddr:$dst, i32i8imm:$src), "mviy\t{$dst, $src}", [(truncstorei8 (i32 i32immSExt8:$src), riaddr:$dst)]>; -def MOV16mi : Pseudo<(outs), (ins riaddr:$dst, s16imm:$src), +def MOV16mi : Pseudo<(outs), (ins riaddr12:$dst, s16imm:$src), "mvhhi\t{$dst, $src}", - [(truncstorei16 (i32 i32immSExt16:$src), riaddr:$dst)]>, + [(truncstorei16 (i32 i32immSExt16:$src), riaddr12:$dst)]>, Requires<[IsZ10]>; -def MOV32mi16 : Pseudo<(outs), (ins riaddr:$dst, s32imm:$src), +def MOV32mi16 : Pseudo<(outs), (ins riaddr12:$dst, s32imm:$src), "mvhi\t{$dst, $src}", - [(store (i32 immSExt16:$src), riaddr:$dst)]>, + [(store (i32 immSExt16:$src), riaddr12:$dst)]>, Requires<[IsZ10]>; -def MOV64mi16 : Pseudo<(outs), (ins riaddr:$dst, s32imm64:$src), +def MOV64mi16 : Pseudo<(outs), (ins riaddr12:$dst, s32imm64:$src), "mvghi\t{$dst, $src}", - [(store (i64 immSExt16:$src), riaddr:$dst)]>, + [(store (i64 immSExt16:$src), riaddr12:$dst)]>, Requires<[IsZ10]>; // sexts diff --git a/llvm/lib/Target/SystemZ/SystemZOperands.td b/llvm/lib/Target/SystemZ/SystemZOperands.td index 7ac6cc28c11d..495a9d5d5643 100644 --- a/llvm/lib/Target/SystemZ/SystemZOperands.td +++ b/llvm/lib/Target/SystemZ/SystemZOperands.td @@ -252,11 +252,17 @@ def s32imm64 : Operand { // riaddr := reg + imm def riaddr32 : Operand, - ComplexPattern { + ComplexPattern { let PrintMethod = "printRIAddrOperand"; let MIOperandInfo = (ops ADDR32:$base, u12imm:$disp); } +def riaddr12 : Operand, + ComplexPattern { + let PrintMethod = "printRIAddrOperand"; + let MIOperandInfo = (ops ADDR64:$base, u12imm64:$disp); +} + def riaddr : Operand, ComplexPattern { let PrintMethod = "printRIAddrOperand"; diff --git a/llvm/test/CodeGen/SystemZ/05-MemImmStores.ll b/llvm/test/CodeGen/SystemZ/05-MemImmStores.ll index b58214414481..1a1d2f0d649b 100644 --- a/llvm/test/CodeGen/SystemZ/05-MemImmStores.ll +++ b/llvm/test/CodeGen/SystemZ/05-MemImmStores.ll @@ -1,7 +1,8 @@ ; RUN: llvm-as < %s | llc -mattr=+z10 | grep mvghi | count 1 ; RUN: llvm-as < %s | llc -mattr=+z10 | grep mvhi | count 1 ; RUN: llvm-as < %s | llc -mattr=+z10 | grep mvhhi | count 1 -; RUN: llvm-as < %s | llc | grep mvi | count 1 +; RUN: llvm-as < %s | llc | grep mvi | count 2 +; RUN: llvm-as < %s | llc | grep mviy | count 1 target datalayout = "E-p:64:64:64-i1:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128" target triple = "s390x-unknown-linux-gnu" @@ -33,3 +34,17 @@ entry: store i8 4, i8* %add.ptr ret void } + +define void @foo5(i8* nocapture %a, i64 %idx) nounwind { +entry: + %add.ptr = getelementptr i8* %a, i64 -1 ; [#uses=1] + store i8 4, i8* %add.ptr + ret void +} + +define void @foo6(i16* nocapture %a, i64 %idx) nounwind { +entry: + %add.ptr = getelementptr i16* %a, i64 -1 ; [#uses=1] + store i16 3, i16* %add.ptr + ret void +}