forked from OSchip/llvm-project
R600/SI: Implement add i64, but do not yet enable.
Test doesn't actually check the output. I need to fix add i64 being matched for the addressing calculations. llvm-svn: 195040
This commit is contained in:
parent
bf6e1e7ff7
commit
fb826fa6e1
|
@ -424,6 +424,7 @@ SDValue SITargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const {
|
|||
SIMachineFunctionInfo *MFI = MF.getInfo<SIMachineFunctionInfo>();
|
||||
switch (Op.getOpcode()) {
|
||||
default: return AMDGPUTargetLowering::LowerOperation(Op, DAG);
|
||||
case ISD::ADD: return LowerADD(Op, DAG);
|
||||
case ISD::BRCOND: return LowerBRCOND(Op, DAG);
|
||||
case ISD::LOAD: {
|
||||
LoadSDNode *Load = dyn_cast<LoadSDNode>(Op);
|
||||
|
@ -560,6 +561,33 @@ SDValue SITargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const {
|
|||
return SDValue();
|
||||
}
|
||||
|
||||
SDValue SITargetLowering::LowerADD(SDValue Op,
|
||||
SelectionDAG &DAG) const {
|
||||
if (Op.getValueType() != MVT::i64)
|
||||
return SDValue();
|
||||
|
||||
SDLoc DL(Op);
|
||||
SDValue LHS = Op.getOperand(0);
|
||||
SDValue RHS = Op.getOperand(1);
|
||||
|
||||
SDValue Zero = DAG.getConstant(0, MVT::i32);
|
||||
SDValue One = DAG.getConstant(1, MVT::i32);
|
||||
|
||||
SDValue Lo0 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i32, LHS, Zero);
|
||||
SDValue Hi0 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i32, LHS, One);
|
||||
|
||||
SDValue Lo1 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i32, RHS, Zero);
|
||||
SDValue Hi1 = DAG.getNode(ISD::EXTRACT_ELEMENT, DL, MVT::i32, RHS, One);
|
||||
|
||||
SDVTList VTList = DAG.getVTList(MVT::i32, MVT::Glue);
|
||||
|
||||
SDValue AddLo = DAG.getNode(ISD::ADDC, DL, VTList, Lo0, Lo1);
|
||||
SDValue Carry = AddLo.getValue(1);
|
||||
SDValue AddHi = DAG.getNode(ISD::ADDE, DL, VTList, Hi0, Hi1, Carry);
|
||||
|
||||
return DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i64, AddLo, AddHi.getValue(0));
|
||||
}
|
||||
|
||||
/// \brief Helper function for LowerBRCOND
|
||||
static SDNode *findUser(SDValue Value, unsigned Opcode) {
|
||||
|
||||
|
|
|
@ -30,6 +30,7 @@ class SITargetLowering : public AMDGPUTargetLowering {
|
|||
SDValue LowerSIGN_EXTEND(SDValue Op, SelectionDAG &DAG) const;
|
||||
SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
|
||||
SDValue LowerZERO_EXTEND(SDValue Op, SelectionDAG &DAG) const;
|
||||
SDValue LowerADD(SDValue Op, SelectionDAG &DAG) const;
|
||||
SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
|
||||
|
||||
SDValue ResourceDescriptorToi128(SDValue Op, SelectionDAG &DAG) const;
|
||||
|
|
|
@ -0,0 +1,45 @@
|
|||
; XFAIL: *
|
||||
; This will fail until i64 add is enabled
|
||||
|
||||
; RUN: llc < %s -march=r600 -mcpu=SI | FileCheck --check-prefix=SI %s
|
||||
|
||||
|
||||
declare i32 @llvm.SI.tid() readnone
|
||||
|
||||
; SI-LABEL: @test_i64_vreg:
|
||||
define void @test_i64_vreg(i64 addrspace(1)* noalias %out, i64 addrspace(1)* noalias %inA, i64 addrspace(1)* noalias %inB) {
|
||||
%tid = call i32 @llvm.SI.tid() readnone
|
||||
%a_ptr = getelementptr i64 addrspace(1)* %inA, i32 %tid
|
||||
%b_ptr = getelementptr i64 addrspace(1)* %inB, i32 %tid
|
||||
%a = load i64 addrspace(1)* %a_ptr
|
||||
%b = load i64 addrspace(1)* %b_ptr
|
||||
%result = add i64 %a, %b
|
||||
store i64 %result, i64 addrspace(1)* %out
|
||||
ret void
|
||||
}
|
||||
|
||||
; SI-LABEL: @test_i64_sreg:
|
||||
define void @test_i64_sreg(i64 addrspace(1)* noalias %out, i64 %a, i64 %b) {
|
||||
%result = add i64 %a, %b
|
||||
store i64 %result, i64 addrspace(1)* %out
|
||||
ret void
|
||||
}
|
||||
|
||||
; SI-LABEL: @test_v2i64_sreg:
|
||||
define void @test_v2i64_sreg(<2 x i64> addrspace(1)* noalias %out, <2 x i64> %a, <2 x i64> %b) {
|
||||
%result = add <2 x i64> %a, %b
|
||||
store <2 x i64> %result, <2 x i64> addrspace(1)* %out
|
||||
ret void
|
||||
}
|
||||
|
||||
; SI-LABEL: @test_v2i64_vreg:
|
||||
define void @test_v2i64_vreg(<2 x i64> addrspace(1)* noalias %out, <2 x i64> addrspace(1)* noalias %inA, <2 x i64> addrspace(1)* noalias %inB) {
|
||||
%tid = call i32 @llvm.SI.tid() readnone
|
||||
%a_ptr = getelementptr <2 x i64> addrspace(1)* %inA, i32 %tid
|
||||
%b_ptr = getelementptr <2 x i64> addrspace(1)* %inB, i32 %tid
|
||||
%a = load <2 x i64> addrspace(1)* %a_ptr
|
||||
%b = load <2 x i64> addrspace(1)* %b_ptr
|
||||
%result = add <2 x i64> %a, %b
|
||||
store <2 x i64> %result, <2 x i64> addrspace(1)* %out
|
||||
ret void
|
||||
}
|
Loading…
Reference in New Issue