[Hexagon] Adding halfword to doubleword multiplies.

llvm-svn: 224289
This commit is contained in:
Colin LeMahieu 2014-12-15 23:29:37 +00:00
parent 64ffd52943
commit 18c927620a
2 changed files with 83 additions and 0 deletions

View File

@ -2220,6 +2220,65 @@ def : T_MType_acc_pat1 <M2_macsin, mul, sub, u8ExtPred>;
def : T_MType_acc_pat1 <M2_naccii, add, sub, s8_16ExtPred>; def : T_MType_acc_pat1 <M2_naccii, add, sub, s8_16ExtPred>;
def : T_MType_acc_pat2 <M2_nacci, add, sub>; def : T_MType_acc_pat2 <M2_nacci, add, sub>;
//===----------------------------------------------------------------------===//
// Template Class -- Multiply signed/unsigned halfwords with and without
// saturation and rounding
//===----------------------------------------------------------------------===//
class T_M2_mpyd < bits<2> LHbits, bit isRnd, bit hasShift, bit isUnsigned >
: MInst < (outs DoubleRegs:$Rdd), (ins IntRegs:$Rs, IntRegs:$Rt),
"$Rdd = "#!if(isUnsigned,"mpyu","mpy")#"($Rs."#!if(LHbits{1},"h","l")
#", $Rt."#!if(LHbits{0},"h)","l)")
#!if(hasShift,":<<1","")
#!if(isRnd,":rnd",""),
[] > {
bits<5> Rdd;
bits<5> Rs;
bits<5> Rt;
let IClass = 0b1110;
let Inst{27-24} = 0b0100;
let Inst{23} = hasShift;
let Inst{22} = isUnsigned;
let Inst{21} = isRnd;
let Inst{6-5} = LHbits;
let Inst{4-0} = Rdd;
let Inst{20-16} = Rs;
let Inst{12-8} = Rt;
}
let isCodeGenOnly = 0 in {
def M2_mpyd_hh_s0: T_M2_mpyd<0b11, 0, 0, 0>;
def M2_mpyd_hl_s0: T_M2_mpyd<0b10, 0, 0, 0>;
def M2_mpyd_lh_s0: T_M2_mpyd<0b01, 0, 0, 0>;
def M2_mpyd_ll_s0: T_M2_mpyd<0b00, 0, 0, 0>;
def M2_mpyd_hh_s1: T_M2_mpyd<0b11, 0, 1, 0>;
def M2_mpyd_hl_s1: T_M2_mpyd<0b10, 0, 1, 0>;
def M2_mpyd_lh_s1: T_M2_mpyd<0b01, 0, 1, 0>;
def M2_mpyd_ll_s1: T_M2_mpyd<0b00, 0, 1, 0>;
def M2_mpyd_rnd_hh_s0: T_M2_mpyd<0b11, 1, 0, 0>;
def M2_mpyd_rnd_hl_s0: T_M2_mpyd<0b10, 1, 0, 0>;
def M2_mpyd_rnd_lh_s0: T_M2_mpyd<0b01, 1, 0, 0>;
def M2_mpyd_rnd_ll_s0: T_M2_mpyd<0b00, 1, 0, 0>;
def M2_mpyd_rnd_hh_s1: T_M2_mpyd<0b11, 1, 1, 0>;
def M2_mpyd_rnd_hl_s1: T_M2_mpyd<0b10, 1, 1, 0>;
def M2_mpyd_rnd_lh_s1: T_M2_mpyd<0b01, 1, 1, 0>;
def M2_mpyd_rnd_ll_s1: T_M2_mpyd<0b00, 1, 1, 0>;
//Rdd=mpyu(Rs.[HL],Rt.[HL])[:<<1]
def M2_mpyud_hh_s0: T_M2_mpyd<0b11, 0, 0, 1>;
def M2_mpyud_hl_s0: T_M2_mpyd<0b10, 0, 0, 1>;
def M2_mpyud_lh_s0: T_M2_mpyd<0b01, 0, 0, 1>;
def M2_mpyud_ll_s0: T_M2_mpyd<0b00, 0, 0, 1>;
def M2_mpyud_hh_s1: T_M2_mpyd<0b11, 0, 1, 1>;
def M2_mpyud_hl_s1: T_M2_mpyd<0b10, 0, 1, 1>;
def M2_mpyud_lh_s1: T_M2_mpyd<0b01, 0, 1, 1>;
def M2_mpyud_ll_s1: T_M2_mpyd<0b00, 0, 1, 1>;
}
// Multiply and use lower result. // Multiply and use lower result.
// Rd=+mpyi(Rs,#u8) // Rd=+mpyi(Rs,#u8)

View File

@ -12,6 +12,22 @@
# CHECK: r17 = mpyi(r21, r31) # CHECK: r17 = mpyi(r21, r31)
0x11 0xdf 0x15 0xef 0x11 0xdf 0x15 0xef
# CHECK: r17 += mpyi(r21, r31) # CHECK: r17 += mpyi(r21, r31)
0x10 0xdf 0x95 0xe4
# CHECK: r17:16 = mpy(r21.l, r31.l):<<1
0x30 0xdf 0x95 0xe4
# CHECK: r17:16 = mpy(r21.l, r31.h):<<1
0x50 0xdf 0x95 0xe4
# CHECK: r17:16 = mpy(r21.h, r31.l):<<1
0x70 0xdf 0x95 0xe4
# CHECK: r17:16 = mpy(r21.h, r31.h):<<1
0x10 0xdf 0xb5 0xe4
# CHECK: r17:16 = mpy(r21.l, r31.l):<<1:rnd
0x30 0xdf 0xb5 0xe4
# CHECK: r17:16 = mpy(r21.l, r31.h):<<1:rnd
0x50 0xdf 0xb5 0xe4
# CHECK: r17:16 = mpy(r21.h, r31.l):<<1:rnd
0x70 0xdf 0xb5 0xe4
# CHECK: r17:16 = mpy(r21.h, r31.h):<<1:rnd
0x10 0xdf 0x95 0xe6 0x10 0xdf 0x95 0xe6
# CHECK: r17:16 += mpy(r21.l, r31.l):<<1 # CHECK: r17:16 += mpy(r21.l, r31.l):<<1
0x30 0xdf 0x95 0xe6 0x30 0xdf 0x95 0xe6
@ -92,6 +108,14 @@
# CHECK: r17 -= mpy(r21.h, r31.l):<<1:sat # CHECK: r17 -= mpy(r21.h, r31.l):<<1:sat
0xf1 0xdf 0xb5 0xee 0xf1 0xdf 0xb5 0xee
# CHECK: r17 -= mpy(r21.h, r31.h):<<1:sat # CHECK: r17 -= mpy(r21.h, r31.h):<<1:sat
0x10 0xdf 0xd5 0xe4
# CHECK: r17:16 = mpyu(r21.l, r31.l):<<1
0x30 0xdf 0xd5 0xe4
# CHECK: r17:16 = mpyu(r21.l, r31.h):<<1
0x50 0xdf 0xd5 0xe4
# CHECK: r17:16 = mpyu(r21.h, r31.l):<<1
0x70 0xdf 0xd5 0xe4
# CHECK: r17:16 = mpyu(r21.h, r31.h):<<1
0x10 0xdf 0xd5 0xe6 0x10 0xdf 0xd5 0xe6
# CHECK: r17:16 += mpyu(r21.l, r31.l):<<1 # CHECK: r17:16 += mpyu(r21.l, r31.l):<<1
0x30 0xdf 0xd5 0xe6 0x30 0xdf 0xd5 0xe6