2012-02-18 20:03:15 +08:00
|
|
|
//===-- X86InstrExtension.td - Sign and Zero Extensions ----*- tablegen -*-===//
|
|
|
|
//
|
2010-10-05 14:52:35 +08:00
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
2012-02-18 20:03:15 +08:00
|
|
|
//
|
2010-10-05 14:52:35 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file describes the sign and zero extension operations.
|
|
|
|
//
|
2017-12-12 01:01:21 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
// Implicit-register sign extensions. None of these take explicit operands:
// each reads and writes only the registers named in its Uses/Defs lists.
// All of them have an empty pattern list and are marked hasSideEffects = 0.
// Opcode 0x98 is shared by CBW/CWDE/CDQE and 0x99 by CWD/CDQ/CQO; the variants
// differ in OpSize16 / OpSize32 / use of the RI class.
let hasSideEffects = 0 in {
  let Defs = [AX], Uses = [AL] in // AX = signext(AL)
  def CBW : I<0x98, RawFrm, (outs), (ins),
              "{cbtw|cbw}", [], IIC_CBW>, OpSize16, Sched<[WriteALU]>;
  let Defs = [EAX], Uses = [AX] in // EAX = signext(AX)
  def CWDE : I<0x98, RawFrm, (outs), (ins),
               "{cwtl|cwde}", [], IIC_CBW>, OpSize32, Sched<[WriteALU]>;

  let Defs = [AX,DX], Uses = [AX] in // DX:AX = signext(AX)
  def CWD : I<0x99, RawFrm, (outs), (ins),
              "{cwtd|cwd}", [], IIC_CBW>, OpSize16, Sched<[WriteALU]>;
  let Defs = [EAX,EDX], Uses = [EAX] in // EDX:EAX = signext(EAX)
  def CDQ : I<0x99, RawFrm, (outs), (ins),
              "{cltd|cdq}", [], IIC_CBW>, OpSize32, Sched<[WriteALU]>;


  let Defs = [RAX], Uses = [EAX] in // RAX = signext(EAX)
  def CDQE : RI<0x98, RawFrm, (outs), (ins),
                "{cltq|cdqe}", [], IIC_CBW>, Sched<[WriteALU]>;

  let Defs = [RAX,RDX], Uses = [RAX] in // RDX:RAX = signext(RAX)
  def CQO : RI<0x99, RawFrm, (outs), (ins),
               "{cqto|cqo}", [], IIC_CBW>, Sched<[WriteALU]>;
}
|
|
|
|
|
|
|
|
// Sign/Zero extenders

// 8-bit to 16-bit sign extension (register and memory source forms).
// Both defs have an empty pattern list; hasSideEffects = 0 is given for the
// pair and mayLoad = 1 for the memory form.
let hasSideEffects = 0 in {
def MOVSX16rr8 : I<0xBE, MRMSrcReg, (outs GR16:$dst), (ins GR8:$src),
                   "movs{bw|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVSX_R16_R8>,
                   TB, OpSize16, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVSX16rm8 : I<0xBE, MRMSrcMem, (outs GR16:$dst), (ins i8mem:$src),
                   "movs{bw|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVSX_R16_M8>,
                   TB, OpSize16, Sched<[WriteALULd]>;
} // hasSideEffects = 0
|
2011-05-21 03:04:40 +08:00
|
|
|
// Sign-extend an 8-bit register into a 32-bit register.
// Selected for (sext GR8:$src) producing a GR32.
def MOVSX32rr8 : I<0xBE, MRMSrcReg, (outs GR32:$dst), (ins GR8:$src),
                   "movs{bl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (sext GR8:$src))], IIC_MOVSX>, TB,
                   OpSize32, Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extending load of an 8-bit memory operand into a 32-bit register.
// Selected for (sextloadi32i8 addr:$src).
def MOVSX32rm8 : I<0xBE, MRMSrcMem, (outs GR32:$dst), (ins i8mem :$src),
                   "movs{bl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (sextloadi32i8 addr:$src))], IIC_MOVSX>, TB,
                   OpSize32, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extend a 16-bit register into a 32-bit register.
// Selected for (sext GR16:$src) producing a GR32.
def MOVSX32rr16: I<0xBF, MRMSrcReg, (outs GR32:$dst), (ins GR16:$src),
                   "movs{wl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (sext GR16:$src))], IIC_MOVSX>, TB,
                   OpSize32, Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extending load of a 16-bit memory operand into a 32-bit register.
// Selected for (sextloadi32i16 addr:$src).
def MOVSX32rm16: I<0xBF, MRMSrcMem, (outs GR32:$dst), (ins i16mem:$src),
                   "movs{wl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (sextloadi32i16 addr:$src))], IIC_MOVSX>,
                   OpSize32, TB, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
|
2014-11-26 08:46:26 +08:00
|
|
|
// 8-bit to 16-bit zero extension (register and memory source forms).
// Both defs have an empty pattern list; hasSideEffects = 0 is given for the
// pair and mayLoad = 1 for the memory form.
let hasSideEffects = 0 in {
def MOVZX16rr8 : I<0xB6, MRMSrcReg, (outs GR16:$dst), (ins GR8:$src),
                   "movz{bw|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX_R16_R8>,
                   TB, OpSize16, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVZX16rm8 : I<0xB6, MRMSrcMem, (outs GR16:$dst), (ins i8mem:$src),
                   "movz{bw|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX_R16_M8>,
                   TB, OpSize16, Sched<[WriteALULd]>;
} // hasSideEffects = 0
|
2010-10-05 14:52:35 +08:00
|
|
|
// Zero-extend an 8-bit register into a 32-bit register.
// Selected for (zext GR8:$src) producing a GR32.
def MOVZX32rr8 : I<0xB6, MRMSrcReg, (outs GR32:$dst), (ins GR8 :$src),
                   "movz{bl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (zext GR8:$src))], IIC_MOVZX>, TB,
                   OpSize32, Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Zero-extending load of an 8-bit memory operand into a 32-bit register.
// Selected for (zextloadi32i8 addr:$src).
def MOVZX32rm8 : I<0xB6, MRMSrcMem, (outs GR32:$dst), (ins i8mem :$src),
                   "movz{bl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (zextloadi32i8 addr:$src))], IIC_MOVZX>, TB,
                   OpSize32, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Zero-extend a 16-bit register into a 32-bit register.
// Selected for (zext GR16:$src) producing a GR32.
def MOVZX32rr16: I<0xB7, MRMSrcReg, (outs GR32:$dst), (ins GR16:$src),
                   "movz{wl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (zext GR16:$src))], IIC_MOVZX>, TB,
                   OpSize32, Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Zero-extending load of a 16-bit memory operand into a 32-bit register.
// Selected for (zextloadi32i16 addr:$src).
def MOVZX32rm16: I<0xB7, MRMSrcMem, (outs GR32:$dst), (ins i16mem:$src),
                   "movz{wl|x}\t{$src, $dst|$dst, $src}",
                   [(set GR32:$dst, (zextloadi32i16 addr:$src))], IIC_MOVZX>,
                   TB, OpSize32, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
|
|
|
|
// These are the same as the regular MOVZX32rr8/MOVZX32rm8 and
// MOVSX32rr8/MOVSX32rm8, except that they use the _NOREX operand classes
// (GR32_NOREX for the output, GR8_NOREX / i8mem_NOREX for the input) instead
// of the unrestricted ones. This allows them to operate on h registers on
// x86-64.
// All four defs are isCodeGenOnly, carry an empty pattern list, and append
// "# NOREX" to the printed assembly.
let hasSideEffects = 0, isCodeGenOnly = 1 in {
def MOVZX32_NOREXrr8 : I<0xB6, MRMSrcReg,
                         (outs GR32_NOREX:$dst), (ins GR8_NOREX:$src),
                         "movz{bl|x}\t{$src, $dst|$dst, $src} # NOREX",
                         [], IIC_MOVZX>, TB, OpSize32, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVZX32_NOREXrm8 : I<0xB6, MRMSrcMem,
                         (outs GR32_NOREX:$dst), (ins i8mem_NOREX:$src),
                         "movz{bl|x}\t{$src, $dst|$dst, $src} # NOREX",
                         [], IIC_MOVZX>, TB, OpSize32, Sched<[WriteALULd]>;

def MOVSX32_NOREXrr8 : I<0xBE, MRMSrcReg,
                         (outs GR32_NOREX:$dst), (ins GR8_NOREX:$src),
                         "movs{bl|x}\t{$src, $dst|$dst, $src} # NOREX",
                         [], IIC_MOVSX>, TB, OpSize32, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVSX32_NOREXrm8 : I<0xBE, MRMSrcMem,
                         (outs GR32_NOREX:$dst), (ins i8mem_NOREX:$src),
                         "movs{bl|x}\t{$src, $dst|$dst, $src} # NOREX",
                         [], IIC_MOVSX>, TB, OpSize32, Sched<[WriteALULd]>;
}
|
2010-10-05 14:52:35 +08:00
|
|
|
|
|
|
|
// MOVSX64rr8 always has a REX prefix and it has an 8-bit register
// operand, which makes it a rare instruction with an 8-bit register
// operand that can never access an h register. If support for h registers
// were generalized, this would require a special register class.
//
// Selected for (sext GR8:$src) producing a GR64.
def MOVSX64rr8 : RI<0xBE, MRMSrcReg, (outs GR64:$dst), (ins GR8 :$src),
                    "movs{bq|x}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sext GR8:$src))], IIC_MOVSX>, TB,
                    Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extending load of an 8-bit memory operand into a 64-bit register.
// Selected for (sextloadi64i8 addr:$src).
def MOVSX64rm8 : RI<0xBE, MRMSrcMem, (outs GR64:$dst), (ins i8mem :$src),
                    "movs{bq|x}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sextloadi64i8 addr:$src))], IIC_MOVSX>,
                    TB, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extend a 16-bit register into a 64-bit register.
// Selected for (sext GR16:$src) producing a GR64.
def MOVSX64rr16: RI<0xBF, MRMSrcReg, (outs GR64:$dst), (ins GR16:$src),
                    "movs{wq|x}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sext GR16:$src))], IIC_MOVSX>, TB,
                    Sched<[WriteALU]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extending load of a 16-bit memory operand into a 64-bit register.
// Selected for (sextloadi64i16 addr:$src).
def MOVSX64rm16: RI<0xBF, MRMSrcMem, (outs GR64:$dst), (ins i16mem:$src),
                    "movs{wq|x}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sextloadi64i16 addr:$src))], IIC_MOVSX>,
                    TB, Sched<[WriteALULd]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extend a 32-bit register into a 64-bit register.
// Selected for (sext GR32:$src) producing a GR64; guarded by the
// In64BitMode predicate.
def MOVSX64rr32: RI<0x63, MRMSrcReg, (outs GR64:$dst), (ins GR32:$src),
                    "movs{lq|xd}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sext GR32:$src))], IIC_MOVSX>,
                    Sched<[WriteALU]>, Requires<[In64BitMode]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
// Sign-extending load of a 32-bit memory operand into a 64-bit register.
// Selected for (sextloadi64i32 addr:$src); guarded by the In64BitMode
// predicate.
def MOVSX64rm32: RI<0x63, MRMSrcMem, (outs GR64:$dst), (ins i32mem:$src),
                    "movs{lq|xd}\t{$src, $dst|$dst, $src}",
                    [(set GR64:$dst, (sextloadi64i32 addr:$src))], IIC_MOVSX>,
                    Sched<[WriteALULd]>, Requires<[In64BitMode]>;
|
2010-10-05 14:52:35 +08:00
|
|
|
|
|
|
|
// movzbq and movzwq encodings for the disassembler
// These four defs have an empty pattern list; hasSideEffects = 0 is given for
// the group and mayLoad = 1 for each memory form.
let hasSideEffects = 0 in {
def MOVZX64rr8 : RI<0xB6, MRMSrcReg, (outs GR64:$dst), (ins GR8:$src),
                    "movz{bq|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX>,
                    TB, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVZX64rm8 : RI<0xB6, MRMSrcMem, (outs GR64:$dst), (ins i8mem:$src),
                    "movz{bq|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX>,
                    TB, Sched<[WriteALULd]>;
def MOVZX64rr16 : RI<0xB7, MRMSrcReg, (outs GR64:$dst), (ins GR16:$src),
                     "movz{wq|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX>,
                     TB, Sched<[WriteALU]>;
let mayLoad = 1 in
def MOVZX64rm16 : RI<0xB7, MRMSrcMem, (outs GR64:$dst), (ins i16mem:$src),
                     "movz{wq|x}\t{$src, $dst|$dst, $src}", [], IIC_MOVZX>,
                     TB, Sched<[WriteALULd]>;
}
|
2010-10-05 14:52:35 +08:00
|
|
|
|
2013-05-30 18:43:18 +08:00
|
|
|
// 64-bit zero-extension patterns use SUBREG_TO_REG and an operation writing a
// 32-bit register.
// Each pattern maps an i8/i16 zero extension (register or load) to the
// corresponding MOVZX32* instruction, placed in the sub_32bit subregister.
def : Pat<(i64 (zext GR8:$src)),
          (SUBREG_TO_REG (i64 0), (MOVZX32rr8 GR8:$src), sub_32bit)>;
def : Pat<(zextloadi64i8 addr:$src),
          (SUBREG_TO_REG (i64 0), (MOVZX32rm8 addr:$src), sub_32bit)>;

def : Pat<(i64 (zext GR16:$src)),
          (SUBREG_TO_REG (i64 0), (MOVZX32rr16 GR16:$src), sub_32bit)>;
def : Pat<(zextloadi64i16 addr:$src),
          (SUBREG_TO_REG (i64 0), (MOVZX32rm16 addr:$src), sub_32bit)>;
|
|
|
|
|
|
|
|
// The preferred way to do 32-bit-to-64-bit zero extension on x86-64 is to use a
// SUBREG_TO_REG to utilize implicit zero-extension. However, this isn't
// possible when the 32-bit value is defined by a truncate or is copied from
// something where the high bits aren't necessarily all zero. In such cases, we
// fall back to these explicit zext instructions.
def : Pat<(i64 (zext GR32:$src)),
          (SUBREG_TO_REG (i64 0), (MOV32rr GR32:$src), sub_32bit)>;
def : Pat<(i64 (zextloadi64i32 addr:$src)),
          (SUBREG_TO_REG (i64 0), (MOV32rm addr:$src), sub_32bit)>;
|