2002-11-18 05:03:35 +08:00
|
|
|
//===-- X86InstrBuilder.h - Functions to aid building x86 insts -*- C++ -*-===//
|
2005-04-22 07:38:14 +08:00
|
|
|
//
|
2003-10-21 23:17:13 +08:00
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
2007-12-30 04:36:04 +08:00
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
2005-04-22 07:38:14 +08:00
|
|
|
//
|
2003-10-21 23:17:13 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
2002-11-18 05:03:35 +08:00
|
|
|
//
|
|
|
|
// This file exposes functions that may be used with BuildMI from the
|
|
|
|
// MachineInstrBuilder.h file to handle X86'isms in a clean way.
|
|
|
|
//
|
|
|
|
// The BuildMem function may be used with the BuildMI function to add entire
|
|
|
|
// memory references in a single, typed, function call. X86 memory references
|
|
|
|
// can be very complex expressions (described in the README), so wrapping them
|
|
|
|
// up behind an easier to use interface makes sense. Descriptions of the
|
|
|
|
// functions are included below.
|
|
|
|
//
|
2002-12-13 17:28:50 +08:00
|
|
|
// For reference, the order of operands for memory references is:
|
|
|
|
//   (Operand), Base, Scale, Index, Displacement, and a trailing register
//   operand (NoReg in the helpers below).
|
|
|
|
//
|
2002-11-18 05:03:35 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef X86INSTRBUILDER_H
|
|
|
|
#define X86INSTRBUILDER_H
|
|
|
|
|
2008-12-04 02:11:40 +08:00
|
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
2002-11-18 05:03:35 +08:00
|
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
2009-09-26 04:36:54 +08:00
|
|
|
#include "llvm/CodeGen/MachineMemOperand.h"
|
2002-11-18 05:03:35 +08:00
|
|
|
|
2003-11-12 06:41:34 +08:00
|
|
|
namespace llvm {
|
|
|
|
|
2004-08-30 08:13:26 +08:00
|
|
|
/// X86AddressMode - This struct holds a generalized full x86 address mode.
|
|
|
|
/// The base register can be a frame index, which will eventually be replaced
|
2004-10-15 12:43:20 +08:00
|
|
|
/// with BP or SP and Disp being offsetted accordingly. The displacement may
|
|
|
|
/// also include the offset of a global value.
|
2004-08-30 08:13:26 +08:00
|
|
|
struct X86AddressMode {
|
2005-01-18 07:25:45 +08:00
|
|
|
enum {
|
|
|
|
RegBase,
|
2006-05-25 01:04:05 +08:00
|
|
|
FrameIndexBase
|
2005-01-18 07:25:45 +08:00
|
|
|
} BaseType;
|
2005-04-22 07:38:14 +08:00
|
|
|
|
2005-01-18 07:25:45 +08:00
|
|
|
union {
|
|
|
|
unsigned Reg;
|
|
|
|
int FrameIndex;
|
|
|
|
} Base;
|
2005-04-22 07:38:14 +08:00
|
|
|
|
2005-01-18 07:25:45 +08:00
|
|
|
unsigned Scale;
|
|
|
|
unsigned IndexReg;
|
2009-09-16 02:27:02 +08:00
|
|
|
int Disp;
|
2010-04-15 09:51:59 +08:00
|
|
|
const GlobalValue *GV;
|
2009-07-01 11:27:19 +08:00
|
|
|
unsigned GVOpFlags;
|
2005-04-22 07:38:14 +08:00
|
|
|
|
2009-07-01 11:27:19 +08:00
|
|
|
X86AddressMode()
|
|
|
|
: BaseType(RegBase), Scale(1), IndexReg(0), Disp(0), GV(0), GVOpFlags(0) {
|
2005-01-18 07:25:45 +08:00
|
|
|
Base.Reg = 0;
|
|
|
|
}
|
2012-06-23 06:07:19 +08:00
|
|
|
|
|
|
|
|
implement rdar://6653118 - fastisel should fold loads where possible.
Since mem2reg isn't run at -O0, we get a ton of reloads from the stack,
for example, before, this code:
int foo(int x, int y, int z) {
return x+y+z;
}
used to compile into:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
movl 4(%rsp), %esi
addl %edx, %esi
movl (%rsp), %edx
addl %esi, %edx
movl %edx, %eax
addq $12, %rsp
ret
Now we produce:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
addl 4(%rsp), %edx ## Folded load
addl (%rsp), %edx ## Folded load
movl %edx, %eax
addq $12, %rsp
ret
Fewer instructions and less register use = faster compiles.
llvm-svn: 113102
2010-09-05 10:18:34 +08:00
|
|
|
void getFullAddress(SmallVectorImpl<MachineOperand> &MO) {
|
|
|
|
assert(Scale == 1 || Scale == 2 || Scale == 4 || Scale == 8);
|
2012-06-23 06:07:19 +08:00
|
|
|
|
implement rdar://6653118 - fastisel should fold loads where possible.
Since mem2reg isn't run at -O0, we get a ton of reloads from the stack,
for example, before, this code:
int foo(int x, int y, int z) {
return x+y+z;
}
used to compile into:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
movl 4(%rsp), %esi
addl %edx, %esi
movl (%rsp), %edx
addl %esi, %edx
movl %edx, %eax
addq $12, %rsp
ret
Now we produce:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
addl 4(%rsp), %edx ## Folded load
addl (%rsp), %edx ## Folded load
movl %edx, %eax
addq $12, %rsp
ret
Fewer instructions and less register use = faster compiles.
llvm-svn: 113102
2010-09-05 10:18:34 +08:00
|
|
|
if (BaseType == X86AddressMode::RegBase)
|
|
|
|
MO.push_back(MachineOperand::CreateReg(Base.Reg, false, false,
|
|
|
|
false, false, false, 0, false));
|
|
|
|
else {
|
|
|
|
assert(BaseType == X86AddressMode::FrameIndexBase);
|
|
|
|
MO.push_back(MachineOperand::CreateFI(Base.FrameIndex));
|
|
|
|
}
|
2012-06-23 06:07:19 +08:00
|
|
|
|
implement rdar://6653118 - fastisel should fold loads where possible.
Since mem2reg isn't run at -O0, we get a ton of reloads from the stack,
for example, before, this code:
int foo(int x, int y, int z) {
return x+y+z;
}
used to compile into:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
movl 4(%rsp), %esi
addl %edx, %esi
movl (%rsp), %edx
addl %esi, %edx
movl %edx, %eax
addq $12, %rsp
ret
Now we produce:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
addl 4(%rsp), %edx ## Folded load
addl (%rsp), %edx ## Folded load
movl %edx, %eax
addq $12, %rsp
ret
Fewer instructions and less register use = faster compiles.
llvm-svn: 113102
2010-09-05 10:18:34 +08:00
|
|
|
MO.push_back(MachineOperand::CreateImm(Scale));
|
|
|
|
MO.push_back(MachineOperand::CreateReg(IndexReg, false, false,
|
|
|
|
false, false, false, 0, false));
|
2012-06-23 06:07:19 +08:00
|
|
|
|
implement rdar://6653118 - fastisel should fold loads where possible.
Since mem2reg isn't run at -O0, we get a ton of reloads from the stack,
for example, before, this code:
int foo(int x, int y, int z) {
return x+y+z;
}
used to compile into:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
movl 4(%rsp), %esi
addl %edx, %esi
movl (%rsp), %edx
addl %esi, %edx
movl %edx, %eax
addq $12, %rsp
ret
Now we produce:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
addl 4(%rsp), %edx ## Folded load
addl (%rsp), %edx ## Folded load
movl %edx, %eax
addq $12, %rsp
ret
Fewer instructions and less register use = faster compiles.
llvm-svn: 113102
2010-09-05 10:18:34 +08:00
|
|
|
if (GV)
|
|
|
|
MO.push_back(MachineOperand::CreateGA(GV, Disp, GVOpFlags));
|
|
|
|
else
|
|
|
|
MO.push_back(MachineOperand::CreateImm(Disp));
|
2012-06-23 06:07:19 +08:00
|
|
|
|
implement rdar://6653118 - fastisel should fold loads where possible.
Since mem2reg isn't run at -O0, we get a ton of reloads from the stack,
for example, before, this code:
int foo(int x, int y, int z) {
return x+y+z;
}
used to compile into:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
movl 4(%rsp), %esi
addl %edx, %esi
movl (%rsp), %edx
addl %esi, %edx
movl %edx, %eax
addq $12, %rsp
ret
Now we produce:
_foo: ## @foo
subq $12, %rsp
movl %edi, 8(%rsp)
movl %esi, 4(%rsp)
movl %edx, (%rsp)
movl 8(%rsp), %edx
addl 4(%rsp), %edx ## Folded load
addl (%rsp), %edx ## Folded load
movl %edx, %eax
addq $12, %rsp
ret
Fewer instructions and less register use = faster compiles.
llvm-svn: 113102
2010-09-05 10:18:34 +08:00
|
|
|
MO.push_back(MachineOperand::CreateReg(0, false, false,
|
|
|
|
false, false, false, 0, false));
|
|
|
|
}
|
2004-08-30 08:13:26 +08:00
|
|
|
};
|
|
|
|
|
2002-11-18 05:03:35 +08:00
|
|
|
/// addDirectMem - This function is used to add a direct memory reference to the
|
2002-12-29 04:26:58 +08:00
|
|
|
/// current instruction -- that is, a dereference of an address in a register,
|
|
|
|
/// with no scale, index or displacement. An example is: DWORD PTR [EAX].
|
|
|
|
///
|
2009-07-16 22:03:08 +08:00
|
|
|
static inline const MachineInstrBuilder &
|
|
|
|
addDirectMem(const MachineInstrBuilder &MIB, unsigned Reg) {
|
2010-07-09 07:46:44 +08:00
|
|
|
// Because memory references are always represented with five
|
|
|
|
// values, this adds: Reg, 1, NoReg, 0, NoReg to the instruction.
|
|
|
|
return MIB.addReg(Reg).addImm(1).addReg(0).addImm(0).addReg(0);
|
2002-11-18 05:03:35 +08:00
|
|
|
}
|
|
|
|
|
2009-04-09 05:14:34 +08:00
|
|
|
|
2009-07-16 22:03:08 +08:00
|
|
|
/// addOffset - Append the remaining four operands of a memory reference
/// whose base operand has already been added to MIB: scale 1, NoReg as the
/// index, Offset as the displacement, and a trailing NoReg.
///
static inline const MachineInstrBuilder &
addOffset(const MachineInstrBuilder &MIB, int Offset) {
  MIB.addImm(1);
  MIB.addReg(0);
  MIB.addImm(Offset);
  return MIB.addReg(0);
}
|
2002-11-23 06:42:12 +08:00
|
|
|
|
2002-12-29 04:26:58 +08:00
|
|
|
/// addRegOffset - This function is used to add a memory reference of the form
|
|
|
|
/// [Reg + Offset], i.e., one with no scale or index, but with a
|
|
|
|
/// displacement. An example is: DWORD PTR [EAX + 4].
|
|
|
|
///
|
2009-07-16 22:03:08 +08:00
|
|
|
static inline const MachineInstrBuilder &
|
|
|
|
addRegOffset(const MachineInstrBuilder &MIB,
|
|
|
|
unsigned Reg, bool isKill, int Offset) {
|
2009-05-14 05:33:08 +08:00
|
|
|
return addOffset(MIB.addReg(Reg, getKillRegState(isKill)), Offset);
|
2009-04-09 05:14:34 +08:00
|
|
|
}
|
|
|
|
|
2005-01-02 10:38:18 +08:00
|
|
|
/// addRegReg - This function is used to add a memory reference of the form:
|
|
|
|
/// [Reg + Reg].
|
2009-07-16 22:03:08 +08:00
|
|
|
static inline const MachineInstrBuilder &addRegReg(const MachineInstrBuilder &MIB,
|
2008-07-03 17:09:37 +08:00
|
|
|
unsigned Reg1, bool isKill1,
|
|
|
|
unsigned Reg2, bool isKill2) {
|
2009-05-14 05:33:08 +08:00
|
|
|
return MIB.addReg(Reg1, getKillRegState(isKill1)).addImm(1)
|
2010-07-09 07:46:44 +08:00
|
|
|
.addReg(Reg2, getKillRegState(isKill2)).addImm(0).addReg(0);
|
2005-01-02 10:38:18 +08:00
|
|
|
}
|
|
|
|
|
2009-07-16 22:03:08 +08:00
|
|
|
/// addFullAddress - Append the complete memory reference described by AM to
/// the instruction being built: the base (register or frame index), the
/// scale, the index register, the displacement (a global address when AM.GV
/// is set, otherwise an immediate) and a trailing NoReg register operand.
///
static inline const MachineInstrBuilder &
addFullAddress(const MachineInstrBuilder &MIB,
               const X86AddressMode &AM) {
  assert(AM.Scale == 1 || AM.Scale == 2 || AM.Scale == 4 || AM.Scale == 8);

  // Base: anything that is not a register base is treated as a frame index.
  if (AM.BaseType != X86AddressMode::RegBase) {
    assert(AM.BaseType == X86AddressMode::FrameIndexBase);
    MIB.addFrameIndex(AM.Base.FrameIndex);
  } else {
    MIB.addReg(AM.Base.Reg);
  }

  // Scale, then index register.
  MIB.addImm(AM.Scale);
  MIB.addReg(AM.IndexReg);

  // Displacement.
  if (!AM.GV)
    MIB.addImm(AM.Disp);
  else
    MIB.addGlobalAddress(AM.GV, AM.Disp, AM.GVOpFlags);

  return MIB.addReg(0);
}
|
|
|
|
|
2002-12-29 04:26:58 +08:00
|
|
|
/// addFrameReference - This function is used to add a reference to the base of
|
|
|
|
/// an abstract object on the stack frame of the current function. This
|
2003-01-13 08:45:53 +08:00
|
|
|
/// reference has base register as the FrameIndex offset until it is resolved.
|
|
|
|
/// This allows a constant offset to be specified as well...
|
2002-12-29 04:26:58 +08:00
|
|
|
///
|
2009-07-16 22:03:08 +08:00
|
|
|
static inline const MachineInstrBuilder &
|
2003-01-13 08:45:53 +08:00
|
|
|
addFrameReference(const MachineInstrBuilder &MIB, int FI, int Offset = 0) {
|
2008-12-04 02:11:40 +08:00
|
|
|
MachineInstr *MI = MIB;
|
|
|
|
MachineFunction &MF = *MI->getParent()->getParent();
|
|
|
|
MachineFrameInfo &MFI = *MF.getFrameInfo();
|
2011-06-29 03:10:37 +08:00
|
|
|
const MCInstrDesc &MCID = MI->getDesc();
|
2008-12-04 02:11:40 +08:00
|
|
|
unsigned Flags = 0;
|
2011-06-29 03:10:37 +08:00
|
|
|
if (MCID.mayLoad())
|
2008-12-04 02:11:40 +08:00
|
|
|
Flags |= MachineMemOperand::MOLoad;
|
2011-06-29 03:10:37 +08:00
|
|
|
if (MCID.mayStore())
|
2008-12-04 02:11:40 +08:00
|
|
|
Flags |= MachineMemOperand::MOStore;
|
2009-09-26 04:36:54 +08:00
|
|
|
MachineMemOperand *MMO =
|
2010-09-21 14:22:23 +08:00
|
|
|
MF.getMachineMemOperand(MachinePointerInfo::getFixedStack(FI, Offset),
|
2010-09-21 12:39:43 +08:00
|
|
|
Flags, MFI.getObjectSize(FI),
|
2009-09-26 04:36:54 +08:00
|
|
|
MFI.getObjectAlignment(FI));
|
2009-04-09 05:14:34 +08:00
|
|
|
return addOffset(MIB.addFrameIndex(FI), Offset)
|
2008-12-04 02:11:40 +08:00
|
|
|
.addMemOperand(MMO);
|
2003-01-13 08:45:53 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/// addConstantPoolReference - This function is used to add a reference to the
|
|
|
|
/// base of a constant value spilled to the per-function constant pool. The
|
2008-09-30 09:21:32 +08:00
|
|
|
/// reference uses the abstract ConstantPoolIndex which is retained until
|
|
|
|
/// either machine code emission or assembly output. In PIC mode on x86-32,
|
|
|
|
/// the GlobalBaseReg parameter can be used to make this a
|
|
|
|
/// GlobalBaseReg-relative reference.
|
2003-01-13 08:45:53 +08:00
|
|
|
///
|
2009-07-16 22:03:08 +08:00
|
|
|
static inline const MachineInstrBuilder &
|
2008-09-30 09:21:32 +08:00
|
|
|
addConstantPoolReference(const MachineInstrBuilder &MIB, unsigned CPI,
|
2009-06-27 09:31:51 +08:00
|
|
|
unsigned GlobalBaseReg, unsigned char OpFlags) {
|
2009-04-09 05:14:34 +08:00
|
|
|
//FIXME: factor this
|
|
|
|
return MIB.addReg(GlobalBaseReg).addImm(1).addReg(0)
|
2009-06-27 09:31:51 +08:00
|
|
|
.addConstantPoolIndex(CPI, 0, OpFlags).addReg(0);
|
2002-12-29 04:26:58 +08:00
|
|
|
}
|
|
|
|
|
2003-11-12 06:41:34 +08:00
|
|
|
} // End llvm namespace
|
|
|
|
|
2002-11-18 05:03:35 +08:00
|
|
|
#endif
|