2010-06-09 00:52:24 +08:00
|
|
|
//===-- ArchSpec.cpp --------------------------------------------*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "lldb/Core/ArchSpec.h"
|
|
|
|
|
2010-06-11 12:26:08 +08:00
|
|
|
#include <stdio.h>
|
2010-06-09 00:52:24 +08:00
|
|
|
|
|
|
|
#include <string>
|
|
|
|
|
2010-06-11 11:25:34 +08:00
|
|
|
#include "llvm/Support/ELF.h"
|
2011-02-25 03:13:58 +08:00
|
|
|
#include "llvm/Support/Host.h"
|
2010-06-11 11:25:34 +08:00
|
|
|
#include "llvm/Support/MachO.h"
|
2011-02-16 05:59:32 +08:00
|
|
|
#include "lldb/Host/Endian.h"
|
|
|
|
#include "lldb/Host/Host.h"
|
2011-04-08 06:46:35 +08:00
|
|
|
#include "lldb/Target/Platform.h"
|
2010-06-11 11:25:34 +08:00
|
|
|
|
2010-06-09 00:52:24 +08:00
|
|
|
using namespace lldb;
|
|
|
|
using namespace lldb_private;
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
#define ARCH_SPEC_SEPARATOR_CHAR '-'
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
namespace lldb_private {
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
struct CoreDefinition
|
|
|
|
{
|
|
|
|
ByteOrder default_byte_order;
|
|
|
|
uint32_t addr_byte_size;
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
uint32_t min_opcode_byte_size;
|
|
|
|
uint32_t max_opcode_byte_size;
|
2011-02-23 08:35:02 +08:00
|
|
|
llvm::Triple::ArchType machine;
|
|
|
|
ArchSpec::Core core;
|
|
|
|
const char *name;
|
|
|
|
};
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
}
|
2010-06-11 11:25:34 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
// This core information can be looked using the ArchSpec::Core as the index
|
|
|
|
static const CoreDefinition g_core_definitions[ArchSpec::kNumCores] =
|
2010-06-11 11:25:34 +08:00
|
|
|
{
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
// TODO: verify alpha has 32 bit fixed instructions
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::alpha , ArchSpec::eCore_alpha_generic , "alpha" },
|
|
|
|
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_generic , "arm" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv4 , "armv4" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv4t , "armv4t" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv5 , "armv5" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv5t , "armv5t" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv6 , "armv6" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv7 , "armv7" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv7f , "armv7f" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv7k , "armv7k" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_armv7s , "armv7s" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::arm , ArchSpec::eCore_arm_xscale , "xscale" },
|
|
|
|
{ eByteOrderLittle, 4, 2, 4, llvm::Triple::thumb , ArchSpec::eCore_thumb_generic , "thumb" },
|
2011-02-23 08:35:02 +08:00
|
|
|
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_generic , "ppc" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc601 , "ppc601" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc602 , "ppc602" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc603 , "ppc603" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc603e , "ppc603e" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc603ev , "ppc603ev" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc604 , "ppc604" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc604e , "ppc604e" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc620 , "ppc620" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc750 , "ppc750" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc7400 , "ppc7400" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc7450 , "ppc7450" },
|
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::ppc , ArchSpec::eCore_ppc_ppc970 , "ppc970" },
|
2011-02-23 08:35:02 +08:00
|
|
|
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
{ eByteOrderLittle, 8, 4, 4, llvm::Triple::ppc64 , ArchSpec::eCore_ppc64_generic , "ppc64" },
|
|
|
|
{ eByteOrderLittle, 8, 4, 4, llvm::Triple::ppc64 , ArchSpec::eCore_ppc64_ppc970_64 , "ppc970-64" },
|
2011-02-23 08:35:02 +08:00
|
|
|
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
{ eByteOrderLittle, 4, 4, 4, llvm::Triple::sparc , ArchSpec::eCore_sparc_generic , "sparc" },
|
|
|
|
{ eByteOrderLittle, 8, 4, 4, llvm::Triple::sparcv9, ArchSpec::eCore_sparc9_generic , "sparcv9" },
|
2011-02-23 08:35:02 +08:00
|
|
|
|
2011-04-14 06:47:15 +08:00
|
|
|
{ eByteOrderLittle, 4, 1, 15, llvm::Triple::x86 , ArchSpec::eCore_x86_32_i386 , "i386" },
|
|
|
|
{ eByteOrderLittle, 4, 1, 15, llvm::Triple::x86 , ArchSpec::eCore_x86_32_i486 , "i486" },
|
|
|
|
{ eByteOrderLittle, 4, 1, 15, llvm::Triple::x86 , ArchSpec::eCore_x86_32_i486sx , "i486sx" },
|
2011-02-23 08:35:02 +08:00
|
|
|
|
2011-04-14 06:47:15 +08:00
|
|
|
{ eByteOrderLittle, 8, 1, 15, llvm::Triple::x86_64 , ArchSpec::eCore_x86_64_x86_64 , "x86_64" }
|
2010-06-11 11:25:34 +08:00
|
|
|
};
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
struct ArchDefinitionEntry
|
|
|
|
{
|
|
|
|
ArchSpec::Core core;
|
|
|
|
uint32_t cpu;
|
|
|
|
uint32_t sub;
|
|
|
|
};
|
2010-06-11 11:25:34 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
struct ArchDefinition
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
ArchitectureType type;
|
|
|
|
size_t num_entries;
|
|
|
|
const ArchDefinitionEntry *entries;
|
|
|
|
uint32_t cpu_mask;
|
|
|
|
uint32_t sub_mask;
|
|
|
|
const char *name;
|
2010-06-09 00:52:24 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2011-04-14 06:47:15 +08:00
|
|
|
uint32_t
|
|
|
|
ArchSpec::AutoComplete (const char *name, StringList &matches)
|
|
|
|
{
|
|
|
|
uint32_t i;
|
|
|
|
if (name && name[0])
|
|
|
|
{
|
|
|
|
for (i = 0; i < ArchSpec::kNumCores; ++i)
|
|
|
|
{
|
|
|
|
if (NameMatches(g_core_definitions[i].name, eNameMatchStartsWith, name))
|
|
|
|
matches.AppendString (g_core_definitions[i].name);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
for (i = 0; i < ArchSpec::kNumCores; ++i)
|
|
|
|
matches.AppendString (g_core_definitions[i].name);
|
|
|
|
}
|
|
|
|
return matches.GetSize();
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
#define CPU_ANY (UINT32_MAX)
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// A table that gets searched linearly for matches. This table is used to
|
|
|
|
// convert cpu type and subtypes to architecture names, and to convert
|
|
|
|
// architecture names to cpu types and subtypes. The ordering is important and
|
|
|
|
// allows the precedence to be set when the table is built.
|
|
|
|
static const ArchDefinitionEntry g_macho_arch_entries[] =
|
|
|
|
{
|
|
|
|
{ ArchSpec::eCore_arm_generic , llvm::MachO::CPUTypeARM , CPU_ANY },
|
|
|
|
{ ArchSpec::eCore_arm_generic , llvm::MachO::CPUTypeARM , 0 },
|
|
|
|
{ ArchSpec::eCore_arm_armv4 , llvm::MachO::CPUTypeARM , 5 },
|
|
|
|
{ ArchSpec::eCore_arm_armv6 , llvm::MachO::CPUTypeARM , 6 },
|
|
|
|
{ ArchSpec::eCore_arm_armv5 , llvm::MachO::CPUTypeARM , 7 },
|
|
|
|
{ ArchSpec::eCore_arm_xscale , llvm::MachO::CPUTypeARM , 8 },
|
|
|
|
{ ArchSpec::eCore_arm_armv7 , llvm::MachO::CPUTypeARM , 9 },
|
2011-03-19 09:12:21 +08:00
|
|
|
{ ArchSpec::eCore_arm_armv7f , llvm::MachO::CPUTypeARM , 10 },
|
|
|
|
{ ArchSpec::eCore_arm_armv7k , llvm::MachO::CPUTypeARM , 12 },
|
|
|
|
{ ArchSpec::eCore_arm_armv7s , llvm::MachO::CPUTypeARM , 11 },
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
{ ArchSpec::eCore_thumb_generic , llvm::MachO::CPUTypeARM , 0 },
|
2011-02-23 08:35:02 +08:00
|
|
|
{ ArchSpec::eCore_ppc_generic , llvm::MachO::CPUTypePowerPC , CPU_ANY },
|
|
|
|
{ ArchSpec::eCore_ppc_generic , llvm::MachO::CPUTypePowerPC , 0 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc601 , llvm::MachO::CPUTypePowerPC , 1 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc602 , llvm::MachO::CPUTypePowerPC , 2 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc603 , llvm::MachO::CPUTypePowerPC , 3 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc603e , llvm::MachO::CPUTypePowerPC , 4 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc603ev , llvm::MachO::CPUTypePowerPC , 5 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc604 , llvm::MachO::CPUTypePowerPC , 6 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc604e , llvm::MachO::CPUTypePowerPC , 7 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc620 , llvm::MachO::CPUTypePowerPC , 8 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc750 , llvm::MachO::CPUTypePowerPC , 9 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc7400 , llvm::MachO::CPUTypePowerPC , 10 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc7450 , llvm::MachO::CPUTypePowerPC , 11 },
|
|
|
|
{ ArchSpec::eCore_ppc_ppc970 , llvm::MachO::CPUTypePowerPC , 100 },
|
|
|
|
{ ArchSpec::eCore_ppc64_generic , llvm::MachO::CPUTypePowerPC64 , 0 },
|
|
|
|
{ ArchSpec::eCore_ppc64_ppc970_64 , llvm::MachO::CPUTypePowerPC64 , 100 },
|
|
|
|
{ ArchSpec::eCore_x86_32_i386 , llvm::MachO::CPUTypeI386 , 3 },
|
|
|
|
{ ArchSpec::eCore_x86_32_i486 , llvm::MachO::CPUTypeI386 , 4 },
|
|
|
|
{ ArchSpec::eCore_x86_32_i486sx , llvm::MachO::CPUTypeI386 , 0x84 },
|
|
|
|
{ ArchSpec::eCore_x86_32_i386 , llvm::MachO::CPUTypeI386 , CPU_ANY },
|
|
|
|
{ ArchSpec::eCore_x86_64_x86_64 , llvm::MachO::CPUTypeX86_64 , 3 },
|
|
|
|
{ ArchSpec::eCore_x86_64_x86_64 , llvm::MachO::CPUTypeX86_64 , CPU_ANY }
|
|
|
|
};
|
|
|
|
static const ArchDefinition g_macho_arch_def = {
|
|
|
|
eArchTypeMachO,
|
|
|
|
sizeof(g_macho_arch_entries)/sizeof(g_macho_arch_entries[0]),
|
|
|
|
g_macho_arch_entries,
|
|
|
|
UINT32_MAX, // CPU type mask
|
|
|
|
0x00FFFFFFu, // CPU subtype mask
|
|
|
|
"mach-o"
|
|
|
|
};
|
2010-06-11 11:25:34 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// A table that gets searched linearly for matches. This table is used to
|
|
|
|
// convert cpu type and subtypes to architecture names, and to convert
|
|
|
|
// architecture names to cpu types and subtypes. The ordering is important and
|
|
|
|
// allows the precedence to be set when the table is built.
|
|
|
|
static const ArchDefinitionEntry g_elf_arch_entries[] =
|
|
|
|
{
|
|
|
|
{ ArchSpec::eCore_sparc_generic , llvm::ELF::EM_SPARC , LLDB_INVALID_CPUTYPE }, // Sparc
|
|
|
|
{ ArchSpec::eCore_x86_32_i386 , llvm::ELF::EM_386 , LLDB_INVALID_CPUTYPE }, // Intel 80386
|
|
|
|
{ ArchSpec::eCore_x86_32_i486 , llvm::ELF::EM_486 , LLDB_INVALID_CPUTYPE }, // Intel 486 (deprecated)
|
|
|
|
{ ArchSpec::eCore_ppc_generic , llvm::ELF::EM_PPC , LLDB_INVALID_CPUTYPE }, // PowerPC
|
|
|
|
{ ArchSpec::eCore_ppc64_generic , llvm::ELF::EM_PPC64 , LLDB_INVALID_CPUTYPE }, // PowerPC64
|
|
|
|
{ ArchSpec::eCore_arm_generic , llvm::ELF::EM_ARM , LLDB_INVALID_CPUTYPE }, // ARM
|
|
|
|
{ ArchSpec::eCore_alpha_generic , llvm::ELF::EM_ALPHA , LLDB_INVALID_CPUTYPE }, // DEC Alpha
|
|
|
|
{ ArchSpec::eCore_sparc9_generic , llvm::ELF::EM_SPARCV9, LLDB_INVALID_CPUTYPE }, // SPARC V9
|
|
|
|
{ ArchSpec::eCore_x86_64_x86_64 , llvm::ELF::EM_X86_64 , LLDB_INVALID_CPUTYPE }, // AMD64
|
2010-06-11 11:25:34 +08:00
|
|
|
};
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
static const ArchDefinition g_elf_arch_def = {
|
|
|
|
eArchTypeELF,
|
|
|
|
sizeof(g_elf_arch_entries)/sizeof(g_elf_arch_entries[0]),
|
|
|
|
g_elf_arch_entries,
|
|
|
|
UINT32_MAX, // CPU type mask
|
|
|
|
UINT32_MAX, // CPU subtype mask
|
|
|
|
"elf",
|
|
|
|
};
|
2010-06-11 11:25:34 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Table of all ArchDefinitions
|
|
|
|
static const ArchDefinition *g_arch_definitions[] = {
|
|
|
|
&g_macho_arch_def,
|
|
|
|
&g_elf_arch_def,
|
|
|
|
};
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
static const size_t k_num_arch_definitions =
|
|
|
|
sizeof(g_arch_definitions) / sizeof(g_arch_definitions[0]);
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Static helper functions.
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
|
|
|
|
// Get the architecture definition for a given object type.
|
|
|
|
static const ArchDefinition *
|
|
|
|
FindArchDefinition (ArchitectureType arch_type)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
for (unsigned int i = 0; i < k_num_arch_definitions; ++i)
|
|
|
|
{
|
|
|
|
const ArchDefinition *def = g_arch_definitions[i];
|
|
|
|
if (def->type == arch_type)
|
|
|
|
return def;
|
|
|
|
}
|
|
|
|
return NULL;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
// Get an architecture definition by name.
|
|
|
|
static const CoreDefinition *
|
|
|
|
FindCoreDefinition (llvm::StringRef name)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
for (unsigned int i = 0; i < ArchSpec::kNumCores; ++i)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (name.equals_lower(g_core_definitions[i].name))
|
|
|
|
return &g_core_definitions[i];
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
return NULL;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
static inline const CoreDefinition *
|
|
|
|
FindCoreDefinition (ArchSpec::Core core)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (core >= 0 && core < ArchSpec::kNumCores)
|
|
|
|
return &g_core_definitions[core];
|
|
|
|
return NULL;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
// Get a definition entry by cpu type and subtype.
|
|
|
|
static const ArchDefinitionEntry *
|
|
|
|
FindArchDefinitionEntry (const ArchDefinition *def, uint32_t cpu, uint32_t sub)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (def == NULL)
|
2010-06-11 11:25:34 +08:00
|
|
|
return NULL;
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
const uint32_t cpu_mask = def->cpu_mask;
|
|
|
|
const uint32_t sub_mask = def->sub_mask;
|
|
|
|
const ArchDefinitionEntry *entries = def->entries;
|
|
|
|
for (size_t i = 0; i < def->num_entries; ++i)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if ((entries[i].cpu == (cpu_mask & cpu)) &&
|
|
|
|
(entries[i].sub == (sub_mask & sub)))
|
|
|
|
return &entries[i];
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
return NULL;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
static const ArchDefinitionEntry *
|
|
|
|
FindArchDefinitionEntry (const ArchDefinition *def, ArchSpec::Core core)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (def == NULL)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
const ArchDefinitionEntry *entries = def->entries;
|
|
|
|
for (size_t i = 0; i < def->num_entries; ++i)
|
2010-06-11 11:25:34 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (entries[i].core == core)
|
|
|
|
return &entries[i];
|
2010-06-11 11:25:34 +08:00
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
return NULL;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Constructors and destructors.
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
ArchSpec::ArchSpec() :
|
|
|
|
m_triple (),
|
|
|
|
m_core (kCore_invalid),
|
|
|
|
m_byte_order (eByteOrderInvalid)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2011-04-08 06:46:35 +08:00
|
|
|
ArchSpec::ArchSpec (const char *triple_cstr, Platform *platform) :
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple (),
|
|
|
|
m_core (kCore_invalid),
|
|
|
|
m_byte_order (eByteOrderInvalid)
|
2010-06-11 11:25:34 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (triple_cstr)
|
2011-04-08 06:46:35 +08:00
|
|
|
SetTriple(triple_cstr, platform);
|
2010-06-11 11:25:34 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
ArchSpec::ArchSpec(const llvm::Triple &triple) :
|
|
|
|
m_triple (),
|
|
|
|
m_core (kCore_invalid),
|
|
|
|
m_byte_order (eByteOrderInvalid)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
SetTriple(triple);
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-03-25 05:19:54 +08:00
|
|
|
ArchSpec::ArchSpec (ArchitectureType arch_type, uint32_t cpu, uint32_t subtype) :
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple (),
|
|
|
|
m_core (kCore_invalid),
|
|
|
|
m_byte_order (eByteOrderInvalid)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
SetArchitecture (arch_type, cpu, subtype);
|
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
ArchSpec::~ArchSpec()
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Assignment and initialization.
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
const ArchSpec&
|
|
|
|
ArchSpec::operator= (const ArchSpec& rhs)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (this != &rhs)
|
|
|
|
{
|
|
|
|
m_triple = rhs.m_triple;
|
|
|
|
m_core = rhs.m_core;
|
|
|
|
m_byte_order = rhs.m_byte_order;
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
void
|
|
|
|
ArchSpec::Clear()
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple = llvm::Triple();
|
|
|
|
m_core = kCore_invalid;
|
|
|
|
m_byte_order = eByteOrderInvalid;
|
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Predicates.
|
2010-06-09 00:52:24 +08:00
|
|
|
|
|
|
|
|
|
|
|
const char *
|
2011-02-23 08:35:02 +08:00
|
|
|
ArchSpec::GetArchitectureName () const
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->name;
|
|
|
|
return "unknown";
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
uint32_t
|
|
|
|
ArchSpec::GetMachOCPUType () const
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const ArchDefinitionEntry *arch_def = FindArchDefinitionEntry (&g_macho_arch_def, core_def->core);
|
|
|
|
if (arch_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
return arch_def->cpu;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
return LLDB_INVALID_CPUTYPE;
|
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
uint32_t
|
|
|
|
ArchSpec::GetMachOCPUSubType () const
|
|
|
|
{
|
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const ArchDefinitionEntry *arch_def = FindArchDefinitionEntry (&g_macho_arch_def, core_def->core);
|
|
|
|
if (arch_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-03-24 12:28:38 +08:00
|
|
|
return arch_def->sub;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
return LLDB_INVALID_CPUTYPE;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
llvm::Triple::ArchType
|
|
|
|
ArchSpec::GetMachine () const
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->machine;
|
|
|
|
|
|
|
|
return llvm::Triple::UnknownArch;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
uint32_t
|
|
|
|
ArchSpec::GetAddressByteSize() const
|
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->addr_byte_size;
|
2010-06-11 11:25:34 +08:00
|
|
|
return 0;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
ByteOrder
|
|
|
|
ArchSpec::GetDefaultEndian () const
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->default_byte_order;
|
|
|
|
return eByteOrderInvalid;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
lldb::ByteOrder
|
|
|
|
ArchSpec::GetByteOrder () const
|
2011-02-16 05:59:32 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (m_byte_order == eByteOrderInvalid)
|
|
|
|
return GetDefaultEndian();
|
|
|
|
return m_byte_order;
|
2011-02-16 05:59:32 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Mutators.
|
|
|
|
|
|
|
|
bool
|
|
|
|
ArchSpec::SetTriple (const llvm::Triple &triple)
|
2011-02-16 05:59:32 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple = triple;
|
2011-02-16 05:59:32 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
llvm::StringRef arch_name (m_triple.getArchName());
|
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (arch_name);
|
|
|
|
if (core_def)
|
2011-02-16 05:59:32 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_core = core_def->core;
|
2011-04-08 06:46:35 +08:00
|
|
|
// Set the byte order to the default byte order for an architecture.
|
|
|
|
// This can be modified if needed for cases when cores handle both
|
|
|
|
// big and little endian
|
|
|
|
m_byte_order = core_def->default_byte_order;
|
2011-02-16 05:59:32 +08:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
Clear();
|
2011-02-16 05:59:32 +08:00
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
|
|
|
|
return IsValid();
|
2011-02-16 05:59:32 +08:00
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
|
|
|
bool
|
2011-04-08 06:46:35 +08:00
|
|
|
ArchSpec::SetTriple (const char *triple_cstr, Platform *platform)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (triple_cstr || triple_cstr[0])
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
llvm::StringRef triple_stref (triple_cstr);
|
|
|
|
if (triple_stref.startswith (LLDB_ARCH_DEFAULT))
|
2011-02-16 05:59:32 +08:00
|
|
|
{
|
|
|
|
// Special case for the current host default architectures...
|
2011-02-23 08:35:02 +08:00
|
|
|
if (triple_stref.equals (LLDB_ARCH_DEFAULT_32BIT))
|
2011-02-16 05:59:32 +08:00
|
|
|
*this = Host::GetArchitecture (Host::eSystemDefaultArchitecture32);
|
2011-02-23 08:35:02 +08:00
|
|
|
else if (triple_stref.equals (LLDB_ARCH_DEFAULT_64BIT))
|
2011-02-16 05:59:32 +08:00
|
|
|
*this = Host::GetArchitecture (Host::eSystemDefaultArchitecture64);
|
2011-02-23 08:35:02 +08:00
|
|
|
else if (triple_stref.equals (LLDB_ARCH_DEFAULT))
|
2011-02-16 05:59:32 +08:00
|
|
|
*this = Host::GetArchitecture (Host::eSystemDefaultArchitecture);
|
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
else
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
std::string normalized_triple_sstr (llvm::Triple::normalize(triple_stref));
|
|
|
|
triple_stref = normalized_triple_sstr;
|
2011-04-08 06:46:35 +08:00
|
|
|
llvm::Triple normalized_triple (triple_stref);
|
|
|
|
|
|
|
|
const bool os_specified = normalized_triple.getOSName().size() > 0;
|
|
|
|
const bool vendor_specified = normalized_triple.getVendorName().size() > 0;
|
|
|
|
const bool env_specified = normalized_triple.getEnvironmentName().size() > 0;
|
|
|
|
|
|
|
|
// If we got an arch only, then default the vendor, os, environment
|
|
|
|
// to match the platform if one is supplied
|
|
|
|
if (!(os_specified || vendor_specified || env_specified))
|
|
|
|
{
|
|
|
|
if (platform)
|
|
|
|
{
|
|
|
|
// If we were given a platform, use the platform's system
|
|
|
|
// architecture. If this is not available (might not be
|
|
|
|
// connected) use the first supported architecture.
|
|
|
|
ArchSpec platform_arch (platform->GetSystemArchitecture());
|
|
|
|
if (!platform_arch.IsValid())
|
|
|
|
{
|
|
|
|
if (!platform->GetSupportedArchitectureAtIndex (0, platform_arch))
|
|
|
|
platform_arch.Clear();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (platform_arch.IsValid())
|
|
|
|
{
|
|
|
|
normalized_triple.setVendor(platform_arch.GetTriple().getVendor());
|
|
|
|
normalized_triple.setOS(platform_arch.GetTriple().getOS());
|
|
|
|
normalized_triple.setEnvironment(platform_arch.GetTriple().getEnvironment());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
// No platform specified, fall back to the host system for
|
|
|
|
// the default vendor, os, and environment.
|
|
|
|
llvm::Triple host_triple(llvm::sys::getHostTriple());
|
|
|
|
normalized_triple.setVendor(host_triple.getVendor());
|
|
|
|
normalized_triple.setOS(host_triple.getOS());
|
|
|
|
normalized_triple.setEnvironment(host_triple.getEnvironment());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
SetTriple (normalized_triple);
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
}
|
|
|
|
else
|
|
|
|
Clear();
|
|
|
|
return IsValid();
|
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
bool
|
2011-03-25 05:19:54 +08:00
|
|
|
ArchSpec::SetArchitecture (ArchitectureType arch_type, uint32_t cpu, uint32_t sub)
|
2011-02-23 08:35:02 +08:00
|
|
|
{
|
|
|
|
m_core = kCore_invalid;
|
|
|
|
bool update_triple = true;
|
|
|
|
const ArchDefinition *arch_def = FindArchDefinition(arch_type);
|
|
|
|
if (arch_def)
|
|
|
|
{
|
|
|
|
const ArchDefinitionEntry *arch_def_entry = FindArchDefinitionEntry (arch_def, cpu, sub);
|
|
|
|
if (arch_def_entry)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (arch_def_entry->core);
|
|
|
|
if (core_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_core = core_def->core;
|
|
|
|
update_triple = false;
|
|
|
|
m_triple.setArch (core_def->machine);
|
|
|
|
if (arch_type == eArchTypeMachO)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple.setVendor (llvm::Triple::Apple);
|
|
|
|
m_triple.setOS (llvm::Triple::Darwin);
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
else
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
m_triple.setVendor (llvm::Triple::UnknownVendor);
|
|
|
|
m_triple.setOS (llvm::Triple::UnknownOS);
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
2010-06-11 11:25:34 +08:00
|
|
|
}
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
}
|
2011-02-23 08:35:02 +08:00
|
|
|
CoreUpdated(update_triple);
|
|
|
|
return IsValid();
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
uint32_t
|
|
|
|
ArchSpec::GetMinimumOpcodeByteSize() const
|
|
|
|
{
|
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->min_opcode_byte_size;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint32_t
|
|
|
|
ArchSpec::GetMaximumOpcodeByteSize() const
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
Added the ability to get the min and max instruction byte size for
an architecture into ArchSpec:
uint32_t
ArchSpec::GetMinimumOpcodeByteSize() const;
uint32_t
ArchSpec::GetMaximumOpcodeByteSize() const;
Added an AddressClass to the Instruction class in Disassembler.h.
This allows decoded instructions to know know if they are code,
code with alternate ISA (thumb), or even data which can be mixed
into code. The instruction does have an address, but it is a good
idea to cache this value so we don't have to look it up more than
once.
Fixed an issue in Opcode::SetOpcodeBytes() where the length wasn't
getting set.
Changed:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc);
To:
bool
SymbolContextList::AppendIfUnique (const SymbolContext& sc,
bool merge_symbol_into_function);
This function was typically being used when looking up functions
and symbols. Now if you lookup a function, then find the symbol,
they can be merged into the same symbol context and not cause
multiple symbol contexts to appear in a symbol context list that
describes the same function.
Fixed the SymbolContext not equal operator which was causing mixed
mode disassembly to not work ("disassembler --mixed --name main").
Modified the disassembler classes to know about the fact we know,
for a given architecture, what the min and max opcode byte sizes
are. The InstructionList class was modified to return the max
opcode byte size for all of the instructions in its list.
These two fixes means when disassemble a list of instructions and dump
them and show the opcode bytes, we can format the output more
intelligently when showing opcode bytes. This affects any architectures
that have varying opcode byte sizes (x86_64 and i386). Knowing the max
opcode byte size also helps us to be able to disassemble N instructions
without having to re-read data if we didn't read enough bytes.
Added the ability to set the architecture for the disassemble command.
This means you can easily cross disassemble data for any supported
architecture. I also added the ability to specify "thumb" as an
architecture so that we can force disassembly into thumb mode when
needed. In GDB this was done using a hack of specifying an odd
address when disassembling. I don't want to repeat this hack in LLDB,
so the auto detection between ARM and thumb is failing, just specify
thumb when disassembling:
(lldb) disassemble --arch thumb --name main
You can also have data in say an x86_64 file executable and disassemble
data as any other supported architecture:
% lldb a.out
Current executable set to 'a.out' (x86_64).
(lldb) b main
(lldb) run
(lldb) disassemble --arch thumb --count 2 --start-address 0x0000000100001080 --bytes
0x100001080: 0xb580 push {r7, lr}
0x100001082: 0xaf00 add r7, sp, #0
Fixed Target::ReadMemory(...) to be able to deal with Address argument object
that isn't section offset. When an address object was supplied that was
out on the heap or stack, target read memory would fail. Disassembly uses
Target::ReadMemory(...), and the example above where we disassembler thumb
opcodes in an x86 binary was failing do to this bug.
llvm-svn: 128347
2011-03-27 03:14:58 +08:00
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
|
|
|
return core_def->max_opcode_byte_size;
|
|
|
|
return 0;
|
2011-02-23 08:35:02 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Helper methods.
|
|
|
|
|
|
|
|
void
|
|
|
|
ArchSpec::CoreUpdated (bool update_triple)
|
|
|
|
{
|
|
|
|
const CoreDefinition *core_def = FindCoreDefinition (m_core);
|
|
|
|
if (core_def)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if (update_triple)
|
|
|
|
m_triple = llvm::Triple(core_def->name, "unknown", "unknown");
|
|
|
|
m_byte_order = core_def->default_byte_order;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (update_triple)
|
|
|
|
m_triple = llvm::Triple();
|
|
|
|
m_byte_order = eByteOrderInvalid;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Operators.
|
|
|
|
|
2010-06-09 00:52:24 +08:00
|
|
|
bool
|
|
|
|
lldb_private::operator== (const ArchSpec& lhs, const ArchSpec& rhs)
|
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const ArchSpec::Core lhs_core = lhs.GetCore ();
|
|
|
|
const ArchSpec::Core rhs_core = rhs.GetCore ();
|
|
|
|
|
|
|
|
if (lhs_core == rhs_core)
|
|
|
|
return true;
|
2010-06-09 00:52:24 +08:00
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
if (lhs_core == ArchSpec::kCore_any || rhs_core == ArchSpec::kCore_any)
|
2010-06-09 00:52:24 +08:00
|
|
|
return true;
|
|
|
|
|
2011-02-23 08:35:02 +08:00
|
|
|
if (lhs_core == ArchSpec::kCore_arm_any)
|
|
|
|
{
|
|
|
|
if ((rhs_core >= ArchSpec::kCore_arm_first && rhs_core <= ArchSpec::kCore_arm_last) || (rhs_core == ArchSpec::kCore_arm_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (rhs_core == ArchSpec::kCore_arm_any)
|
|
|
|
{
|
|
|
|
if ((lhs_core >= ArchSpec::kCore_arm_first && lhs_core <= ArchSpec::kCore_arm_last) || (lhs_core == ArchSpec::kCore_arm_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (lhs_core == ArchSpec::kCore_x86_32_any)
|
|
|
|
{
|
|
|
|
if ((rhs_core >= ArchSpec::kCore_x86_32_first && rhs_core <= ArchSpec::kCore_x86_32_last) || (rhs_core == ArchSpec::kCore_x86_32_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (rhs_core == ArchSpec::kCore_x86_32_any)
|
2010-06-09 00:52:24 +08:00
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
if ((lhs_core >= ArchSpec::kCore_x86_32_first && lhs_core <= ArchSpec::kCore_x86_32_last) || (lhs_core == ArchSpec::kCore_x86_32_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (lhs_core == ArchSpec::kCore_ppc_any)
|
|
|
|
{
|
|
|
|
if ((rhs_core >= ArchSpec::kCore_ppc_first && rhs_core <= ArchSpec::kCore_ppc_last) || (rhs_core == ArchSpec::kCore_ppc_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (rhs_core == ArchSpec::kCore_ppc_any)
|
|
|
|
{
|
|
|
|
if ((lhs_core >= ArchSpec::kCore_ppc_first && lhs_core <= ArchSpec::kCore_ppc_last) || (lhs_core == ArchSpec::kCore_ppc_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (lhs_core == ArchSpec::kCore_ppc64_any)
|
|
|
|
{
|
|
|
|
if ((rhs_core >= ArchSpec::kCore_ppc64_first && rhs_core <= ArchSpec::kCore_ppc64_last) || (rhs_core == ArchSpec::kCore_ppc64_any))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (rhs_core == ArchSpec::kCore_ppc64_any)
|
|
|
|
{
|
|
|
|
if ((lhs_core >= ArchSpec::kCore_ppc64_first && lhs_core <= ArchSpec::kCore_ppc64_last) || (lhs_core == ArchSpec::kCore_ppc64_any))
|
2010-06-09 00:52:24 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool
|
|
|
|
lldb_private::operator!= (const ArchSpec& lhs, const ArchSpec& rhs)
|
|
|
|
{
|
|
|
|
return !(lhs == rhs);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool
|
|
|
|
lldb_private::operator<(const ArchSpec& lhs, const ArchSpec& rhs)
|
|
|
|
{
|
2011-02-23 08:35:02 +08:00
|
|
|
const ArchSpec::Core lhs_core = lhs.GetCore ();
|
|
|
|
const ArchSpec::Core rhs_core = rhs.GetCore ();
|
|
|
|
return lhs_core < rhs_core;
|
2010-06-09 00:52:24 +08:00
|
|
|
}
|