2017-04-22 06:03:05 +08:00
|
|
|
//===- MachOObjectFile.cpp - Mach-O object file binding -------------------===//
|
2011-04-22 11:19:48 +08:00
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2011-04-22 11:19:48 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file defines the MachOObjectFile class, which binds the MachOObject
|
|
|
|
// class to the generic ObjectFile wrapper.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/ADT/ArrayRef.h"
|
|
|
|
#include "llvm/ADT/None.h"
|
2014-03-29 18:18:08 +08:00
|
|
|
#include "llvm/ADT/STLExtras.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/ADT/SmallVector.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/ADT/StringRef.h"
|
2014-08-09 00:30:17 +08:00
|
|
|
#include "llvm/ADT/StringSwitch.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/ADT/Triple.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/ADT/Twine.h"
|
2017-06-07 11:48:56 +08:00
|
|
|
#include "llvm/BinaryFormat/MachO.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/Object/Error.h"
|
|
|
|
#include "llvm/Object/MachO.h"
|
|
|
|
#include "llvm/Object/ObjectFile.h"
|
|
|
|
#include "llvm/Object/SymbolicFile.h"
|
2013-04-08 04:01:29 +08:00
|
|
|
#include "llvm/Support/DataExtractor.h"
|
2014-09-13 05:34:15 +08:00
|
|
|
#include "llvm/Support/Debug.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/Support/Error.h"
|
|
|
|
#include "llvm/Support/ErrorHandling.h"
|
2011-10-27 04:42:54 +08:00
|
|
|
#include "llvm/Support/Format.h"
|
2013-04-19 02:08:55 +08:00
|
|
|
#include "llvm/Support/Host.h"
|
2014-08-30 08:20:14 +08:00
|
|
|
#include "llvm/Support/LEB128.h"
|
2011-04-22 11:19:48 +08:00
|
|
|
#include "llvm/Support/MemoryBuffer.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include "llvm/Support/SwapByteOrder.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/Support/raw_ostream.h"
|
2017-04-22 06:03:05 +08:00
|
|
|
#include <algorithm>
|
|
|
|
#include <cassert>
|
|
|
|
#include <cstddef>
|
|
|
|
#include <cstdint>
|
2011-04-22 11:19:48 +08:00
|
|
|
#include <cstring>
|
|
|
|
#include <limits>
|
2016-11-01 04:29:48 +08:00
|
|
|
#include <list>
|
2017-04-22 06:03:05 +08:00
|
|
|
#include <memory>
|
|
|
|
#include <string>
|
|
|
|
#include <system_error>
|
2011-04-22 11:19:48 +08:00
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
using namespace object;
|
|
|
|
|
2014-07-20 20:08:28 +08:00
|
|
|
namespace {
|
2017-04-22 06:03:05 +08:00
|
|
|
|
2014-07-20 20:08:28 +08:00
|
|
|
struct section_base {
|
|
|
|
char sectname[16];
|
|
|
|
char segname[16];
|
|
|
|
};
|
2017-04-22 06:03:05 +08:00
|
|
|
|
|
|
|
} // end anonymous namespace
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2017-08-20 23:13:39 +08:00
|
|
|
static Error malformedError(const Twine &Msg) {
|
|
|
|
return make_error<GenericBinaryError>("truncated or malformed object (" +
|
|
|
|
Msg + ")",
|
2016-05-06 07:41:05 +08:00
|
|
|
object_error::parse_failed);
|
2016-03-26 01:25:34 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 03:45:22 +08:00
|
|
|
// FIXME: Replace all uses of this function with getStructOrErr.
|
2015-01-16 06:52:38 +08:00
|
|
|
template <typename T>
|
2016-12-04 09:56:10 +08:00
|
|
|
static T getStruct(const MachOObjectFile &O, const char *P) {
|
2015-01-16 06:52:38 +08:00
|
|
|
// Don't read before the beginning or past the end of the file
|
2016-12-04 09:56:10 +08:00
|
|
|
if (P < O.getData().begin() || P + sizeof(T) > O.getData().end())
|
2015-01-16 06:52:38 +08:00
|
|
|
report_fatal_error("Malformed MachO file.");
|
|
|
|
|
2013-04-19 21:45:05 +08:00
|
|
|
T Cmd;
|
|
|
|
memcpy(&Cmd, P, sizeof(T));
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.isLittleEndian() != sys::IsLittleEndianHost)
|
2014-07-18 17:26:16 +08:00
|
|
|
MachO::swapStruct(Cmd);
|
2013-04-19 21:45:05 +08:00
|
|
|
return Cmd;
|
2012-03-01 09:36:50 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 03:45:22 +08:00
|
|
|
template <typename T>
|
2016-12-04 09:56:10 +08:00
|
|
|
static Expected<T> getStructOrErr(const MachOObjectFile &O, const char *P) {
|
2015-06-05 03:45:22 +08:00
|
|
|
// Don't read before the beginning or past the end of the file
|
2016-12-04 09:56:10 +08:00
|
|
|
if (P < O.getData().begin() || P + sizeof(T) > O.getData().end())
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("Structure read out-of-range");
|
2015-06-05 03:45:22 +08:00
|
|
|
|
|
|
|
T Cmd;
|
|
|
|
memcpy(&Cmd, P, sizeof(T));
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.isLittleEndian() != sys::IsLittleEndianHost)
|
2015-06-05 03:45:22 +08:00
|
|
|
MachO::swapStruct(Cmd);
|
|
|
|
return Cmd;
|
|
|
|
}
|
|
|
|
|
2013-04-27 04:07:33 +08:00
|
|
|
static const char *
|
2016-12-04 09:56:10 +08:00
|
|
|
getSectionPtr(const MachOObjectFile &O, MachOObjectFile::LoadCommandInfo L,
|
2013-04-27 04:07:33 +08:00
|
|
|
unsigned Sec) {
|
2013-04-19 02:08:55 +08:00
|
|
|
uintptr_t CommandAddr = reinterpret_cast<uintptr_t>(L.Ptr);
|
2011-04-22 11:19:48 +08:00
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
bool Is64 = O.is64Bit();
|
2013-09-01 12:28:48 +08:00
|
|
|
unsigned SegmentLoadSize = Is64 ? sizeof(MachO::segment_command_64) :
|
|
|
|
sizeof(MachO::segment_command);
|
|
|
|
unsigned SectionSize = Is64 ? sizeof(MachO::section_64) :
|
|
|
|
sizeof(MachO::section);
|
2013-04-19 02:08:55 +08:00
|
|
|
|
|
|
|
uintptr_t SectionAddr = CommandAddr + SegmentLoadSize + Sec * SectionSize;
|
2013-08-27 13:38:30 +08:00
|
|
|
return reinterpret_cast<const char*>(SectionAddr);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static const char *getPtr(const MachOObjectFile &O, size_t Offset) {
|
2018-06-05 01:01:20 +08:00
|
|
|
assert(Offset <= O.getData().size());
|
2018-05-30 11:37:26 +08:00
|
|
|
return O.getData().data() + Offset;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-07-18 17:26:16 +08:00
|
|
|
static MachO::nlist_base
|
2016-12-04 09:56:10 +08:00
|
|
|
getSymbolTableEntryBase(const MachOObjectFile &O, DataRefImpl DRI) {
|
2013-04-25 03:47:55 +08:00
|
|
|
const char *P = reinterpret_cast<const char *>(DRI.p);
|
2014-07-18 17:26:16 +08:00
|
|
|
return getStruct<MachO::nlist_base>(O, P);
|
2011-10-08 03:25:32 +08:00
|
|
|
}
|
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
static StringRef parseSegmentOrSectionName(const char *P) {
|
Add a function to get the segment name of a section.
On MachO, sections also have segment names. When a tool looking at a .o file
prints a segment name, this is what they mean. In reality, a .o has only one
anonymous, segment.
This patch adds a MachO only function to fetch that segment name. I named it
getSectionFinalSegmentName since the main use for the name seems to be inform
the linker with segment this section should go to.
The patch also changes MachOObjectFile::getSectionName to return just the
section name instead of computing SegmentName,SectionName.
The main difference from the previous patch is that it doesn't use
InMemoryStruct. It is extremely dangerous: if the endians match it returns
a pointer to the file buffer, if not, it returns a pointer to an internal buffer
that is overwritten in the next API call.
We should change all of this code to use
support::detail::packed_endian_specific_integral like ELF, but since these
functions only handle strings, they work with big and little endian machines
as is.
I have tested this by installing ubuntu 12.10 ppc on qemu, that is why it took
so long :-)
llvm-svn: 170838
2012-12-21 11:47:03 +08:00
|
|
|
if (P[15] == 0)
|
|
|
|
// Null terminated.
|
|
|
|
return P;
|
|
|
|
// Not null terminated, so this is a 16 char string.
|
|
|
|
return StringRef(P, 16);
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static unsigned getCPUType(const MachOObjectFile &O) {
|
|
|
|
return O.getHeader().cputype;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
static uint32_t
|
|
|
|
getPlainRelocationAddress(const MachO::any_relocation_info &RE) {
|
|
|
|
return RE.r_word0;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static unsigned
|
2013-09-01 12:28:48 +08:00
|
|
|
getScatteredRelocationAddress(const MachO::any_relocation_info &RE) {
|
|
|
|
return RE.r_word0 & 0xffffff;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static bool getPlainRelocationPCRel(const MachOObjectFile &O,
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.isLittleEndian())
|
2013-09-01 12:28:48 +08:00
|
|
|
return (RE.r_word1 >> 24) & 1;
|
|
|
|
return (RE.r_word1 >> 7) & 1;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static bool
|
2016-12-04 09:56:10 +08:00
|
|
|
getScatteredRelocationPCRel(const MachO::any_relocation_info &RE) {
|
2013-09-01 12:28:48 +08:00
|
|
|
return (RE.r_word0 >> 30) & 1;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static unsigned getPlainRelocationLength(const MachOObjectFile &O,
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.isLittleEndian())
|
2013-09-01 12:28:48 +08:00
|
|
|
return (RE.r_word1 >> 25) & 3;
|
|
|
|
return (RE.r_word1 >> 5) & 3;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static unsigned
|
2013-09-01 12:28:48 +08:00
|
|
|
getScatteredRelocationLength(const MachO::any_relocation_info &RE) {
|
|
|
|
return (RE.r_word0 >> 28) & 3;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static unsigned getPlainRelocationType(const MachOObjectFile &O,
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.isLittleEndian())
|
2013-09-01 12:28:48 +08:00
|
|
|
return RE.r_word1 >> 28;
|
|
|
|
return RE.r_word1 & 0xf;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static uint32_t getSectionFlags(const MachOObjectFile &O,
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl Sec) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (O.is64Bit()) {
|
|
|
|
MachO::section_64 Sect = O.getSection64(Sec);
|
2013-09-01 12:28:48 +08:00
|
|
|
return Sect.flags;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::section Sect = O.getSection(Sec);
|
2013-09-01 12:28:48 +08:00
|
|
|
return Sect.flags;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-03-26 01:25:34 +08:00
|
|
|
static Expected<MachOObjectFile::LoadCommandInfo>
|
2016-12-04 09:56:10 +08:00
|
|
|
getLoadCommandInfo(const MachOObjectFile &Obj, const char *Ptr,
|
2016-05-04 07:13:50 +08:00
|
|
|
uint32_t LoadCommandIndex) {
|
2016-03-26 01:25:34 +08:00
|
|
|
if (auto CmdOrErr = getStructOrErr<MachO::load_command>(Obj, Ptr)) {
|
2017-09-13 21:43:01 +08:00
|
|
|
if (CmdOrErr->cmdsize + Ptr > Obj.getData().end())
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" extends past end of file");
|
2016-03-26 01:25:34 +08:00
|
|
|
if (CmdOrErr->cmdsize < 8)
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2016-05-06 07:41:05 +08:00
|
|
|
" with size less than 8 bytes");
|
2016-03-26 01:25:34 +08:00
|
|
|
return MachOObjectFile::LoadCommandInfo({Ptr, *CmdOrErr});
|
|
|
|
} else
|
|
|
|
return CmdOrErr.takeError();
|
|
|
|
}
|
|
|
|
|
|
|
|
static Expected<MachOObjectFile::LoadCommandInfo>
|
2016-12-04 09:56:10 +08:00
|
|
|
getFirstLoadCommandInfo(const MachOObjectFile &Obj) {
|
|
|
|
unsigned HeaderSize = Obj.is64Bit() ? sizeof(MachO::mach_header_64)
|
|
|
|
: sizeof(MachO::mach_header);
|
|
|
|
if (sizeof(MachO::load_command) > Obj.getHeader().sizeofcmds)
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("load command 0 extends past the end all load "
|
2016-05-06 07:41:05 +08:00
|
|
|
"commands in the file");
|
2016-05-04 07:13:50 +08:00
|
|
|
return getLoadCommandInfo(Obj, getPtr(Obj, HeaderSize), 0);
|
2015-06-05 03:34:14 +08:00
|
|
|
}
|
|
|
|
|
2016-03-26 01:25:34 +08:00
|
|
|
static Expected<MachOObjectFile::LoadCommandInfo>
|
2016-12-04 09:56:10 +08:00
|
|
|
getNextLoadCommandInfo(const MachOObjectFile &Obj, uint32_t LoadCommandIndex,
|
2015-06-05 03:34:14 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &L) {
|
2016-12-04 09:56:10 +08:00
|
|
|
unsigned HeaderSize = Obj.is64Bit() ? sizeof(MachO::mach_header_64)
|
|
|
|
: sizeof(MachO::mach_header);
|
2016-09-01 01:57:46 +08:00
|
|
|
if (L.Ptr + L.C.cmdsize + sizeof(MachO::load_command) >
|
2016-12-04 09:56:10 +08:00
|
|
|
Obj.getData().data() + HeaderSize + Obj.getHeader().sizeofcmds)
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex + 1) +
|
2016-05-06 07:41:05 +08:00
|
|
|
" extends past the end all load commands in the file");
|
2016-05-04 07:13:50 +08:00
|
|
|
return getLoadCommandInfo(Obj, L.Ptr + L.C.cmdsize, LoadCommandIndex + 1);
|
2015-06-05 03:34:14 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 03:45:22 +08:00
|
|
|
template <typename T>
|
2016-12-04 09:56:10 +08:00
|
|
|
static void parseHeader(const MachOObjectFile &Obj, T &Header,
|
2016-03-26 01:25:34 +08:00
|
|
|
Error &Err) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (sizeof(T) > Obj.getData().size()) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("the mach header extends past the end of the "
|
2016-05-06 07:41:05 +08:00
|
|
|
"file");
|
2016-04-14 05:17:58 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-03-26 01:25:34 +08:00
|
|
|
if (auto HeaderOrErr = getStructOrErr<T>(Obj, getPtr(Obj, 0)))
|
|
|
|
Header = *HeaderOrErr;
|
2015-06-05 03:45:22 +08:00
|
|
|
else
|
2016-03-26 01:25:34 +08:00
|
|
|
Err = HeaderOrErr.takeError();
|
2015-06-05 03:45:22 +08:00
|
|
|
}
|
|
|
|
|
2016-11-01 04:29:48 +08:00
|
|
|
// This is used to check for overlapping of Mach-O elements.
|
|
|
|
struct MachOElement {
|
|
|
|
uint64_t Offset;
|
|
|
|
uint64_t Size;
|
|
|
|
const char *Name;
|
|
|
|
};
|
|
|
|
|
|
|
|
static Error checkOverlappingElement(std::list<MachOElement> &Elements,
|
|
|
|
uint64_t Offset, uint64_t Size,
|
|
|
|
const char *Name) {
|
|
|
|
if (Size == 0)
|
|
|
|
return Error::success();
|
|
|
|
|
|
|
|
for (auto it=Elements.begin() ; it != Elements.end(); ++it) {
|
|
|
|
auto E = *it;
|
|
|
|
if ((Offset >= E.Offset && Offset < E.Offset + E.Size) ||
|
|
|
|
(Offset + Size > E.Offset && Offset + Size < E.Offset + E.Size) ||
|
|
|
|
(Offset <= E.Offset && Offset + Size >= E.Offset + E.Size))
|
|
|
|
return malformedError(Twine(Name) + " at offset " + Twine(Offset) +
|
|
|
|
" with a size of " + Twine(Size) + ", overlaps " +
|
|
|
|
E.Name + " at offset " + Twine(E.Offset) + " with "
|
|
|
|
"a size of " + Twine(E.Size));
|
|
|
|
auto nt = it;
|
|
|
|
nt++;
|
|
|
|
if (nt != Elements.end()) {
|
|
|
|
auto N = *nt;
|
|
|
|
if (Offset + Size <= N.Offset) {
|
|
|
|
Elements.insert(nt, {Offset, Size, Name});
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Elements.push_back({Offset, Size, Name});
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2015-06-05 06:08:37 +08:00
|
|
|
// Parses LC_SEGMENT or LC_SEGMENT_64 load command, adds addresses of all
|
|
|
|
// sections to \param Sections, and optionally sets
|
|
|
|
// \param IsPageZeroSegment to true.
|
2016-08-13 04:10:25 +08:00
|
|
|
template <typename Segment, typename Section>
|
2016-03-26 01:25:34 +08:00
|
|
|
static Error parseSegmentLoadCommand(
|
2016-12-04 09:56:10 +08:00
|
|
|
const MachOObjectFile &Obj, const MachOObjectFile::LoadCommandInfo &Load,
|
2016-05-06 01:43:35 +08:00
|
|
|
SmallVectorImpl<const char *> &Sections, bool &IsPageZeroSegment,
|
2016-11-03 05:08:39 +08:00
|
|
|
uint32_t LoadCommandIndex, const char *CmdName, uint64_t SizeOfHeaders,
|
|
|
|
std::list<MachOElement> &Elements) {
|
2016-08-13 04:10:25 +08:00
|
|
|
const unsigned SegmentLoadSize = sizeof(Segment);
|
2015-06-05 06:08:37 +08:00
|
|
|
if (Load.C.cmdsize < SegmentLoadSize)
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2016-05-06 07:41:05 +08:00
|
|
|
" " + CmdName + " cmdsize too small");
|
2016-08-13 04:10:25 +08:00
|
|
|
if (auto SegOrErr = getStructOrErr<Segment>(Obj, Load.Ptr)) {
|
|
|
|
Segment S = SegOrErr.get();
|
|
|
|
const unsigned SectionSize = sizeof(Section);
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-03-26 01:25:34 +08:00
|
|
|
if (S.nsects > std::numeric_limits<uint32_t>::max() / SectionSize ||
|
|
|
|
S.nsects * SectionSize > Load.C.cmdsize - SegmentLoadSize)
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2016-08-22 08:58:47 +08:00
|
|
|
" inconsistent cmdsize in " + CmdName +
|
2016-05-06 07:41:05 +08:00
|
|
|
" for the number of sections");
|
2016-03-26 01:25:34 +08:00
|
|
|
for (unsigned J = 0; J < S.nsects; ++J) {
|
|
|
|
const char *Sec = getSectionPtr(Obj, Load, J);
|
|
|
|
Sections.push_back(Sec);
|
2019-06-05 00:55:30 +08:00
|
|
|
auto SectionOrErr = getStructOrErr<Section>(Obj, Sec);
|
|
|
|
if (!SectionOrErr)
|
|
|
|
return SectionOrErr.takeError();
|
|
|
|
Section s = SectionOrErr.get();
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM &&
|
2016-08-13 04:10:25 +08:00
|
|
|
s.flags != MachO::S_ZEROFILL &&
|
|
|
|
s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
|
|
|
|
s.offset > FileSize)
|
|
|
|
return malformedError("offset field of section " + Twine(J) + " in " +
|
|
|
|
CmdName + " command " + Twine(LoadCommandIndex) +
|
|
|
|
" extends past the end of the file");
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM &&
|
2016-08-13 04:10:25 +08:00
|
|
|
s.flags != MachO::S_ZEROFILL &&
|
2016-08-22 08:58:04 +08:00
|
|
|
s.flags != MachO::S_THREAD_LOCAL_ZEROFILL && S.fileoff == 0 &&
|
|
|
|
s.offset < SizeOfHeaders && s.size != 0)
|
2016-08-13 04:10:25 +08:00
|
|
|
return malformedError("offset field of section " + Twine(J) + " in " +
|
|
|
|
CmdName + " command " + Twine(LoadCommandIndex) +
|
|
|
|
" not past the headers of the file");
|
|
|
|
uint64_t BigSize = s.offset;
|
|
|
|
BigSize += s.size;
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM &&
|
2016-08-13 04:10:25 +08:00
|
|
|
s.flags != MachO::S_ZEROFILL &&
|
|
|
|
s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
|
|
|
|
BigSize > FileSize)
|
|
|
|
return malformedError("offset field plus size field of section " +
|
|
|
|
Twine(J) + " in " + CmdName + " command " +
|
|
|
|
Twine(LoadCommandIndex) +
|
|
|
|
" extends past the end of the file");
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM &&
|
2016-08-13 04:10:25 +08:00
|
|
|
s.flags != MachO::S_ZEROFILL &&
|
|
|
|
s.flags != MachO::S_THREAD_LOCAL_ZEROFILL &&
|
|
|
|
s.size > S.filesize)
|
|
|
|
return malformedError("size field of section " +
|
|
|
|
Twine(J) + " in " + CmdName + " command " +
|
|
|
|
Twine(LoadCommandIndex) +
|
|
|
|
" greater than the segment");
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM && s.size != 0 &&
|
2016-08-22 08:58:04 +08:00
|
|
|
s.addr < S.vmaddr)
|
|
|
|
return malformedError("addr field of section " + Twine(J) + " in " +
|
|
|
|
CmdName + " command " + Twine(LoadCommandIndex) +
|
|
|
|
" less than the segment's vmaddr");
|
2016-08-13 04:10:25 +08:00
|
|
|
BigSize = s.addr;
|
|
|
|
BigSize += s.size;
|
|
|
|
uint64_t BigEnd = S.vmaddr;
|
|
|
|
BigEnd += S.vmsize;
|
|
|
|
if (S.vmsize != 0 && s.size != 0 && BigSize > BigEnd)
|
2016-08-22 08:58:04 +08:00
|
|
|
return malformedError("addr field plus size of section " + Twine(J) +
|
|
|
|
" in " + CmdName + " command " +
|
|
|
|
Twine(LoadCommandIndex) +
|
|
|
|
" greater than than "
|
2016-08-13 04:10:25 +08:00
|
|
|
"the segment's vmaddr plus vmsize");
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB_STUB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DSYM &&
|
2016-11-03 05:08:39 +08:00
|
|
|
s.flags != MachO::S_ZEROFILL &&
|
|
|
|
s.flags != MachO::S_THREAD_LOCAL_ZEROFILL)
|
|
|
|
if (Error Err = checkOverlappingElement(Elements, s.offset, s.size,
|
|
|
|
"section contents"))
|
|
|
|
return Err;
|
2016-08-13 04:10:25 +08:00
|
|
|
if (s.reloff > FileSize)
|
2016-08-22 08:58:04 +08:00
|
|
|
return malformedError("reloff field of section " + Twine(J) + " in " +
|
|
|
|
CmdName + " command " + Twine(LoadCommandIndex) +
|
2016-08-13 04:10:25 +08:00
|
|
|
" extends past the end of the file");
|
|
|
|
BigSize = s.nreloc;
|
|
|
|
BigSize *= sizeof(struct MachO::relocation_info);
|
|
|
|
BigSize += s.reloff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("reloff field plus nreloc field times sizeof("
|
|
|
|
"struct relocation_info) of section " +
|
|
|
|
Twine(J) + " in " + CmdName + " command " +
|
2016-08-22 08:58:04 +08:00
|
|
|
Twine(LoadCommandIndex) +
|
2016-08-13 04:10:25 +08:00
|
|
|
" extends past the end of the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, s.reloff, s.nreloc *
|
|
|
|
sizeof(struct
|
|
|
|
MachO::relocation_info),
|
|
|
|
"section relocation entries"))
|
|
|
|
return Err;
|
2016-03-26 01:25:34 +08:00
|
|
|
}
|
2016-08-06 02:19:40 +08:00
|
|
|
if (S.fileoff > FileSize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2016-08-22 08:58:47 +08:00
|
|
|
" fileoff field in " + CmdName +
|
2016-08-06 02:19:40 +08:00
|
|
|
" extends past the end of the file");
|
2016-08-13 04:10:25 +08:00
|
|
|
uint64_t BigSize = S.fileoff;
|
|
|
|
BigSize += S.filesize;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" fileoff field plus filesize field in " +
|
|
|
|
CmdName + " extends past the end of the file");
|
|
|
|
if (S.vmsize != 0 && S.filesize > S.vmsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2017-02-08 05:20:44 +08:00
|
|
|
" filesize field in " + CmdName +
|
2016-08-13 04:10:25 +08:00
|
|
|
" greater than vmsize field");
|
2016-03-26 01:25:34 +08:00
|
|
|
IsPageZeroSegment |= StringRef("__PAGEZERO").equals(S.segname);
|
|
|
|
} else
|
|
|
|
return SegOrErr.takeError();
|
|
|
|
|
|
|
|
return Error::success();
|
2015-06-05 06:08:37 +08:00
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkSymtabCommand(const MachOObjectFile &Obj,
|
2016-08-27 03:34:07 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
2016-11-01 04:29:48 +08:00
|
|
|
const char **SymtabLoadCmd,
|
|
|
|
std::list<MachOElement> &Elements) {
|
2016-08-27 03:34:07 +08:00
|
|
|
if (Load.C.cmdsize < sizeof(MachO::symtab_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_SYMTAB cmdsize too small");
|
|
|
|
if (*SymtabLoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_SYMTAB command");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto SymtabOrErr = getStructOrErr<MachO::symtab_command>(Obj, Load.Ptr);
|
|
|
|
if (!SymtabOrErr)
|
|
|
|
return SymtabOrErr.takeError();
|
|
|
|
MachO::symtab_command Symtab = SymtabOrErr.get();
|
2016-08-27 03:34:07 +08:00
|
|
|
if (Symtab.cmdsize != sizeof(MachO::symtab_command))
|
|
|
|
return malformedError("LC_SYMTAB command " + Twine(LoadCommandIndex) +
|
|
|
|
" has incorrect cmdsize");
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-08-27 03:34:07 +08:00
|
|
|
if (Symtab.symoff > FileSize)
|
|
|
|
return malformedError("symoff field of LC_SYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end "
|
|
|
|
"of the file");
|
2016-11-01 04:29:48 +08:00
|
|
|
uint64_t SymtabSize = Symtab.nsyms;
|
2016-08-27 03:34:07 +08:00
|
|
|
const char *struct_nlist_name;
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.is64Bit()) {
|
2016-11-01 04:29:48 +08:00
|
|
|
SymtabSize *= sizeof(MachO::nlist_64);
|
2016-08-27 03:34:07 +08:00
|
|
|
struct_nlist_name = "struct nlist_64";
|
|
|
|
} else {
|
2016-11-01 04:29:48 +08:00
|
|
|
SymtabSize *= sizeof(MachO::nlist);
|
2016-08-27 03:34:07 +08:00
|
|
|
struct_nlist_name = "struct nlist";
|
|
|
|
}
|
2016-11-01 04:29:48 +08:00
|
|
|
uint64_t BigSize = SymtabSize;
|
2016-08-27 03:34:07 +08:00
|
|
|
BigSize += Symtab.symoff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("symoff field plus nsyms field times sizeof(" +
|
|
|
|
Twine(struct_nlist_name) + ") of LC_SYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end "
|
|
|
|
"of the file");
|
2016-11-01 04:29:48 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Symtab.symoff, SymtabSize,
|
|
|
|
"symbol table"))
|
|
|
|
return Err;
|
2016-08-27 03:34:07 +08:00
|
|
|
if (Symtab.stroff > FileSize)
|
|
|
|
return malformedError("stroff field of LC_SYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end "
|
|
|
|
"of the file");
|
|
|
|
BigSize = Symtab.stroff;
|
|
|
|
BigSize += Symtab.strsize;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("stroff field plus strsize field of LC_SYMTAB "
|
|
|
|
"command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
2016-11-01 04:29:48 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Symtab.stroff,
|
|
|
|
Symtab.strsize, "string table"))
|
|
|
|
return Err;
|
2016-08-27 03:34:07 +08:00
|
|
|
*SymtabLoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkDysymtabCommand(const MachOObjectFile &Obj,
|
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
const char **DysymtabLoadCmd,
|
|
|
|
std::list<MachOElement> &Elements) {
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Load.C.cmdsize < sizeof(MachO::dysymtab_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_DYSYMTAB cmdsize too small");
|
|
|
|
if (*DysymtabLoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_DYSYMTAB command");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DysymtabOrErr =
|
|
|
|
getStructOrErr<MachO::dysymtab_command>(Obj, Load.Ptr);
|
|
|
|
if (!DysymtabOrErr)
|
|
|
|
return DysymtabOrErr.takeError();
|
|
|
|
MachO::dysymtab_command Dysymtab = DysymtabOrErr.get();
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.cmdsize != sizeof(MachO::dysymtab_command))
|
|
|
|
return malformedError("LC_DYSYMTAB command " + Twine(LoadCommandIndex) +
|
|
|
|
" has incorrect cmdsize");
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.tocoff > FileSize)
|
|
|
|
return malformedError("tocoff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
uint64_t BigSize = Dysymtab.ntoc;
|
|
|
|
BigSize *= sizeof(MachO::dylib_table_of_contents);
|
|
|
|
BigSize += Dysymtab.tocoff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("tocoff field plus ntoc field times sizeof(struct "
|
|
|
|
"dylib_table_of_contents) of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.tocoff,
|
|
|
|
Dysymtab.ntoc * sizeof(struct
|
2017-10-18 21:31:28 +08:00
|
|
|
MachO::dylib_table_of_contents),
|
|
|
|
"table of contents"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.modtaboff > FileSize)
|
|
|
|
return malformedError("modtaboff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
BigSize = Dysymtab.nmodtab;
|
|
|
|
const char *struct_dylib_module_name;
|
2016-11-03 05:08:39 +08:00
|
|
|
uint64_t sizeof_modtab;
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.is64Bit()) {
|
2016-11-03 05:08:39 +08:00
|
|
|
sizeof_modtab = sizeof(MachO::dylib_module_64);
|
2016-08-31 05:28:30 +08:00
|
|
|
struct_dylib_module_name = "struct dylib_module_64";
|
|
|
|
} else {
|
2016-11-03 05:08:39 +08:00
|
|
|
sizeof_modtab = sizeof(MachO::dylib_module);
|
2016-08-31 05:28:30 +08:00
|
|
|
struct_dylib_module_name = "struct dylib_module";
|
|
|
|
}
|
2016-11-03 05:08:39 +08:00
|
|
|
BigSize *= sizeof_modtab;
|
2016-08-31 05:28:30 +08:00
|
|
|
BigSize += Dysymtab.modtaboff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("modtaboff field plus nmodtab field times sizeof(" +
|
|
|
|
Twine(struct_dylib_module_name) + ") of LC_DYSYMTAB "
|
|
|
|
"command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.modtaboff,
|
|
|
|
Dysymtab.nmodtab * sizeof_modtab,
|
2017-08-28 14:47:47 +08:00
|
|
|
"module table"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.extrefsymoff > FileSize)
|
|
|
|
return malformedError("extrefsymoff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
BigSize = Dysymtab.nextrefsyms;
|
|
|
|
BigSize *= sizeof(MachO::dylib_reference);
|
|
|
|
BigSize += Dysymtab.extrefsymoff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("extrefsymoff field plus nextrefsyms field times "
|
|
|
|
"sizeof(struct dylib_reference) of LC_DYSYMTAB "
|
|
|
|
"command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.extrefsymoff,
|
|
|
|
Dysymtab.nextrefsyms *
|
2017-08-28 14:47:47 +08:00
|
|
|
sizeof(MachO::dylib_reference),
|
|
|
|
"reference table"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.indirectsymoff > FileSize)
|
|
|
|
return malformedError("indirectsymoff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
BigSize = Dysymtab.nindirectsyms;
|
|
|
|
BigSize *= sizeof(uint32_t);
|
|
|
|
BigSize += Dysymtab.indirectsymoff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("indirectsymoff field plus nindirectsyms field times "
|
|
|
|
"sizeof(uint32_t) of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.indirectsymoff,
|
|
|
|
Dysymtab.nindirectsyms *
|
|
|
|
sizeof(uint32_t),
|
2017-10-18 21:31:28 +08:00
|
|
|
"indirect table"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.extreloff > FileSize)
|
|
|
|
return malformedError("extreloff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
BigSize = Dysymtab.nextrel;
|
|
|
|
BigSize *= sizeof(MachO::relocation_info);
|
|
|
|
BigSize += Dysymtab.extreloff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("extreloff field plus nextrel field times sizeof"
|
|
|
|
"(struct relocation_info) of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.extreloff,
|
|
|
|
Dysymtab.nextrel *
|
2017-08-28 14:47:47 +08:00
|
|
|
sizeof(MachO::relocation_info),
|
|
|
|
"external relocation table"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
if (Dysymtab.locreloff > FileSize)
|
|
|
|
return malformedError("locreloff field of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
BigSize = Dysymtab.nlocrel;
|
|
|
|
BigSize *= sizeof(MachO::relocation_info);
|
|
|
|
BigSize += Dysymtab.locreloff;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("locreloff field plus nlocrel field times sizeof"
|
|
|
|
"(struct relocation_info) of LC_DYSYMTAB command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Dysymtab.locreloff,
|
|
|
|
Dysymtab.nlocrel *
|
2017-08-28 14:47:47 +08:00
|
|
|
sizeof(MachO::relocation_info),
|
|
|
|
"local relocation table"))
|
2016-11-03 05:08:39 +08:00
|
|
|
return Err;
|
2016-08-31 05:28:30 +08:00
|
|
|
*DysymtabLoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkLinkeditDataCommand(const MachOObjectFile &Obj,
|
2016-09-01 01:57:46 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
2016-11-03 05:08:39 +08:00
|
|
|
const char **LoadCmd, const char *CmdName,
|
|
|
|
std::list<MachOElement> &Elements,
|
|
|
|
const char *ElementName) {
|
2016-09-01 01:57:46 +08:00
|
|
|
if (Load.C.cmdsize < sizeof(MachO::linkedit_data_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " cmdsize too small");
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one " + Twine(CmdName) + " command");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto LinkDataOrError =
|
|
|
|
getStructOrErr<MachO::linkedit_data_command>(Obj, Load.Ptr);
|
|
|
|
if (!LinkDataOrError)
|
|
|
|
return LinkDataOrError.takeError();
|
|
|
|
MachO::linkedit_data_command LinkData = LinkDataOrError.get();
|
2016-09-01 01:57:46 +08:00
|
|
|
if (LinkData.cmdsize != sizeof(MachO::linkedit_data_command))
|
|
|
|
return malformedError(Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " has incorrect cmdsize");
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-09-01 01:57:46 +08:00
|
|
|
if (LinkData.dataoff > FileSize)
|
|
|
|
return malformedError("dataoff field of " + Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
uint64_t BigSize = LinkData.dataoff;
|
|
|
|
BigSize += LinkData.datasize;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("dataoff field plus datasize field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, LinkData.dataoff,
|
|
|
|
LinkData.datasize, ElementName))
|
|
|
|
return Err;
|
2016-09-01 01:57:46 +08:00
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkDyldInfoCommand(const MachOObjectFile &Obj,
|
2016-09-14 05:42:28 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
2016-11-03 05:08:39 +08:00
|
|
|
const char **LoadCmd, const char *CmdName,
|
|
|
|
std::list<MachOElement> &Elements) {
|
2016-09-14 05:42:28 +08:00
|
|
|
if (Load.C.cmdsize < sizeof(MachO::dyld_info_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " cmdsize too small");
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_DYLD_INFO and or LC_DYLD_INFO_ONLY "
|
|
|
|
"command");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(Obj, Load.Ptr);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return DyldInfoOrErr.takeError();
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.cmdsize != sizeof(MachO::dyld_info_command))
|
|
|
|
return malformedError(Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " has incorrect cmdsize");
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.rebase_off > FileSize)
|
|
|
|
return malformedError("rebase_off field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
uint64_t BigSize = DyldInfo.rebase_off;
|
|
|
|
BigSize += DyldInfo.rebase_size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("rebase_off field plus rebase_size field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, DyldInfo.rebase_off,
|
|
|
|
DyldInfo.rebase_size,
|
|
|
|
"dyld rebase info"))
|
|
|
|
return Err;
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.bind_off > FileSize)
|
|
|
|
return malformedError("bind_off field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
BigSize = DyldInfo.bind_off;
|
|
|
|
BigSize += DyldInfo.bind_size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("bind_off field plus bind_size field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, DyldInfo.bind_off,
|
|
|
|
DyldInfo.bind_size,
|
|
|
|
"dyld bind info"))
|
|
|
|
return Err;
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.weak_bind_off > FileSize)
|
|
|
|
return malformedError("weak_bind_off field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
BigSize = DyldInfo.weak_bind_off;
|
|
|
|
BigSize += DyldInfo.weak_bind_size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("weak_bind_off field plus weak_bind_size field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, DyldInfo.weak_bind_off,
|
|
|
|
DyldInfo.weak_bind_size,
|
|
|
|
"dyld weak bind info"))
|
|
|
|
return Err;
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.lazy_bind_off > FileSize)
|
|
|
|
return malformedError("lazy_bind_off field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
BigSize = DyldInfo.lazy_bind_off;
|
|
|
|
BigSize += DyldInfo.lazy_bind_size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("lazy_bind_off field plus lazy_bind_size field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, DyldInfo.lazy_bind_off,
|
|
|
|
DyldInfo.lazy_bind_size,
|
|
|
|
"dyld lazy bind info"))
|
|
|
|
return Err;
|
2016-09-14 05:42:28 +08:00
|
|
|
if (DyldInfo.export_off > FileSize)
|
|
|
|
return malformedError("export_off field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
BigSize = DyldInfo.export_off;
|
|
|
|
BigSize += DyldInfo.export_size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("export_off field plus export_size field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, DyldInfo.export_off,
|
|
|
|
DyldInfo.export_size,
|
|
|
|
"dyld export info"))
|
|
|
|
return Err;
|
2016-09-14 05:42:28 +08:00
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkDylibCommand(const MachOObjectFile &Obj,
|
2016-09-21 04:14:14 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex, const char *CmdName) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::dylib_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " cmdsize too small");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto CommandOrErr = getStructOrErr<MachO::dylib_command>(Obj, Load.Ptr);
|
|
|
|
if (!CommandOrErr)
|
|
|
|
return CommandOrErr.takeError();
|
|
|
|
MachO::dylib_command D = CommandOrErr.get();
|
2016-09-21 04:14:14 +08:00
|
|
|
if (D.dylib.name < sizeof(MachO::dylib_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " name.offset field too small, not past "
|
|
|
|
"the end of the dylib_command struct");
|
|
|
|
if (D.dylib.name >= D.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " name.offset field extends past the end "
|
|
|
|
"of the load command");
|
|
|
|
// Make sure there is a null between the starting offset of the name and
|
|
|
|
// the end of the load command.
|
|
|
|
uint32_t i;
|
|
|
|
const char *P = (const char *)Load.Ptr;
|
|
|
|
for (i = D.dylib.name; i < D.cmdsize; i++)
|
|
|
|
if (P[i] == '\0')
|
|
|
|
break;
|
|
|
|
if (i >= D.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " library name extends past the end of the "
|
|
|
|
"load command");
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkDylibIdCommand(const MachOObjectFile &Obj,
|
2016-09-21 04:14:14 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
const char **LoadCmd) {
|
|
|
|
if (Error Err = checkDylibCommand(Obj, Load, LoadCommandIndex,
|
|
|
|
"LC_ID_DYLIB"))
|
|
|
|
return Err;
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_ID_DYLIB command");
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.getHeader().filetype != MachO::MH_DYLIB &&
|
|
|
|
Obj.getHeader().filetype != MachO::MH_DYLIB_STUB)
|
2016-09-21 04:14:14 +08:00
|
|
|
return malformedError("LC_ID_DYLIB load command in non-dynamic library "
|
|
|
|
"file type");
|
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkDyldCommand(const MachOObjectFile &Obj,
|
2016-09-28 07:24:13 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex, const char *CmdName) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::dylinker_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " cmdsize too small");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto CommandOrErr = getStructOrErr<MachO::dylinker_command>(Obj, Load.Ptr);
|
|
|
|
if (!CommandOrErr)
|
|
|
|
return CommandOrErr.takeError();
|
|
|
|
MachO::dylinker_command D = CommandOrErr.get();
|
2016-09-28 07:24:13 +08:00
|
|
|
if (D.name < sizeof(MachO::dylinker_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " name.offset field too small, not past "
|
|
|
|
"the end of the dylinker_command struct");
|
|
|
|
if (D.name >= D.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " name.offset field extends past the end "
|
|
|
|
"of the load command");
|
|
|
|
// Make sure there is a null between the starting offset of the name and
|
|
|
|
// the end of the load command.
|
|
|
|
uint32_t i;
|
|
|
|
const char *P = (const char *)Load.Ptr;
|
|
|
|
for (i = D.name; i < D.cmdsize; i++)
|
|
|
|
if (P[i] == '\0')
|
|
|
|
break;
|
|
|
|
if (i >= D.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " dyld name extends past the end of the "
|
|
|
|
"load command");
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkVersCommand(const MachOObjectFile &Obj,
|
2016-09-29 05:20:45 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
const char **LoadCmd, const char *CmdName) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::version_min_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " has incorrect cmdsize");
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_VERSION_MIN_MACOSX, "
|
|
|
|
"LC_VERSION_MIN_IPHONEOS, LC_VERSION_MIN_TVOS or "
|
|
|
|
"LC_VERSION_MIN_WATCHOS command");
|
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2017-01-20 01:36:31 +08:00
|
|
|
static Error checkNoteCommand(const MachOObjectFile &Obj,
|
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
std::list<MachOElement> &Elements) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::note_command))
|
2017-09-13 21:43:01 +08:00
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
2017-01-20 01:36:31 +08:00
|
|
|
" LC_NOTE has incorrect cmdsize");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto NoteCmdOrErr = getStructOrErr<MachO::note_command>(Obj, Load.Ptr);
|
|
|
|
if (!NoteCmdOrErr)
|
|
|
|
return NoteCmdOrErr.takeError();
|
|
|
|
MachO::note_command Nt = NoteCmdOrErr.get();
|
2017-01-20 01:36:31 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
|
|
|
if (Nt.offset > FileSize)
|
|
|
|
return malformedError("offset field of LC_NOTE command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
uint64_t BigSize = Nt.offset;
|
|
|
|
BigSize += Nt.size;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("size field plus offset field of LC_NOTE command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
if (Error Err = checkOverlappingElement(Elements, Nt.offset, Nt.size,
|
|
|
|
"LC_NOTE data"))
|
|
|
|
return Err;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2017-01-24 04:07:55 +08:00
|
|
|
static Error
|
|
|
|
parseBuildVersionCommand(const MachOObjectFile &Obj,
|
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
SmallVectorImpl<const char*> &BuildTools,
|
|
|
|
uint32_t LoadCommandIndex) {
|
2019-06-05 00:55:30 +08:00
|
|
|
auto BVCOrErr =
|
|
|
|
getStructOrErr<MachO::build_version_command>(Obj, Load.Ptr);
|
|
|
|
if (!BVCOrErr)
|
|
|
|
return BVCOrErr.takeError();
|
|
|
|
MachO::build_version_command BVC = BVCOrErr.get();
|
2017-01-24 04:07:55 +08:00
|
|
|
if (Load.C.cmdsize !=
|
|
|
|
sizeof(MachO::build_version_command) +
|
|
|
|
BVC.ntools * sizeof(MachO::build_tool_version))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_BUILD_VERSION_COMMAND has incorrect cmdsize");
|
|
|
|
|
|
|
|
auto Start = Load.Ptr + sizeof(MachO::build_version_command);
|
|
|
|
BuildTools.resize(BVC.ntools);
|
|
|
|
for (unsigned i = 0; i < BVC.ntools; ++i)
|
|
|
|
BuildTools[i] = Start + i * sizeof(MachO::build_tool_version);
|
|
|
|
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkRpathCommand(const MachOObjectFile &Obj,
|
2016-09-29 07:16:01 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::rpath_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_RPATH cmdsize too small");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto ROrErr = getStructOrErr<MachO::rpath_command>(Obj, Load.Ptr);
|
|
|
|
if (!ROrErr)
|
|
|
|
return ROrErr.takeError();
|
|
|
|
MachO::rpath_command R = ROrErr.get();
|
2016-09-29 07:16:01 +08:00
|
|
|
if (R.path < sizeof(MachO::rpath_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_RPATH path.offset field too small, not past "
|
|
|
|
"the end of the rpath_command struct");
|
|
|
|
if (R.path >= R.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_RPATH path.offset field extends past the end "
|
|
|
|
"of the load command");
|
|
|
|
// Make sure there is a null between the starting offset of the path and
|
|
|
|
// the end of the load command.
|
|
|
|
uint32_t i;
|
|
|
|
const char *P = (const char *)Load.Ptr;
|
|
|
|
for (i = R.path; i < R.cmdsize; i++)
|
|
|
|
if (P[i] == '\0')
|
|
|
|
break;
|
|
|
|
if (i >= R.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_RPATH library name extends past the end of the "
|
|
|
|
"load command");
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkEncryptCommand(const MachOObjectFile &Obj,
|
2016-10-05 04:37:43 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
uint64_t cryptoff, uint64_t cryptsize,
|
|
|
|
const char **LoadCmd, const char *CmdName) {
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_ENCRYPTION_INFO and or "
|
|
|
|
"LC_ENCRYPTION_INFO_64 command");
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-10-05 04:37:43 +08:00
|
|
|
if (cryptoff > FileSize)
|
|
|
|
return malformedError("cryptoff field of " + Twine(CmdName) +
|
|
|
|
" command " + Twine(LoadCommandIndex) + " extends "
|
|
|
|
"past the end of the file");
|
|
|
|
uint64_t BigSize = cryptoff;
|
|
|
|
BigSize += cryptsize;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("cryptoff field plus cryptsize field of " +
|
|
|
|
Twine(CmdName) + " command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkLinkerOptCommand(const MachOObjectFile &Obj,
|
2016-10-12 05:04:39 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::linker_option_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_LINKER_OPTION cmdsize too small");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto LinkOptionOrErr =
|
|
|
|
getStructOrErr<MachO::linker_option_command>(Obj, Load.Ptr);
|
|
|
|
if (!LinkOptionOrErr)
|
|
|
|
return LinkOptionOrErr.takeError();
|
|
|
|
MachO::linker_option_command L = LinkOptionOrErr.get();
|
2016-10-12 05:04:39 +08:00
|
|
|
// Make sure the count of strings is correct.
|
|
|
|
const char *string = (const char *)Load.Ptr +
|
|
|
|
sizeof(struct MachO::linker_option_command);
|
|
|
|
uint32_t left = L.cmdsize - sizeof(struct MachO::linker_option_command);
|
|
|
|
uint32_t i = 0;
|
|
|
|
while (left > 0) {
|
|
|
|
while (*string == '\0' && left > 0) {
|
|
|
|
string++;
|
|
|
|
left--;
|
|
|
|
}
|
|
|
|
if (left > 0) {
|
|
|
|
i++;
|
|
|
|
uint32_t NullPos = StringRef(string, left).find('\0');
|
2019-03-12 02:29:25 +08:00
|
|
|
if (0xffffffff == NullPos)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_LINKER_OPTION string #" + Twine(i) +
|
|
|
|
" is not NULL terminated");
|
2016-10-12 05:04:39 +08:00
|
|
|
uint32_t len = std::min(NullPos, left) + 1;
|
|
|
|
string += len;
|
|
|
|
left -= len;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (L.count != i)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_LINKER_OPTION string count " + Twine(L.count) +
|
|
|
|
" does not match number of strings");
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkSubCommand(const MachOObjectFile &Obj,
|
2016-10-18 06:09:25 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex, const char *CmdName,
|
|
|
|
size_t SizeOfCmd, const char *CmdStructName,
|
|
|
|
uint32_t PathOffset, const char *PathFieldName) {
|
|
|
|
if (PathOffset < SizeOfCmd)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " " + PathFieldName + ".offset field too "
|
|
|
|
"small, not past the end of the " + CmdStructName);
|
|
|
|
if (PathOffset >= Load.C.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " " + PathFieldName + ".offset field "
|
|
|
|
"extends past the end of the load command");
|
|
|
|
// Make sure there is a null between the starting offset of the path and
|
|
|
|
// the end of the load command.
|
|
|
|
uint32_t i;
|
|
|
|
const char *P = (const char *)Load.Ptr;
|
|
|
|
for (i = PathOffset; i < Load.C.cmdsize; i++)
|
|
|
|
if (P[i] == '\0')
|
|
|
|
break;
|
|
|
|
if (i >= Load.C.cmdsize)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) + " " +
|
|
|
|
CmdName + " " + PathFieldName + " name extends past "
|
|
|
|
"the end of the load command");
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkThreadCommand(const MachOObjectFile &Obj,
|
2016-10-20 07:44:34 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo &Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
|
|
|
const char *CmdName) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::thread_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
CmdName + " cmdsize too small");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto ThreadCommandOrErr =
|
|
|
|
getStructOrErr<MachO::thread_command>(Obj, Load.Ptr);
|
|
|
|
if (!ThreadCommandOrErr)
|
|
|
|
return ThreadCommandOrErr.takeError();
|
|
|
|
MachO::thread_command T = ThreadCommandOrErr.get();
|
2016-10-20 07:44:34 +08:00
|
|
|
const char *state = Load.Ptr + sizeof(MachO::thread_command);
|
|
|
|
const char *end = Load.Ptr + T.cmdsize;
|
|
|
|
uint32_t nflavor = 0;
|
|
|
|
uint32_t cputype = getCPUType(Obj);
|
|
|
|
while (state < end) {
|
|
|
|
if(state + sizeof(uint32_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
"flavor in " + CmdName + " extends past end of "
|
|
|
|
"command");
|
|
|
|
uint32_t flavor;
|
|
|
|
memcpy(&flavor, state, sizeof(uint32_t));
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.isLittleEndian() != sys::IsLittleEndianHost)
|
2016-10-20 07:44:34 +08:00
|
|
|
sys::swapByteOrder(flavor);
|
|
|
|
state += sizeof(uint32_t);
|
|
|
|
|
|
|
|
if(state + sizeof(uint32_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count in " + CmdName + " extends past end of "
|
|
|
|
"command");
|
|
|
|
uint32_t count;
|
|
|
|
memcpy(&count, state, sizeof(uint32_t));
|
2016-12-04 09:56:10 +08:00
|
|
|
if (Obj.isLittleEndian() != sys::IsLittleEndianHost)
|
2016-10-20 07:44:34 +08:00
|
|
|
sys::swapByteOrder(count);
|
|
|
|
state += sizeof(uint32_t);
|
|
|
|
|
2017-01-24 05:13:29 +08:00
|
|
|
if (cputype == MachO::CPU_TYPE_I386) {
|
|
|
|
if (flavor == MachO::x86_THREAD_STATE32) {
|
|
|
|
if (count != MachO::x86_THREAD_STATE32_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_THREAD_STATE32_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_THREAD_STATE32 flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_thread_state32_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_THREAD_STATE32 extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_thread_state32_t);
|
|
|
|
} else {
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" unknown flavor (" + Twine(flavor) + ") for "
|
|
|
|
"flavor number " + Twine(nflavor) + " in " +
|
|
|
|
CmdName + " command");
|
|
|
|
}
|
|
|
|
} else if (cputype == MachO::CPU_TYPE_X86_64) {
|
2018-03-09 07:10:38 +08:00
|
|
|
if (flavor == MachO::x86_THREAD_STATE) {
|
|
|
|
if (count != MachO::x86_THREAD_STATE_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_THREAD_STATE_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_THREAD_STATE flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_thread_state_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_THREAD_STATE extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_thread_state_t);
|
|
|
|
} else if (flavor == MachO::x86_FLOAT_STATE) {
|
|
|
|
if (count != MachO::x86_FLOAT_STATE_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_FLOAT_STATE_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_FLOAT_STATE flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_float_state_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_FLOAT_STATE extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_float_state_t);
|
|
|
|
} else if (flavor == MachO::x86_EXCEPTION_STATE) {
|
|
|
|
if (count != MachO::x86_EXCEPTION_STATE_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_EXCEPTION_STATE_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_EXCEPTION_STATE flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_exception_state_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_EXCEPTION_STATE extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_exception_state_t);
|
|
|
|
} else if (flavor == MachO::x86_THREAD_STATE64) {
|
2016-10-20 07:44:34 +08:00
|
|
|
if (count != MachO::x86_THREAD_STATE64_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_THREAD_STATE64_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_THREAD_STATE64 flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_thread_state64_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_THREAD_STATE64 extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_thread_state64_t);
|
2018-03-09 07:10:38 +08:00
|
|
|
} else if (flavor == MachO::x86_EXCEPTION_STATE64) {
|
|
|
|
if (count != MachO::x86_EXCEPTION_STATE64_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not x86_EXCEPTION_STATE64_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a x86_EXCEPTION_STATE64 flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::x86_exception_state64_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" x86_EXCEPTION_STATE64 extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::x86_exception_state64_t);
|
2016-10-20 07:44:34 +08:00
|
|
|
} else {
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" unknown flavor (" + Twine(flavor) + ") for "
|
|
|
|
"flavor number " + Twine(nflavor) + " in " +
|
|
|
|
CmdName + " command");
|
|
|
|
}
|
|
|
|
} else if (cputype == MachO::CPU_TYPE_ARM) {
|
|
|
|
if (flavor == MachO::ARM_THREAD_STATE) {
|
|
|
|
if (count != MachO::ARM_THREAD_STATE_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not ARM_THREAD_STATE_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a ARM_THREAD_STATE flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::arm_thread_state32_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" ARM_THREAD_STATE extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::arm_thread_state32_t);
|
|
|
|
} else {
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" unknown flavor (" + Twine(flavor) + ") for "
|
|
|
|
"flavor number " + Twine(nflavor) + " in " +
|
|
|
|
CmdName + " command");
|
|
|
|
}
|
2019-05-14 19:25:44 +08:00
|
|
|
} else if (cputype == MachO::CPU_TYPE_ARM64 ||
|
|
|
|
cputype == MachO::CPU_TYPE_ARM64_32) {
|
2016-11-04 04:51:28 +08:00
|
|
|
if (flavor == MachO::ARM_THREAD_STATE64) {
|
|
|
|
if (count != MachO::ARM_THREAD_STATE64_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not ARM_THREAD_STATE64_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a ARM_THREAD_STATE64 flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::arm_thread_state64_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" ARM_THREAD_STATE64 extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::arm_thread_state64_t);
|
|
|
|
} else {
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" unknown flavor (" + Twine(flavor) + ") for "
|
|
|
|
"flavor number " + Twine(nflavor) + " in " +
|
|
|
|
CmdName + " command");
|
|
|
|
}
|
2016-10-20 07:44:34 +08:00
|
|
|
} else if (cputype == MachO::CPU_TYPE_POWERPC) {
|
|
|
|
if (flavor == MachO::PPC_THREAD_STATE) {
|
|
|
|
if (count != MachO::PPC_THREAD_STATE_COUNT)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" count not PPC_THREAD_STATE_COUNT for "
|
|
|
|
"flavor number " + Twine(nflavor) + " which is "
|
|
|
|
"a PPC_THREAD_STATE flavor in " + CmdName +
|
|
|
|
" command");
|
|
|
|
if (state + sizeof(MachO::ppc_thread_state32_t) > end)
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" PPC_THREAD_STATE extends past end of "
|
|
|
|
"command in " + CmdName + " command");
|
|
|
|
state += sizeof(MachO::ppc_thread_state32_t);
|
|
|
|
} else {
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" unknown flavor (" + Twine(flavor) + ") for "
|
|
|
|
"flavor number " + Twine(nflavor) + " in " +
|
|
|
|
CmdName + " command");
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
return malformedError("unknown cputype (" + Twine(cputype) + ") load "
|
|
|
|
"command " + Twine(LoadCommandIndex) + " for " +
|
|
|
|
CmdName + " command can't be checked");
|
|
|
|
}
|
|
|
|
nflavor++;
|
|
|
|
}
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-12-04 09:56:10 +08:00
|
|
|
static Error checkTwoLevelHintsCommand(const MachOObjectFile &Obj,
|
2016-10-21 04:10:30 +08:00
|
|
|
const MachOObjectFile::LoadCommandInfo
|
|
|
|
&Load,
|
|
|
|
uint32_t LoadCommandIndex,
|
2016-11-03 05:08:39 +08:00
|
|
|
const char **LoadCmd,
|
|
|
|
std::list<MachOElement> &Elements) {
|
2016-10-21 04:10:30 +08:00
|
|
|
if (Load.C.cmdsize != sizeof(MachO::twolevel_hints_command))
|
|
|
|
return malformedError("load command " + Twine(LoadCommandIndex) +
|
|
|
|
" LC_TWOLEVEL_HINTS has incorrect cmdsize");
|
|
|
|
if (*LoadCmd != nullptr)
|
|
|
|
return malformedError("more than one LC_TWOLEVEL_HINTS command");
|
2019-06-05 00:55:30 +08:00
|
|
|
auto HintsOrErr = getStructOrErr<MachO::twolevel_hints_command>(Obj, Load.Ptr);
|
|
|
|
if(!HintsOrErr)
|
|
|
|
return HintsOrErr.takeError();
|
|
|
|
MachO::twolevel_hints_command Hints = HintsOrErr.get();
|
2016-12-04 09:56:10 +08:00
|
|
|
uint64_t FileSize = Obj.getData().size();
|
2016-10-21 04:10:30 +08:00
|
|
|
if (Hints.offset > FileSize)
|
|
|
|
return malformedError("offset field of LC_TWOLEVEL_HINTS command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
|
|
|
uint64_t BigSize = Hints.nhints;
|
2017-10-18 04:43:33 +08:00
|
|
|
BigSize *= sizeof(MachO::twolevel_hint);
|
2016-10-21 04:10:30 +08:00
|
|
|
BigSize += Hints.offset;
|
|
|
|
if (BigSize > FileSize)
|
|
|
|
return malformedError("offset field plus nhints times sizeof(struct "
|
|
|
|
"twolevel_hint) field of LC_TWOLEVEL_HINTS command " +
|
|
|
|
Twine(LoadCommandIndex) + " extends past the end of "
|
|
|
|
"the file");
|
2016-11-03 05:08:39 +08:00
|
|
|
if (Error Err = checkOverlappingElement(Elements, Hints.offset, Hints.nhints *
|
|
|
|
sizeof(MachO::twolevel_hint),
|
|
|
|
"two level hints"))
|
|
|
|
return Err;
|
2016-10-21 04:10:30 +08:00
|
|
|
*LoadCmd = Load.Ptr;
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2016-10-28 04:59:10 +08:00
|
|
|
// Returns true if the libObject code does not support the load command and its
|
|
|
|
// contents. The cmd value it is treated as an unknown load command but with
|
|
|
|
// an error message that says the cmd value is obsolete.
|
|
|
|
static bool isLoadCommandObsolete(uint32_t cmd) {
|
|
|
|
if (cmd == MachO::LC_SYMSEG ||
|
|
|
|
cmd == MachO::LC_LOADFVMLIB ||
|
|
|
|
cmd == MachO::LC_IDFVMLIB ||
|
|
|
|
cmd == MachO::LC_IDENT ||
|
|
|
|
cmd == MachO::LC_FVMFILE ||
|
|
|
|
cmd == MachO::LC_PREPAGE ||
|
|
|
|
cmd == MachO::LC_PREBOUND_DYLIB ||
|
|
|
|
cmd == MachO::LC_TWOLEVEL_HINTS ||
|
|
|
|
cmd == MachO::LC_PREBIND_CKSUM)
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-03-26 05:59:14 +08:00
|
|
|
Expected<std::unique_ptr<MachOObjectFile>>
|
|
|
|
MachOObjectFile::create(MemoryBufferRef Object, bool IsLittleEndian,
|
2016-10-25 05:15:11 +08:00
|
|
|
bool Is64Bits, uint32_t UniversalCputype,
|
|
|
|
uint32_t UniversalIndex) {
|
2016-11-11 12:28:40 +08:00
|
|
|
Error Err = Error::success();
|
2016-03-26 05:59:14 +08:00
|
|
|
std::unique_ptr<MachOObjectFile> Obj(
|
|
|
|
new MachOObjectFile(std::move(Object), IsLittleEndian,
|
2016-10-25 05:15:11 +08:00
|
|
|
Is64Bits, Err, UniversalCputype,
|
|
|
|
UniversalIndex));
|
2016-03-26 05:59:14 +08:00
|
|
|
if (Err)
|
|
|
|
return std::move(Err);
|
|
|
|
return std::move(Obj);
|
|
|
|
}
|
|
|
|
|
2014-08-20 02:44:46 +08:00
|
|
|
MachOObjectFile::MachOObjectFile(MemoryBufferRef Object, bool IsLittleEndian,
|
2016-10-25 05:15:11 +08:00
|
|
|
bool Is64bits, Error &Err,
|
|
|
|
uint32_t UniversalCputype,
|
|
|
|
uint32_t UniversalIndex)
|
2017-04-22 06:03:05 +08:00
|
|
|
: ObjectFile(getMachOType(IsLittleEndian, Is64bits), Object) {
|
2016-07-23 00:11:25 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(&Err);
|
2016-08-13 04:10:25 +08:00
|
|
|
uint64_t SizeOfHeaders;
|
2016-10-25 05:15:11 +08:00
|
|
|
uint32_t cputype;
|
2016-04-14 05:17:58 +08:00
|
|
|
if (is64Bit()) {
|
2016-12-04 09:56:10 +08:00
|
|
|
parseHeader(*this, Header64, Err);
|
2016-08-13 04:10:25 +08:00
|
|
|
SizeOfHeaders = sizeof(MachO::mach_header_64);
|
2016-10-25 05:15:11 +08:00
|
|
|
cputype = Header64.cputype;
|
2016-04-14 05:17:58 +08:00
|
|
|
} else {
|
2016-12-04 09:56:10 +08:00
|
|
|
parseHeader(*this, Header, Err);
|
2016-08-13 04:10:25 +08:00
|
|
|
SizeOfHeaders = sizeof(MachO::mach_header);
|
2016-10-25 05:15:11 +08:00
|
|
|
cputype = Header.cputype;
|
2016-04-14 05:17:58 +08:00
|
|
|
}
|
2016-03-26 01:25:34 +08:00
|
|
|
if (Err)
|
2015-06-05 03:45:22 +08:00
|
|
|
return;
|
2016-08-13 04:10:25 +08:00
|
|
|
SizeOfHeaders += getHeader().sizeofcmds;
|
|
|
|
if (getData().data() + SizeOfHeaders > getData().end()) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("load commands extend past the end of the file");
|
2016-04-14 05:17:58 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-10-25 05:15:11 +08:00
|
|
|
if (UniversalCputype != 0 && cputype != UniversalCputype) {
|
|
|
|
Err = malformedError("universal header architecture: " +
|
|
|
|
Twine(UniversalIndex) + "'s cputype does not match "
|
|
|
|
"object file's mach header");
|
|
|
|
return;
|
|
|
|
}
|
2016-11-01 04:29:48 +08:00
|
|
|
std::list<MachOElement> Elements;
|
|
|
|
Elements.push_back({0, SizeOfHeaders, "Mach-O headers"});
|
2015-06-05 03:22:03 +08:00
|
|
|
|
|
|
|
uint32_t LoadCommandCount = getHeader().ncmds;
|
2016-03-26 01:25:34 +08:00
|
|
|
LoadCommandInfo Load;
|
2016-09-21 04:14:14 +08:00
|
|
|
if (LoadCommandCount != 0) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (auto LoadOrErr = getFirstLoadCommandInfo(*this))
|
2016-09-21 04:14:14 +08:00
|
|
|
Load = *LoadOrErr;
|
|
|
|
else {
|
|
|
|
Err = LoadOrErr.takeError();
|
|
|
|
return;
|
|
|
|
}
|
2015-06-05 03:57:46 +08:00
|
|
|
}
|
2016-03-26 01:25:34 +08:00
|
|
|
|
2016-09-21 04:14:14 +08:00
|
|
|
const char *DyldIdLoadCmd = nullptr;
|
2016-09-27 05:11:03 +08:00
|
|
|
const char *FuncStartsLoadCmd = nullptr;
|
|
|
|
const char *SplitInfoLoadCmd = nullptr;
|
|
|
|
const char *CodeSignDrsLoadCmd = nullptr;
|
2016-10-19 04:24:12 +08:00
|
|
|
const char *CodeSignLoadCmd = nullptr;
|
2016-09-29 05:20:45 +08:00
|
|
|
const char *VersLoadCmd = nullptr;
|
2016-09-30 01:45:23 +08:00
|
|
|
const char *SourceLoadCmd = nullptr;
|
2016-09-30 05:07:29 +08:00
|
|
|
const char *EntryPointLoadCmd = nullptr;
|
2016-10-05 04:37:43 +08:00
|
|
|
const char *EncryptLoadCmd = nullptr;
|
2016-10-19 01:54:17 +08:00
|
|
|
const char *RoutinesLoadCmd = nullptr;
|
2016-10-20 07:44:34 +08:00
|
|
|
const char *UnixThreadLoadCmd = nullptr;
|
2016-10-21 04:10:30 +08:00
|
|
|
const char *TwoLevelHintsLoadCmd = nullptr;
|
2015-06-04 06:19:36 +08:00
|
|
|
for (unsigned I = 0; I < LoadCommandCount; ++I) {
|
2016-07-08 06:11:42 +08:00
|
|
|
if (is64Bit()) {
|
|
|
|
if (Load.C.cmdsize % 8 != 0) {
|
|
|
|
// We have a hack here to allow 64-bit Mach-O core files to have
|
|
|
|
// LC_THREAD commands that are only a multiple of 4 and not 8 to be
|
|
|
|
// allowed since the macOS kernel produces them.
|
|
|
|
if (getHeader().filetype != MachO::MH_CORE ||
|
|
|
|
Load.C.cmd != MachO::LC_THREAD || Load.C.cmdsize % 4) {
|
|
|
|
Err = malformedError("load command " + Twine(I) + " cmdsize not a "
|
|
|
|
"multiple of 8");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if (Load.C.cmdsize % 4 != 0) {
|
|
|
|
Err = malformedError("load command " + Twine(I) + " cmdsize not a "
|
|
|
|
"multiple of 4");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2015-06-04 06:19:36 +08:00
|
|
|
LoadCommands.push_back(Load);
|
2013-09-01 12:28:48 +08:00
|
|
|
if (Load.C.cmd == MachO::LC_SYMTAB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkSymtabCommand(*this, Load, I, &SymtabLoadCmd, Elements)))
|
2014-11-14 03:48:56 +08:00
|
|
|
return;
|
2013-09-01 12:28:48 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_DYSYMTAB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDysymtabCommand(*this, Load, I, &DysymtabLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
Elements)))
|
2014-11-14 03:48:56 +08:00
|
|
|
return;
|
2013-09-01 12:28:48 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_DATA_IN_CODE) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &DataInCodeLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_DATA_IN_CODE", Elements,
|
|
|
|
"data in code info")))
|
2014-11-14 03:48:56 +08:00
|
|
|
return;
|
2015-01-28 05:28:24 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_LINKER_OPTIMIZATION_HINT) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &LinkOptHintsLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_LINKER_OPTIMIZATION_HINT",
|
|
|
|
Elements, "linker optimization "
|
|
|
|
"hints")))
|
2015-01-28 05:28:24 +08:00
|
|
|
return;
|
2016-09-27 05:11:03 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_FUNCTION_STARTS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &FuncStartsLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_FUNCTION_STARTS", Elements,
|
|
|
|
"function starts data")))
|
2016-09-27 05:11:03 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_SEGMENT_SPLIT_INFO) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &SplitInfoLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_SEGMENT_SPLIT_INFO", Elements,
|
|
|
|
"split info data")))
|
2016-09-27 05:11:03 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_DYLIB_CODE_SIGN_DRS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &CodeSignDrsLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_DYLIB_CODE_SIGN_DRS", Elements,
|
|
|
|
"code signing RDs data")))
|
2016-09-27 05:11:03 +08:00
|
|
|
return;
|
2016-10-19 04:24:12 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_CODE_SIGNATURE) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkeditDataCommand(*this, Load, I, &CodeSignLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_CODE_SIGNATURE", Elements,
|
|
|
|
"code signature data")))
|
2016-10-19 04:24:12 +08:00
|
|
|
return;
|
2016-09-14 05:42:28 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_DYLD_INFO) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDyldInfoCommand(*this, Load, I, &DyldInfoLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_DYLD_INFO", Elements)))
|
2016-09-14 05:42:28 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_DYLD_INFO_ONLY) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDyldInfoCommand(*this, Load, I, &DyldInfoLoadCmd,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_DYLD_INFO_ONLY", Elements)))
|
2014-11-14 03:48:56 +08:00
|
|
|
return;
|
2014-10-16 07:35:45 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_UUID) {
|
2016-09-22 04:03:09 +08:00
|
|
|
if (Load.C.cmdsize != sizeof(MachO::uuid_command)) {
|
|
|
|
Err = malformedError("LC_UUID command " + Twine(I) + " has incorrect "
|
|
|
|
"cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
2014-11-14 03:48:56 +08:00
|
|
|
if (UuidLoadCmd) {
|
2016-09-22 04:03:09 +08:00
|
|
|
Err = malformedError("more than one LC_UUID command");
|
2014-11-14 03:48:56 +08:00
|
|
|
return;
|
|
|
|
}
|
2014-10-16 07:35:45 +08:00
|
|
|
UuidLoadCmd = Load.Ptr;
|
2015-06-05 06:08:37 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_SEGMENT_64) {
|
2016-08-13 04:10:25 +08:00
|
|
|
if ((Err = parseSegmentLoadCommand<MachO::segment_command_64,
|
|
|
|
MachO::section_64>(
|
2016-12-04 09:56:10 +08:00
|
|
|
*this, Load, Sections, HasPageZeroSegment, I,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_SEGMENT_64", SizeOfHeaders, Elements)))
|
2015-06-05 04:08:52 +08:00
|
|
|
return;
|
2015-06-05 06:08:37 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_SEGMENT) {
|
2016-08-13 04:10:25 +08:00
|
|
|
if ((Err = parseSegmentLoadCommand<MachO::segment_command,
|
|
|
|
MachO::section>(
|
2016-12-04 09:56:10 +08:00
|
|
|
*this, Load, Sections, HasPageZeroSegment, I,
|
2016-11-03 05:08:39 +08:00
|
|
|
"LC_SEGMENT", SizeOfHeaders, Elements)))
|
2015-06-05 04:08:52 +08:00
|
|
|
return;
|
2016-09-21 04:14:14 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_ID_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibIdCommand(*this, Load, I, &DyldIdLoadCmd)))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_LOAD_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_DYLIB")))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
|
|
|
Libraries.push_back(Load.Ptr);
|
|
|
|
} else if (Load.C.cmd == MachO::LC_LOAD_WEAK_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_WEAK_DYLIB")))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
|
|
|
Libraries.push_back(Load.Ptr);
|
|
|
|
} else if (Load.C.cmd == MachO::LC_LAZY_LOAD_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibCommand(*this, Load, I, "LC_LAZY_LOAD_DYLIB")))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
|
|
|
Libraries.push_back(Load.Ptr);
|
|
|
|
} else if (Load.C.cmd == MachO::LC_REEXPORT_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibCommand(*this, Load, I, "LC_REEXPORT_DYLIB")))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
|
|
|
Libraries.push_back(Load.Ptr);
|
|
|
|
} else if (Load.C.cmd == MachO::LC_LOAD_UPWARD_DYLIB) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDylibCommand(*this, Load, I, "LC_LOAD_UPWARD_DYLIB")))
|
2016-09-21 04:14:14 +08:00
|
|
|
return;
|
2014-06-06 05:21:57 +08:00
|
|
|
Libraries.push_back(Load.Ptr);
|
2016-09-28 07:24:13 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_ID_DYLINKER) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDyldCommand(*this, Load, I, "LC_ID_DYLINKER")))
|
2016-09-28 07:24:13 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_LOAD_DYLINKER) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDyldCommand(*this, Load, I, "LC_LOAD_DYLINKER")))
|
2016-09-28 07:24:13 +08:00
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_DYLD_ENVIRONMENT) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkDyldCommand(*this, Load, I, "LC_DYLD_ENVIRONMENT")))
|
2016-09-28 07:24:13 +08:00
|
|
|
return;
|
2016-09-29 05:20:45 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_VERSION_MIN_MACOSX) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
|
2016-09-29 05:20:45 +08:00
|
|
|
"LC_VERSION_MIN_MACOSX")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_VERSION_MIN_IPHONEOS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
|
2016-09-29 05:20:45 +08:00
|
|
|
"LC_VERSION_MIN_IPHONEOS")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_VERSION_MIN_TVOS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
|
2016-09-29 05:20:45 +08:00
|
|
|
"LC_VERSION_MIN_TVOS")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_VERSION_MIN_WATCHOS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkVersCommand(*this, Load, I, &VersLoadCmd,
|
2016-09-29 05:20:45 +08:00
|
|
|
"LC_VERSION_MIN_WATCHOS")))
|
|
|
|
return;
|
2017-01-20 01:36:31 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_NOTE) {
|
|
|
|
if ((Err = checkNoteCommand(*this, Load, I, Elements)))
|
|
|
|
return;
|
2017-01-24 04:07:55 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_BUILD_VERSION) {
|
|
|
|
if ((Err = parseBuildVersionCommand(*this, Load, BuildTools, I)))
|
|
|
|
return;
|
2016-09-29 07:16:01 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_RPATH) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkRpathCommand(*this, Load, I)))
|
2016-09-29 07:16:01 +08:00
|
|
|
return;
|
2016-09-30 01:45:23 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_SOURCE_VERSION) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::source_version_command)) {
|
|
|
|
Err = malformedError("LC_SOURCE_VERSION command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (SourceLoadCmd) {
|
|
|
|
Err = malformedError("more than one LC_SOURCE_VERSION command");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
SourceLoadCmd = Load.Ptr;
|
2016-09-30 05:07:29 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_MAIN) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::entry_point_command)) {
|
|
|
|
Err = malformedError("LC_MAIN command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (EntryPointLoadCmd) {
|
|
|
|
Err = malformedError("more than one LC_MAIN command");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
EntryPointLoadCmd = Load.Ptr;
|
2016-10-05 04:37:43 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_ENCRYPTION_INFO) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::encryption_info_command)) {
|
|
|
|
Err = malformedError("LC_ENCRYPTION_INFO command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::encryption_info_command E =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::encryption_info_command>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkEncryptCommand(*this, Load, I, E.cryptoff, E.cryptsize,
|
2016-10-05 04:37:43 +08:00
|
|
|
&EncryptLoadCmd, "LC_ENCRYPTION_INFO")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_ENCRYPTION_INFO_64) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::encryption_info_command_64)) {
|
|
|
|
Err = malformedError("LC_ENCRYPTION_INFO_64 command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::encryption_info_command_64 E =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::encryption_info_command_64>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkEncryptCommand(*this, Load, I, E.cryptoff, E.cryptsize,
|
2016-10-05 04:37:43 +08:00
|
|
|
&EncryptLoadCmd, "LC_ENCRYPTION_INFO_64")))
|
|
|
|
return;
|
2016-10-12 05:04:39 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_LINKER_OPTION) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkLinkerOptCommand(*this, Load, I)))
|
2016-10-12 05:04:39 +08:00
|
|
|
return;
|
2016-10-18 06:09:25 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_SUB_FRAMEWORK) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::sub_framework_command)) {
|
|
|
|
Err = malformedError("load command " + Twine(I) +
|
|
|
|
" LC_SUB_FRAMEWORK cmdsize too small");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::sub_framework_command S =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::sub_framework_command>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_FRAMEWORK",
|
2016-10-18 06:09:25 +08:00
|
|
|
sizeof(MachO::sub_framework_command),
|
|
|
|
"sub_framework_command", S.umbrella,
|
|
|
|
"umbrella")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_SUB_UMBRELLA) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::sub_umbrella_command)) {
|
|
|
|
Err = malformedError("load command " + Twine(I) +
|
|
|
|
" LC_SUB_UMBRELLA cmdsize too small");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::sub_umbrella_command S =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::sub_umbrella_command>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_UMBRELLA",
|
2016-10-18 06:09:25 +08:00
|
|
|
sizeof(MachO::sub_umbrella_command),
|
|
|
|
"sub_umbrella_command", S.sub_umbrella,
|
|
|
|
"sub_umbrella")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_SUB_LIBRARY) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::sub_library_command)) {
|
|
|
|
Err = malformedError("load command " + Twine(I) +
|
|
|
|
" LC_SUB_LIBRARY cmdsize too small");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::sub_library_command S =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::sub_library_command>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_LIBRARY",
|
2016-10-18 06:09:25 +08:00
|
|
|
sizeof(MachO::sub_library_command),
|
|
|
|
"sub_library_command", S.sub_library,
|
|
|
|
"sub_library")))
|
|
|
|
return;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_SUB_CLIENT) {
|
|
|
|
if (Load.C.cmdsize < sizeof(MachO::sub_client_command)) {
|
|
|
|
Err = malformedError("load command " + Twine(I) +
|
|
|
|
" LC_SUB_CLIENT cmdsize too small");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
MachO::sub_client_command S =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::sub_client_command>(*this, Load.Ptr);
|
|
|
|
if ((Err = checkSubCommand(*this, Load, I, "LC_SUB_CLIENT",
|
2016-10-18 06:09:25 +08:00
|
|
|
sizeof(MachO::sub_client_command),
|
|
|
|
"sub_client_command", S.client, "client")))
|
|
|
|
return;
|
2016-10-19 01:54:17 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_ROUTINES) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::routines_command)) {
|
|
|
|
Err = malformedError("LC_ROUTINES command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (RoutinesLoadCmd) {
|
|
|
|
Err = malformedError("more than one LC_ROUTINES and or LC_ROUTINES_64 "
|
|
|
|
"command");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
RoutinesLoadCmd = Load.Ptr;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_ROUTINES_64) {
|
|
|
|
if (Load.C.cmdsize != sizeof(MachO::routines_command_64)) {
|
|
|
|
Err = malformedError("LC_ROUTINES_64 command " + Twine(I) +
|
|
|
|
" has incorrect cmdsize");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (RoutinesLoadCmd) {
|
|
|
|
Err = malformedError("more than one LC_ROUTINES_64 and or LC_ROUTINES "
|
|
|
|
"command");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
RoutinesLoadCmd = Load.Ptr;
|
2016-10-20 07:44:34 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_UNIXTHREAD) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkThreadCommand(*this, Load, I, "LC_UNIXTHREAD")))
|
2016-10-20 07:44:34 +08:00
|
|
|
return;
|
|
|
|
if (UnixThreadLoadCmd) {
|
|
|
|
Err = malformedError("more than one LC_UNIXTHREAD command");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
UnixThreadLoadCmd = Load.Ptr;
|
|
|
|
} else if (Load.C.cmd == MachO::LC_THREAD) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkThreadCommand(*this, Load, I, "LC_THREAD")))
|
2016-10-20 07:44:34 +08:00
|
|
|
return;
|
2016-10-28 04:59:10 +08:00
|
|
|
// Note: LC_TWOLEVEL_HINTS is really obsolete and is not supported.
|
2016-10-21 04:10:30 +08:00
|
|
|
} else if (Load.C.cmd == MachO::LC_TWOLEVEL_HINTS) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if ((Err = checkTwoLevelHintsCommand(*this, Load, I,
|
2016-11-03 05:08:39 +08:00
|
|
|
&TwoLevelHintsLoadCmd, Elements)))
|
2016-10-21 04:10:30 +08:00
|
|
|
return;
|
2016-10-28 04:59:10 +08:00
|
|
|
} else if (isLoadCommandObsolete(Load.C.cmd)) {
|
|
|
|
Err = malformedError("load command " + Twine(I) + " for cmd value of: " +
|
|
|
|
Twine(Load.C.cmd) + " is obsolete and not "
|
|
|
|
"supported");
|
|
|
|
return;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2016-10-28 04:59:10 +08:00
|
|
|
// TODO: generate a error for unknown load commands by default. But still
|
|
|
|
// need work out an approach to allow or not allow unknown values like this
|
|
|
|
// as an option for some uses like lldb.
|
2015-06-05 03:57:46 +08:00
|
|
|
if (I < LoadCommandCount - 1) {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (auto LoadOrErr = getNextLoadCommandInfo(*this, I, Load))
|
2016-03-26 01:25:34 +08:00
|
|
|
Load = *LoadOrErr;
|
|
|
|
else {
|
|
|
|
Err = LoadOrErr.takeError();
|
2015-06-05 03:57:46 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2016-01-23 06:49:55 +08:00
|
|
|
if (!SymtabLoadCmd) {
|
|
|
|
if (DysymtabLoadCmd) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("contains LC_DYSYMTAB load command without a "
|
2016-05-06 07:41:05 +08:00
|
|
|
"LC_SYMTAB load command");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
} else if (DysymtabLoadCmd) {
|
|
|
|
MachO::symtab_command Symtab =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::symtab_command>(*this, SymtabLoadCmd);
|
2016-01-23 06:49:55 +08:00
|
|
|
MachO::dysymtab_command Dysymtab =
|
2016-12-04 09:56:10 +08:00
|
|
|
getStruct<MachO::dysymtab_command>(*this, DysymtabLoadCmd);
|
2016-01-23 06:49:55 +08:00
|
|
|
if (Dysymtab.nlocalsym != 0 && Dysymtab.ilocalsym > Symtab.nsyms) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("ilocalsym in LC_DYSYMTAB load command "
|
2016-05-06 07:41:05 +08:00
|
|
|
"extends past the end of the symbol table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-04-22 04:29:49 +08:00
|
|
|
uint64_t BigSize = Dysymtab.ilocalsym;
|
|
|
|
BigSize += Dysymtab.nlocalsym;
|
|
|
|
if (Dysymtab.nlocalsym != 0 && BigSize > Symtab.nsyms) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("ilocalsym plus nlocalsym in LC_DYSYMTAB load "
|
2016-05-06 07:41:05 +08:00
|
|
|
"command extends past the end of the symbol table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
2018-09-05 00:31:48 +08:00
|
|
|
if (Dysymtab.nextdefsym != 0 && Dysymtab.iextdefsym > Symtab.nsyms) {
|
2018-09-05 00:31:53 +08:00
|
|
|
Err = malformedError("iextdefsym in LC_DYSYMTAB load command "
|
2016-05-06 07:41:05 +08:00
|
|
|
"extends past the end of the symbol table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-04-22 04:29:49 +08:00
|
|
|
BigSize = Dysymtab.iextdefsym;
|
|
|
|
BigSize += Dysymtab.nextdefsym;
|
|
|
|
if (Dysymtab.nextdefsym != 0 && BigSize > Symtab.nsyms) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("iextdefsym plus nextdefsym in LC_DYSYMTAB "
|
2016-05-06 07:41:05 +08:00
|
|
|
"load command extends past the end of the symbol "
|
|
|
|
"table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (Dysymtab.nundefsym != 0 && Dysymtab.iundefsym > Symtab.nsyms) {
|
2018-09-05 00:31:53 +08:00
|
|
|
Err = malformedError("iundefsym in LC_DYSYMTAB load command "
|
2016-05-06 07:41:05 +08:00
|
|
|
"extends past the end of the symbol table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-04-22 04:29:49 +08:00
|
|
|
BigSize = Dysymtab.iundefsym;
|
|
|
|
BigSize += Dysymtab.nundefsym;
|
|
|
|
if (Dysymtab.nundefsym != 0 && BigSize > Symtab.nsyms) {
|
2016-05-07 04:16:28 +08:00
|
|
|
Err = malformedError("iundefsym plus nundefsym in LC_DYSYMTAB load "
|
2016-05-06 07:41:05 +08:00
|
|
|
" command extends past the end of the symbol table");
|
2016-01-23 06:49:55 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2016-09-21 04:14:14 +08:00
|
|
|
if ((getHeader().filetype == MachO::MH_DYLIB ||
|
|
|
|
getHeader().filetype == MachO::MH_DYLIB_STUB) &&
|
|
|
|
DyldIdLoadCmd == nullptr) {
|
|
|
|
Err = malformedError("no LC_ID_DYLIB load command in dynamic library "
|
|
|
|
"filetype");
|
|
|
|
return;
|
|
|
|
}
|
2015-06-04 06:19:36 +08:00
|
|
|
assert(LoadCommands.size() == LoadCommandCount);
|
2016-03-26 01:25:34 +08:00
|
|
|
|
|
|
|
Err = Error::success();
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-11-15 04:57:04 +08:00
|
|
|
Error MachOObjectFile::checkSymbolTable() const {
|
|
|
|
uint32_t Flags = 0;
|
|
|
|
if (is64Bit()) {
|
|
|
|
MachO::mach_header_64 H_64 = MachOObjectFile::getHeader64();
|
|
|
|
Flags = H_64.flags;
|
|
|
|
} else {
|
|
|
|
MachO::mach_header H = MachOObjectFile::getHeader();
|
|
|
|
Flags = H.flags;
|
|
|
|
}
|
|
|
|
uint8_t NType = 0;
|
|
|
|
uint8_t NSect = 0;
|
|
|
|
uint16_t NDesc = 0;
|
|
|
|
uint32_t NStrx = 0;
|
|
|
|
uint64_t NValue = 0;
|
|
|
|
uint32_t SymbolIndex = 0;
|
|
|
|
MachO::symtab_command S = getSymtabLoadCommand();
|
|
|
|
for (const SymbolRef &Symbol : symbols()) {
|
|
|
|
DataRefImpl SymDRI = Symbol.getRawDataRefImpl();
|
|
|
|
if (is64Bit()) {
|
|
|
|
MachO::nlist_64 STE_64 = getSymbol64TableEntry(SymDRI);
|
|
|
|
NType = STE_64.n_type;
|
|
|
|
NSect = STE_64.n_sect;
|
|
|
|
NDesc = STE_64.n_desc;
|
|
|
|
NStrx = STE_64.n_strx;
|
|
|
|
NValue = STE_64.n_value;
|
|
|
|
} else {
|
|
|
|
MachO::nlist STE = getSymbolTableEntry(SymDRI);
|
|
|
|
NType = STE.n_type;
|
|
|
|
NSect = STE.n_sect;
|
|
|
|
NDesc = STE.n_desc;
|
|
|
|
NStrx = STE.n_strx;
|
|
|
|
NValue = STE.n_value;
|
|
|
|
}
|
2019-02-23 14:19:56 +08:00
|
|
|
if ((NType & MachO::N_STAB) == 0) {
|
|
|
|
if ((NType & MachO::N_TYPE) == MachO::N_SECT) {
|
|
|
|
if (NSect == 0 || NSect > Sections.size())
|
|
|
|
return malformedError("bad section index: " + Twine((int)NSect) +
|
|
|
|
" for symbol at index " + Twine(SymbolIndex));
|
|
|
|
}
|
|
|
|
if ((NType & MachO::N_TYPE) == MachO::N_INDR) {
|
|
|
|
if (NValue >= S.strsize)
|
|
|
|
return malformedError("bad n_value: " + Twine((int)NValue) + " past "
|
|
|
|
"the end of string table, for N_INDR symbol at "
|
|
|
|
"index " + Twine(SymbolIndex));
|
2016-11-15 04:57:04 +08:00
|
|
|
}
|
2019-02-23 14:19:56 +08:00
|
|
|
if ((Flags & MachO::MH_TWOLEVEL) == MachO::MH_TWOLEVEL &&
|
|
|
|
(((NType & MachO::N_TYPE) == MachO::N_UNDF && NValue == 0) ||
|
|
|
|
(NType & MachO::N_TYPE) == MachO::N_PBUD)) {
|
|
|
|
uint32_t LibraryOrdinal = MachO::GET_LIBRARY_ORDINAL(NDesc);
|
|
|
|
if (LibraryOrdinal != 0 &&
|
|
|
|
LibraryOrdinal != MachO::EXECUTABLE_ORDINAL &&
|
|
|
|
LibraryOrdinal != MachO::DYNAMIC_LOOKUP_ORDINAL &&
|
|
|
|
LibraryOrdinal - 1 >= Libraries.size() ) {
|
|
|
|
return malformedError("bad library ordinal: " + Twine(LibraryOrdinal) +
|
|
|
|
" for symbol at index " + Twine(SymbolIndex));
|
|
|
|
}
|
|
|
|
}
|
2016-11-15 04:57:04 +08:00
|
|
|
}
|
|
|
|
if (NStrx >= S.strsize)
|
|
|
|
return malformedError("bad string table index: " + Twine((int)NStrx) +
|
|
|
|
" past the end of string table, for symbol at "
|
|
|
|
"index " + Twine(SymbolIndex));
|
|
|
|
SymbolIndex++;
|
|
|
|
}
|
|
|
|
return Error::success();
|
|
|
|
}
|
|
|
|
|
2014-01-30 10:49:50 +08:00
|
|
|
void MachOObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
|
2013-04-25 03:47:55 +08:00
|
|
|
unsigned SymbolTableEntrySize = is64Bit() ?
|
2013-09-01 12:28:48 +08:00
|
|
|
sizeof(MachO::nlist_64) :
|
|
|
|
sizeof(MachO::nlist);
|
2013-04-25 03:47:55 +08:00
|
|
|
Symb.p += SymbolTableEntrySize;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-04-21 05:24:34 +08:00
|
|
|
Expected<StringRef> MachOObjectFile::getSymbolName(DataRefImpl Symb) const {
|
2013-04-27 04:07:33 +08:00
|
|
|
StringRef StringTable = getStringTableData();
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
|
2018-01-04 07:28:32 +08:00
|
|
|
if (Entry.n_strx == 0)
|
|
|
|
// A n_strx value of 0 indicates that no name is associated with a
|
|
|
|
// particular symbol table entry.
|
|
|
|
return StringRef();
|
2013-09-01 12:28:48 +08:00
|
|
|
const char *Start = &StringTable.data()[Entry.n_strx];
|
2016-04-21 05:24:34 +08:00
|
|
|
if (Start < getData().begin() || Start >= getData().end()) {
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("bad string index: " + Twine(Entry.n_strx) +
|
2016-05-06 07:41:05 +08:00
|
|
|
" for symbol at index " + Twine(getSymbolIndex(Symb)));
|
2016-04-21 05:24:34 +08:00
|
|
|
}
|
2015-07-03 04:55:21 +08:00
|
|
|
return StringRef(Start);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-12-11 04:46:55 +08:00
|
|
|
unsigned MachOObjectFile::getSectionType(SectionRef Sec) const {
|
|
|
|
DataRefImpl DRI = Sec.getRawDataRefImpl();
|
2016-12-04 09:56:10 +08:00
|
|
|
uint32_t Flags = getSectionFlags(*this, DRI);
|
2014-12-11 04:46:55 +08:00
|
|
|
return Flags & MachO::SECTION_TYPE;
|
|
|
|
}
|
|
|
|
|
2015-06-25 02:14:41 +08:00
|
|
|
uint64_t MachOObjectFile::getNValue(DataRefImpl Sym) const {
|
|
|
|
if (is64Bit()) {
|
|
|
|
MachO::nlist_64 Entry = getSymbol64TableEntry(Sym);
|
|
|
|
return Entry.n_value;
|
|
|
|
}
|
|
|
|
MachO::nlist Entry = getSymbolTableEntry(Sym);
|
|
|
|
return Entry.n_value;
|
|
|
|
}
|
|
|
|
|
2014-06-06 05:21:57 +08:00
|
|
|
// getIndirectName() returns the name of the alias'ed symbol who's string table
|
|
|
|
// index is in the n_value field.
|
2014-06-13 05:46:39 +08:00
|
|
|
std::error_code MachOObjectFile::getIndirectName(DataRefImpl Symb,
|
|
|
|
StringRef &Res) const {
|
2014-06-06 05:21:57 +08:00
|
|
|
StringRef StringTable = getStringTableData();
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
|
2015-06-25 02:14:41 +08:00
|
|
|
if ((Entry.n_type & MachO::N_TYPE) != MachO::N_INDR)
|
|
|
|
return object_error::parse_failed;
|
|
|
|
uint64_t NValue = getNValue(Symb);
|
2014-06-06 05:21:57 +08:00
|
|
|
if (NValue >= StringTable.size())
|
|
|
|
return object_error::parse_failed;
|
|
|
|
const char *Start = &StringTable.data()[NValue];
|
|
|
|
Res = StringRef(Start);
|
2015-06-09 23:20:42 +08:00
|
|
|
return std::error_code();
|
2014-06-06 05:21:57 +08:00
|
|
|
}
|
|
|
|
|
2015-07-08 01:12:59 +08:00
|
|
|
uint64_t MachOObjectFile::getSymbolValueImpl(DataRefImpl Sym) const {
|
2015-07-07 23:05:09 +08:00
|
|
|
return getNValue(Sym);
|
2015-06-25 03:11:10 +08:00
|
|
|
}
|
|
|
|
|
2016-06-25 02:24:42 +08:00
|
|
|
Expected<uint64_t> MachOObjectFile::getSymbolAddress(DataRefImpl Sym) const {
|
2015-07-04 02:19:00 +08:00
|
|
|
return getSymbolValue(Sym);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2015-06-01 07:52:50 +08:00
|
|
|
uint32_t MachOObjectFile::getSymbolAlignment(DataRefImpl DRI) const {
|
2014-02-01 04:57:12 +08:00
|
|
|
uint32_t flags = getSymbolFlags(DRI);
|
2013-04-30 06:24:22 +08:00
|
|
|
if (flags & SymbolRef::SF_Common) {
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, DRI);
|
2015-06-01 07:52:50 +08:00
|
|
|
return 1 << MachO::GET_COMM_ALIGN(Entry.n_desc);
|
2013-04-30 06:24:22 +08:00
|
|
|
}
|
2015-06-01 07:52:50 +08:00
|
|
|
return 0;
|
2013-04-30 06:24:22 +08:00
|
|
|
}
|
|
|
|
|
2015-06-24 18:20:30 +08:00
|
|
|
uint64_t MachOObjectFile::getCommonSymbolSizeImpl(DataRefImpl DRI) const {
|
2015-07-07 21:58:32 +08:00
|
|
|
return getNValue(DRI);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-05-03 04:28:12 +08:00
|
|
|
Expected<SymbolRef::Type>
|
2016-03-24 04:27:00 +08:00
|
|
|
MachOObjectFile::getSymbolType(DataRefImpl Symb) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
|
2013-09-01 12:28:48 +08:00
|
|
|
uint8_t n_type = Entry.n_type;
|
2013-04-19 02:08:55 +08:00
|
|
|
|
|
|
|
// If this is a STAB debugging symbol, we can do nothing more.
|
2015-06-26 20:18:49 +08:00
|
|
|
if (n_type & MachO::N_STAB)
|
|
|
|
return SymbolRef::ST_Debug;
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2013-08-27 13:00:13 +08:00
|
|
|
switch (n_type & MachO::N_TYPE) {
|
|
|
|
case MachO::N_UNDF :
|
2015-06-26 20:18:49 +08:00
|
|
|
return SymbolRef::ST_Unknown;
|
2013-08-27 13:00:13 +08:00
|
|
|
case MachO::N_SECT :
|
2016-05-03 04:28:12 +08:00
|
|
|
Expected<section_iterator> SecOrError = getSymbolSection(Symb);
|
2016-03-24 04:27:00 +08:00
|
|
|
if (!SecOrError)
|
2016-05-03 04:28:12 +08:00
|
|
|
return SecOrError.takeError();
|
2016-03-24 04:27:00 +08:00
|
|
|
section_iterator Sec = *SecOrError;
|
2015-11-12 17:40:29 +08:00
|
|
|
if (Sec->isData() || Sec->isBSS())
|
|
|
|
return SymbolRef::ST_Data;
|
2015-06-26 20:18:49 +08:00
|
|
|
return SymbolRef::ST_Function;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2015-06-26 20:18:49 +08:00
|
|
|
return SymbolRef::ST_Other;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-02-01 04:57:12 +08:00
|
|
|
uint32_t MachOObjectFile::getSymbolFlags(DataRefImpl DRI) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, DRI);
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
uint8_t MachOType = Entry.n_type;
|
|
|
|
uint16_t MachOFlags = Entry.n_desc;
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2014-02-01 04:57:12 +08:00
|
|
|
uint32_t Result = SymbolRef::SF_None;
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2014-05-30 21:22:59 +08:00
|
|
|
if ((MachOType & MachO::N_TYPE) == MachO::N_INDR)
|
|
|
|
Result |= SymbolRef::SF_Indirect;
|
|
|
|
|
2013-11-02 13:03:24 +08:00
|
|
|
if (MachOType & MachO::N_STAB)
|
2013-04-19 02:08:55 +08:00
|
|
|
Result |= SymbolRef::SF_FormatSpecific;
|
|
|
|
|
2013-08-27 13:00:13 +08:00
|
|
|
if (MachOType & MachO::N_EXT) {
|
2013-04-19 02:08:55 +08:00
|
|
|
Result |= SymbolRef::SF_Global;
|
2013-08-27 13:00:13 +08:00
|
|
|
if ((MachOType & MachO::N_TYPE) == MachO::N_UNDF) {
|
2015-07-07 21:58:32 +08:00
|
|
|
if (getNValue(DRI))
|
2013-04-30 06:24:22 +08:00
|
|
|
Result |= SymbolRef::SF_Common;
|
2015-07-07 22:26:39 +08:00
|
|
|
else
|
|
|
|
Result |= SymbolRef::SF_Undefined;
|
2013-04-30 06:24:22 +08:00
|
|
|
}
|
2015-01-16 06:33:30 +08:00
|
|
|
|
|
|
|
if (!(MachOType & MachO::N_PEXT))
|
|
|
|
Result |= SymbolRef::SF_Exported;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-08-27 13:00:13 +08:00
|
|
|
if (MachOFlags & (MachO::N_WEAK_REF | MachO::N_WEAK_DEF))
|
2013-04-19 02:08:55 +08:00
|
|
|
Result |= SymbolRef::SF_Weak;
|
|
|
|
|
2014-08-19 04:21:02 +08:00
|
|
|
if (MachOFlags & (MachO::N_ARM_THUMB_DEF))
|
|
|
|
Result |= SymbolRef::SF_Thumb;
|
|
|
|
|
2013-08-27 13:00:13 +08:00
|
|
|
if ((MachOType & MachO::N_TYPE) == MachO::N_ABS)
|
2013-04-19 02:08:55 +08:00
|
|
|
Result |= SymbolRef::SF_Absolute;
|
|
|
|
|
2014-02-01 04:57:12 +08:00
|
|
|
return Result;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-05-03 04:28:12 +08:00
|
|
|
Expected<section_iterator>
|
2015-08-08 07:27:14 +08:00
|
|
|
MachOObjectFile::getSymbolSection(DataRefImpl Symb) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
MachO::nlist_base Entry = getSymbolTableEntryBase(*this, Symb);
|
2013-09-01 12:28:48 +08:00
|
|
|
uint8_t index = Entry.n_sect;
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2015-08-08 07:27:14 +08:00
|
|
|
if (index == 0)
|
|
|
|
return section_end();
|
|
|
|
DataRefImpl DRI;
|
|
|
|
DRI.d.a = index - 1;
|
2016-03-24 04:27:00 +08:00
|
|
|
if (DRI.d.a >= Sections.size()){
|
2016-05-07 04:16:28 +08:00
|
|
|
return malformedError("bad section index: " + Twine((int)index) +
|
2016-05-06 07:41:05 +08:00
|
|
|
" for symbol at index " + Twine(getSymbolIndex(Symb)));
|
2016-03-24 04:27:00 +08:00
|
|
|
}
|
2015-08-08 07:27:14 +08:00
|
|
|
return section_iterator(SectionRef(DRI, this));
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2015-06-25 03:57:32 +08:00
|
|
|
unsigned MachOObjectFile::getSymbolSectionID(SymbolRef Sym) const {
|
|
|
|
MachO::nlist_base Entry =
|
2016-12-04 09:56:10 +08:00
|
|
|
getSymbolTableEntryBase(*this, Sym.getRawDataRefImpl());
|
2015-06-25 03:57:32 +08:00
|
|
|
return Entry.n_sect - 1;
|
|
|
|
}
|
|
|
|
|
2014-01-30 10:49:50 +08:00
|
|
|
void MachOObjectFile::moveSectionNext(DataRefImpl &Sec) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
Sec.d.a++;
|
|
|
|
}
|
|
|
|
|
2019-05-02 18:32:03 +08:00
|
|
|
Expected<StringRef> MachOObjectFile::getSectionName(DataRefImpl Sec) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
ArrayRef<char> Raw = getSectionRawName(Sec);
|
2019-05-02 18:32:03 +08:00
|
|
|
return parseSegmentOrSectionName(Raw.data());
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
uint64_t MachOObjectFile::getSectionAddress(DataRefImpl Sec) const {
|
|
|
|
if (is64Bit())
|
|
|
|
return getSection64(Sec).addr;
|
|
|
|
return getSection(Sec).addr;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2017-05-28 02:10:23 +08:00
|
|
|
uint64_t MachOObjectFile::getSectionIndex(DataRefImpl Sec) const {
|
|
|
|
return Sec.d.a;
|
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
uint64_t MachOObjectFile::getSectionSize(DataRefImpl Sec) const {
|
2015-10-09 06:50:55 +08:00
|
|
|
// In the case if a malformed Mach-O file where the section offset is past
|
|
|
|
// the end of the file or some part of the section size is past the end of
|
|
|
|
// the file return a size of zero or a size that covers the rest of the file
|
|
|
|
// but does not extend past the end of the file.
|
|
|
|
uint32_t SectOffset, SectType;
|
|
|
|
uint64_t SectSize;
|
|
|
|
|
|
|
|
if (is64Bit()) {
|
|
|
|
MachO::section_64 Sect = getSection64(Sec);
|
|
|
|
SectOffset = Sect.offset;
|
|
|
|
SectSize = Sect.size;
|
|
|
|
SectType = Sect.flags & MachO::SECTION_TYPE;
|
|
|
|
} else {
|
|
|
|
MachO::section Sect = getSection(Sec);
|
|
|
|
SectOffset = Sect.offset;
|
|
|
|
SectSize = Sect.size;
|
|
|
|
SectType = Sect.flags & MachO::SECTION_TYPE;
|
|
|
|
}
|
|
|
|
if (SectType == MachO::S_ZEROFILL || SectType == MachO::S_GB_ZEROFILL)
|
|
|
|
return SectSize;
|
|
|
|
uint64_t FileSize = getData().size();
|
|
|
|
if (SectOffset > FileSize)
|
|
|
|
return 0;
|
|
|
|
if (FileSize - SectOffset < SectSize)
|
|
|
|
return FileSize - SectOffset;
|
|
|
|
return SectSize;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2019-05-14 12:22:51 +08:00
|
|
|
Expected<ArrayRef<uint8_t>>
|
|
|
|
MachOObjectFile::getSectionContents(DataRefImpl Sec) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
uint32_t Offset;
|
|
|
|
uint64_t Size;
|
|
|
|
|
|
|
|
if (is64Bit()) {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section_64 Sect = getSection64(Sec);
|
|
|
|
Offset = Sect.offset;
|
|
|
|
Size = Sect.size;
|
2013-04-19 02:08:55 +08:00
|
|
|
} else {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section Sect = getSection(Sec);
|
|
|
|
Offset = Sect.offset;
|
|
|
|
Size = Sect.size;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2019-05-14 12:22:51 +08:00
|
|
|
return arrayRefFromStringRef(getData().substr(Offset, Size));
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
uint64_t MachOObjectFile::getSectionAlignment(DataRefImpl Sec) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
uint32_t Align;
|
|
|
|
if (is64Bit()) {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section_64 Sect = getSection64(Sec);
|
|
|
|
Align = Sect.align;
|
2013-04-19 02:08:55 +08:00
|
|
|
} else {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section Sect = getSection(Sec);
|
|
|
|
Align = Sect.align;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
return uint64_t(1) << Align;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2018-07-11 18:00:29 +08:00
|
|
|
Expected<SectionRef> MachOObjectFile::getSection(unsigned SectionIndex) const {
|
|
|
|
if (SectionIndex < 1 || SectionIndex > Sections.size())
|
|
|
|
return malformedError("bad section index: " + Twine((int)SectionIndex));
|
|
|
|
|
|
|
|
DataRefImpl DRI;
|
|
|
|
DRI.d.a = SectionIndex - 1;
|
|
|
|
return SectionRef(DRI, this);
|
|
|
|
}
|
|
|
|
|
|
|
|
Expected<SectionRef> MachOObjectFile::getSection(StringRef SectionName) const {
|
2019-08-14 16:56:55 +08:00
|
|
|
StringRef SecName;
|
2018-07-11 18:00:29 +08:00
|
|
|
for (const SectionRef &Section : sections()) {
|
2019-08-14 16:56:55 +08:00
|
|
|
if (std::error_code E = Section.getName(SecName))
|
|
|
|
return errorCodeToError(E);
|
|
|
|
if (SecName == SectionName) {
|
2018-07-11 18:00:29 +08:00
|
|
|
return Section;
|
2019-08-14 16:56:55 +08:00
|
|
|
}
|
2018-07-11 18:00:29 +08:00
|
|
|
}
|
|
|
|
return errorCodeToError(object_error::parse_failed);
|
|
|
|
}
|
|
|
|
|
2016-05-24 20:48:46 +08:00
|
|
|
bool MachOObjectFile::isSectionCompressed(DataRefImpl Sec) const {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
bool MachOObjectFile::isSectionText(DataRefImpl Sec) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
uint32_t Flags = getSectionFlags(*this, Sec);
|
2014-10-08 23:28:58 +08:00
|
|
|
return Flags & MachO::S_ATTR_PURE_INSTRUCTIONS;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
bool MachOObjectFile::isSectionData(DataRefImpl Sec) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
uint32_t Flags = getSectionFlags(*this, Sec);
|
2014-05-20 04:36:02 +08:00
|
|
|
unsigned SectionType = Flags & MachO::SECTION_TYPE;
|
2014-10-08 23:28:58 +08:00
|
|
|
return !(Flags & MachO::S_ATTR_PURE_INSTRUCTIONS) &&
|
|
|
|
!(SectionType == MachO::S_ZEROFILL ||
|
|
|
|
SectionType == MachO::S_GB_ZEROFILL);
|
2011-09-29 04:57:30 +08:00
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
bool MachOObjectFile::isSectionBSS(DataRefImpl Sec) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
uint32_t Flags = getSectionFlags(*this, Sec);
|
2014-05-20 04:36:02 +08:00
|
|
|
unsigned SectionType = Flags & MachO::SECTION_TYPE;
|
2014-10-08 23:28:58 +08:00
|
|
|
return !(Flags & MachO::S_ATTR_PURE_INSTRUCTIONS) &&
|
|
|
|
(SectionType == MachO::S_ZEROFILL ||
|
|
|
|
SectionType == MachO::S_GB_ZEROFILL);
|
2011-09-29 04:57:30 +08:00
|
|
|
}
|
|
|
|
|
2015-06-25 03:57:32 +08:00
|
|
|
unsigned MachOObjectFile::getSectionID(SectionRef Sec) const {
|
|
|
|
return Sec.getRawDataRefImpl().d.a;
|
|
|
|
}
|
|
|
|
|
2014-10-08 23:28:58 +08:00
|
|
|
bool MachOObjectFile::isSectionVirtual(DataRefImpl Sec) const {
|
2018-04-20 01:02:57 +08:00
|
|
|
uint32_t Flags = getSectionFlags(*this, Sec);
|
|
|
|
unsigned SectionType = Flags & MachO::SECTION_TYPE;
|
|
|
|
return SectionType == MachO::S_ZEROFILL ||
|
|
|
|
SectionType == MachO::S_GB_ZEROFILL;
|
2012-04-13 04:13:57 +08:00
|
|
|
}
|
|
|
|
|
2016-03-01 03:40:10 +08:00
|
|
|
bool MachOObjectFile::isSectionBitcode(DataRefImpl Sec) const {
|
|
|
|
StringRef SegmentName = getSectionFinalSegmentName(Sec);
|
2019-05-02 18:32:03 +08:00
|
|
|
if (Expected<StringRef> NameOrErr = getSectionName(Sec))
|
|
|
|
return (SegmentName == "__LLVM" && *NameOrErr == "__bitcode");
|
2016-03-01 03:40:10 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2017-09-26 22:22:35 +08:00
|
|
|
bool MachOObjectFile::isSectionStripped(DataRefImpl Sec) const {
|
|
|
|
if (is64Bit())
|
|
|
|
return getSection64(Sec).offset == 0;
|
|
|
|
return getSection(Sec).offset == 0;
|
|
|
|
}
|
|
|
|
|
2013-09-28 05:47:05 +08:00
|
|
|
relocation_iterator MachOObjectFile::section_rel_begin(DataRefImpl Sec) const {
|
2013-04-25 20:45:46 +08:00
|
|
|
DataRefImpl Ret;
|
2014-04-04 07:51:28 +08:00
|
|
|
Ret.d.a = Sec.d.a;
|
|
|
|
Ret.d.b = 0;
|
2013-04-25 20:45:46 +08:00
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
2011-10-08 03:25:32 +08:00
|
|
|
}
|
2013-04-09 04:45:01 +08:00
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
relocation_iterator
|
2013-09-28 05:47:05 +08:00
|
|
|
MachOObjectFile::section_rel_end(DataRefImpl Sec) const {
|
2013-04-25 20:45:46 +08:00
|
|
|
uint32_t Num;
|
2013-04-19 02:08:55 +08:00
|
|
|
if (is64Bit()) {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section_64 Sect = getSection64(Sec);
|
|
|
|
Num = Sect.nreloc;
|
2013-04-19 02:08:55 +08:00
|
|
|
} else {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section Sect = getSection(Sec);
|
|
|
|
Num = Sect.nreloc;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2011-04-22 11:19:48 +08:00
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl Ret;
|
2014-04-04 07:51:28 +08:00
|
|
|
Ret.d.a = Sec.d.a;
|
|
|
|
Ret.d.b = Num;
|
2013-04-19 02:08:55 +08:00
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
|
|
|
}
|
2011-09-09 04:52:17 +08:00
|
|
|
|
2017-06-23 01:41:22 +08:00
|
|
|
relocation_iterator MachOObjectFile::extrel_begin() const {
|
|
|
|
DataRefImpl Ret;
|
2017-12-16 01:57:40 +08:00
|
|
|
// for DYSYMTAB symbols, Ret.d.a == 0 for external relocations
|
2017-06-23 01:41:22 +08:00
|
|
|
Ret.d.a = 0; // Would normally be a section index.
|
|
|
|
Ret.d.b = 0; // Index into the external relocations
|
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
|
|
|
}
|
|
|
|
|
|
|
|
relocation_iterator MachOObjectFile::extrel_end() const {
|
|
|
|
MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
|
|
|
|
DataRefImpl Ret;
|
2017-12-16 01:57:40 +08:00
|
|
|
// for DYSYMTAB symbols, Ret.d.a == 0 for external relocations
|
2017-06-23 01:41:22 +08:00
|
|
|
Ret.d.a = 0; // Would normally be a section index.
|
|
|
|
Ret.d.b = DysymtabLoadCmd.nextrel; // Index into the external relocations
|
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
|
|
|
}
|
|
|
|
|
2017-12-16 01:57:40 +08:00
|
|
|
relocation_iterator MachOObjectFile::locrel_begin() const {
|
|
|
|
DataRefImpl Ret;
|
|
|
|
// for DYSYMTAB symbols, Ret.d.a == 1 for local relocations
|
|
|
|
Ret.d.a = 1; // Would normally be a section index.
|
|
|
|
Ret.d.b = 0; // Index into the local relocations
|
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
|
|
|
}
|
|
|
|
|
|
|
|
relocation_iterator MachOObjectFile::locrel_end() const {
|
|
|
|
MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
|
|
|
|
DataRefImpl Ret;
|
|
|
|
// for DYSYMTAB symbols, Ret.d.a == 1 for local relocations
|
|
|
|
Ret.d.a = 1; // Would normally be a section index.
|
|
|
|
Ret.d.b = DysymtabLoadCmd.nlocrel; // Index into the local relocations
|
|
|
|
return relocation_iterator(RelocationRef(Ret, this));
|
|
|
|
}
|
|
|
|
|
2014-01-30 10:49:50 +08:00
|
|
|
void MachOObjectFile::moveRelocationNext(DataRefImpl &Rel) const {
|
2014-04-04 07:51:28 +08:00
|
|
|
++Rel.d.b;
|
2011-09-09 04:52:17 +08:00
|
|
|
}
|
2011-10-25 07:20:07 +08:00
|
|
|
|
2015-06-30 07:29:12 +08:00
|
|
|
uint64_t MachOObjectFile::getRelocationOffset(DataRefImpl Rel) const {
|
2017-06-23 01:41:22 +08:00
|
|
|
assert((getHeader().filetype == MachO::MH_OBJECT ||
|
|
|
|
getHeader().filetype == MachO::MH_KEXT_BUNDLE) &&
|
|
|
|
"Only implemented for MH_OBJECT && MH_KEXT_BUNDLE");
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::any_relocation_info RE = getRelocation(Rel);
|
2015-06-30 07:29:12 +08:00
|
|
|
return getAnyRelocationAddress(RE);
|
2012-03-01 09:36:50 +08:00
|
|
|
}
|
|
|
|
|
2013-06-05 09:33:53 +08:00
|
|
|
symbol_iterator
|
|
|
|
MachOObjectFile::getRelocationSymbol(DataRefImpl Rel) const {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::any_relocation_info RE = getRelocation(Rel);
|
2014-07-04 18:57:56 +08:00
|
|
|
if (isRelocationScattered(RE))
|
|
|
|
return symbol_end();
|
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
uint32_t SymbolIdx = getPlainRelocationSymbolNum(RE);
|
|
|
|
bool isExtern = getPlainRelocationExternal(RE);
|
2013-06-05 09:33:53 +08:00
|
|
|
if (!isExtern)
|
2014-02-11 04:24:04 +08:00
|
|
|
return symbol_end();
|
2013-04-19 02:08:55 +08:00
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::symtab_command S = getSymtabLoadCommand();
|
2013-04-25 03:47:55 +08:00
|
|
|
unsigned SymbolTableEntrySize = is64Bit() ?
|
2013-09-01 12:28:48 +08:00
|
|
|
sizeof(MachO::nlist_64) :
|
|
|
|
sizeof(MachO::nlist);
|
|
|
|
uint64_t Offset = S.symoff + SymbolIdx * SymbolTableEntrySize;
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl Sym;
|
2016-12-04 09:56:10 +08:00
|
|
|
Sym.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
|
2013-06-05 09:33:53 +08:00
|
|
|
return symbol_iterator(SymbolRef(Sym, this));
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2015-05-22 05:24:32 +08:00
|
|
|
section_iterator
|
|
|
|
MachOObjectFile::getRelocationSection(DataRefImpl Rel) const {
|
|
|
|
return section_iterator(getAnyRelocationSection(getRelocation(Rel)));
|
|
|
|
}
|
|
|
|
|
2015-06-30 09:53:01 +08:00
|
|
|
uint64_t MachOObjectFile::getRelocationType(DataRefImpl Rel) const {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::any_relocation_info RE = getRelocation(Rel);
|
2015-06-30 09:53:01 +08:00
|
|
|
return getAnyRelocationType(RE);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2015-06-30 12:08:37 +08:00
|
|
|
void MachOObjectFile::getRelocationTypeName(
|
|
|
|
DataRefImpl Rel, SmallVectorImpl<char> &Result) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
StringRef res;
|
2015-06-30 09:53:01 +08:00
|
|
|
uint64_t RType = getRelocationType(Rel);
|
2013-04-19 02:08:55 +08:00
|
|
|
|
|
|
|
unsigned Arch = this->getArch();
|
|
|
|
|
|
|
|
switch (Arch) {
|
|
|
|
case Triple::x86: {
|
|
|
|
static const char *const Table[] = {
|
|
|
|
"GENERIC_RELOC_VANILLA",
|
|
|
|
"GENERIC_RELOC_PAIR",
|
|
|
|
"GENERIC_RELOC_SECTDIFF",
|
|
|
|
"GENERIC_RELOC_PB_LA_PTR",
|
|
|
|
"GENERIC_RELOC_LOCAL_SECTDIFF",
|
|
|
|
"GENERIC_RELOC_TLV" };
|
|
|
|
|
2013-12-06 10:33:38 +08:00
|
|
|
if (RType > 5)
|
2013-04-19 02:08:55 +08:00
|
|
|
res = "Unknown";
|
|
|
|
else
|
|
|
|
res = Table[RType];
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Triple::x86_64: {
|
|
|
|
static const char *const Table[] = {
|
|
|
|
"X86_64_RELOC_UNSIGNED",
|
|
|
|
"X86_64_RELOC_SIGNED",
|
|
|
|
"X86_64_RELOC_BRANCH",
|
|
|
|
"X86_64_RELOC_GOT_LOAD",
|
|
|
|
"X86_64_RELOC_GOT",
|
|
|
|
"X86_64_RELOC_SUBTRACTOR",
|
|
|
|
"X86_64_RELOC_SIGNED_1",
|
|
|
|
"X86_64_RELOC_SIGNED_2",
|
|
|
|
"X86_64_RELOC_SIGNED_4",
|
|
|
|
"X86_64_RELOC_TLV" };
|
|
|
|
|
|
|
|
if (RType > 9)
|
|
|
|
res = "Unknown";
|
|
|
|
else
|
|
|
|
res = Table[RType];
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Triple::arm: {
|
|
|
|
static const char *const Table[] = {
|
|
|
|
"ARM_RELOC_VANILLA",
|
|
|
|
"ARM_RELOC_PAIR",
|
|
|
|
"ARM_RELOC_SECTDIFF",
|
|
|
|
"ARM_RELOC_LOCAL_SECTDIFF",
|
|
|
|
"ARM_RELOC_PB_LA_PTR",
|
|
|
|
"ARM_RELOC_BR24",
|
|
|
|
"ARM_THUMB_RELOC_BR22",
|
|
|
|
"ARM_THUMB_32BIT_BRANCH",
|
|
|
|
"ARM_RELOC_HALF",
|
|
|
|
"ARM_RELOC_HALF_SECTDIFF" };
|
|
|
|
|
|
|
|
if (RType > 9)
|
|
|
|
res = "Unknown";
|
|
|
|
else
|
|
|
|
res = Table[RType];
|
|
|
|
break;
|
|
|
|
}
|
2019-05-14 19:25:44 +08:00
|
|
|
case Triple::aarch64:
|
|
|
|
case Triple::aarch64_32: {
|
2014-03-29 18:18:08 +08:00
|
|
|
static const char *const Table[] = {
|
|
|
|
"ARM64_RELOC_UNSIGNED", "ARM64_RELOC_SUBTRACTOR",
|
|
|
|
"ARM64_RELOC_BRANCH26", "ARM64_RELOC_PAGE21",
|
|
|
|
"ARM64_RELOC_PAGEOFF12", "ARM64_RELOC_GOT_LOAD_PAGE21",
|
|
|
|
"ARM64_RELOC_GOT_LOAD_PAGEOFF12", "ARM64_RELOC_POINTER_TO_GOT",
|
|
|
|
"ARM64_RELOC_TLVP_LOAD_PAGE21", "ARM64_RELOC_TLVP_LOAD_PAGEOFF12",
|
|
|
|
"ARM64_RELOC_ADDEND"
|
|
|
|
};
|
|
|
|
|
|
|
|
if (RType >= array_lengthof(Table))
|
|
|
|
res = "Unknown";
|
|
|
|
else
|
|
|
|
res = Table[RType];
|
|
|
|
break;
|
|
|
|
}
|
2013-04-19 02:08:55 +08:00
|
|
|
case Triple::ppc: {
|
|
|
|
static const char *const Table[] = {
|
|
|
|
"PPC_RELOC_VANILLA",
|
|
|
|
"PPC_RELOC_PAIR",
|
|
|
|
"PPC_RELOC_BR14",
|
|
|
|
"PPC_RELOC_BR24",
|
|
|
|
"PPC_RELOC_HI16",
|
|
|
|
"PPC_RELOC_LO16",
|
|
|
|
"PPC_RELOC_HA16",
|
|
|
|
"PPC_RELOC_LO14",
|
|
|
|
"PPC_RELOC_SECTDIFF",
|
|
|
|
"PPC_RELOC_PB_LA_PTR",
|
|
|
|
"PPC_RELOC_HI16_SECTDIFF",
|
|
|
|
"PPC_RELOC_LO16_SECTDIFF",
|
|
|
|
"PPC_RELOC_HA16_SECTDIFF",
|
|
|
|
"PPC_RELOC_JBSR",
|
|
|
|
"PPC_RELOC_LO14_SECTDIFF",
|
|
|
|
"PPC_RELOC_LOCAL_SECTDIFF" };
|
|
|
|
|
2013-12-06 10:33:38 +08:00
|
|
|
if (RType > 15)
|
|
|
|
res = "Unknown";
|
|
|
|
else
|
|
|
|
res = Table[RType];
|
2013-04-19 02:08:55 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Triple::UnknownArch:
|
|
|
|
res = "Unknown";
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
Result.append(res.begin(), res.end());
|
|
|
|
}
|
|
|
|
|
2015-05-31 03:44:53 +08:00
|
|
|
uint8_t MachOObjectFile::getRelocationLength(DataRefImpl Rel) const {
|
|
|
|
MachO::any_relocation_info RE = getRelocation(Rel);
|
|
|
|
return getAnyRelocationLength(RE);
|
|
|
|
}
|
|
|
|
|
2014-06-06 05:21:57 +08:00
|
|
|
//
|
|
|
|
// guessLibraryShortName() is passed a name of a dynamic library and returns a
|
|
|
|
// guess on what the short name is. Then name is returned as a substring of the
|
|
|
|
// StringRef Name passed in. The name of the dynamic library is recognized as
|
|
|
|
// a framework if it has one of the two following forms:
|
|
|
|
// Foo.framework/Versions/A/Foo
|
|
|
|
// Foo.framework/Foo
|
|
|
|
// Where A and Foo can be any string. And may contain a trailing suffix
|
|
|
|
// starting with an underbar. If the Name is recognized as a framework then
|
|
|
|
// isFramework is set to true else it is set to false. If the Name has a
|
|
|
|
// suffix then Suffix is set to the substring in Name that contains the suffix
|
|
|
|
// else it is set to a NULL StringRef.
|
|
|
|
//
|
|
|
|
// The Name of the dynamic library is recognized as a library name if it has
|
|
|
|
// one of the two following forms:
|
|
|
|
// libFoo.A.dylib
|
|
|
|
// libFoo.dylib
|
2019-01-25 04:59:44 +08:00
|
|
|
//
|
2014-06-06 05:21:57 +08:00
|
|
|
// The library may have a suffix trailing the name Foo of the form:
|
|
|
|
// libFoo_profile.A.dylib
|
|
|
|
// libFoo_profile.dylib
|
2019-01-25 04:59:44 +08:00
|
|
|
// These dyld image suffixes are separated from the short name by a '_'
|
|
|
|
// character. Because the '_' character is commonly used to separate words in
|
|
|
|
// filenames guessLibraryShortName() cannot reliably separate a dylib's short
|
|
|
|
// name from an arbitrary image suffix; imagine if both the short name and the
|
|
|
|
// suffix contains an '_' character! To better deal with this ambiguity,
|
|
|
|
// guessLibraryShortName() will recognize only "_debug" and "_profile" as valid
|
|
|
|
// Suffix values. Calling code needs to be tolerant of guessLibraryShortName()
|
|
|
|
// guessing incorrectly.
|
2014-06-06 05:21:57 +08:00
|
|
|
//
|
|
|
|
// The Name of the dynamic library is also recognized as a library name if it
|
|
|
|
// has the following form:
|
|
|
|
// Foo.qtx
|
|
|
|
//
|
|
|
|
// If the Name of the dynamic library is none of the forms above then a NULL
|
|
|
|
// StringRef is returned.
|
|
|
|
StringRef MachOObjectFile::guessLibraryShortName(StringRef Name,
|
|
|
|
bool &isFramework,
|
|
|
|
StringRef &Suffix) {
|
|
|
|
StringRef Foo, F, DotFramework, V, Dylib, Lib, Dot, Qtx;
|
|
|
|
size_t a, b, c, d, Idx;
|
|
|
|
|
|
|
|
isFramework = false;
|
|
|
|
Suffix = StringRef();
|
|
|
|
|
|
|
|
// Pull off the last component and make Foo point to it
|
|
|
|
a = Name.rfind('/');
|
|
|
|
if (a == Name.npos || a == 0)
|
|
|
|
goto guess_library;
|
|
|
|
Foo = Name.slice(a+1, Name.npos);
|
|
|
|
|
|
|
|
// Look for a suffix starting with a '_'
|
|
|
|
Idx = Foo.rfind('_');
|
|
|
|
if (Idx != Foo.npos && Foo.size() >= 2) {
|
|
|
|
Suffix = Foo.slice(Idx, Foo.npos);
|
2019-01-25 04:59:44 +08:00
|
|
|
if (Suffix != "_debug" && Suffix != "_profile")
|
|
|
|
Suffix = StringRef();
|
|
|
|
else
|
|
|
|
Foo = Foo.slice(0, Idx);
|
2014-06-06 05:21:57 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// First look for the form Foo.framework/Foo
|
|
|
|
b = Name.rfind('/', a);
|
|
|
|
if (b == Name.npos)
|
|
|
|
Idx = 0;
|
|
|
|
else
|
|
|
|
Idx = b+1;
|
|
|
|
F = Name.slice(Idx, Idx + Foo.size());
|
|
|
|
DotFramework = Name.slice(Idx + Foo.size(),
|
|
|
|
Idx + Foo.size() + sizeof(".framework/")-1);
|
|
|
|
if (F == Foo && DotFramework == ".framework/") {
|
|
|
|
isFramework = true;
|
|
|
|
return Foo;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Next look for the form Foo.framework/Versions/A/Foo
|
|
|
|
if (b == Name.npos)
|
|
|
|
goto guess_library;
|
|
|
|
c = Name.rfind('/', b);
|
|
|
|
if (c == Name.npos || c == 0)
|
|
|
|
goto guess_library;
|
|
|
|
V = Name.slice(c+1, Name.npos);
|
|
|
|
if (!V.startswith("Versions/"))
|
|
|
|
goto guess_library;
|
|
|
|
d = Name.rfind('/', c);
|
|
|
|
if (d == Name.npos)
|
|
|
|
Idx = 0;
|
|
|
|
else
|
|
|
|
Idx = d+1;
|
|
|
|
F = Name.slice(Idx, Idx + Foo.size());
|
|
|
|
DotFramework = Name.slice(Idx + Foo.size(),
|
|
|
|
Idx + Foo.size() + sizeof(".framework/")-1);
|
|
|
|
if (F == Foo && DotFramework == ".framework/") {
|
|
|
|
isFramework = true;
|
|
|
|
return Foo;
|
|
|
|
}
|
|
|
|
|
|
|
|
guess_library:
|
|
|
|
// pull off the suffix after the "." and make a point to it
|
|
|
|
a = Name.rfind('.');
|
|
|
|
if (a == Name.npos || a == 0)
|
|
|
|
return StringRef();
|
|
|
|
Dylib = Name.slice(a, Name.npos);
|
|
|
|
if (Dylib != ".dylib")
|
|
|
|
goto guess_qtx;
|
|
|
|
|
|
|
|
// First pull off the version letter for the form Foo.A.dylib if any.
|
|
|
|
if (a >= 3) {
|
|
|
|
Dot = Name.slice(a-2, a-1);
|
|
|
|
if (Dot == ".")
|
|
|
|
a = a - 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
b = Name.rfind('/', a);
|
|
|
|
if (b == Name.npos)
|
|
|
|
b = 0;
|
|
|
|
else
|
|
|
|
b = b+1;
|
|
|
|
// ignore any suffix after an underbar like Foo_profile.A.dylib
|
2019-01-25 04:59:44 +08:00
|
|
|
Idx = Name.rfind('_');
|
2014-06-06 05:21:57 +08:00
|
|
|
if (Idx != Name.npos && Idx != b) {
|
|
|
|
Lib = Name.slice(b, Idx);
|
|
|
|
Suffix = Name.slice(Idx, a);
|
2019-01-25 04:59:44 +08:00
|
|
|
if (Suffix != "_debug" && Suffix != "_profile") {
|
|
|
|
Suffix = StringRef();
|
|
|
|
Lib = Name.slice(b, a);
|
|
|
|
}
|
2014-06-06 05:21:57 +08:00
|
|
|
}
|
|
|
|
else
|
|
|
|
Lib = Name.slice(b, a);
|
|
|
|
// There are incorrect library names of the form:
|
|
|
|
// libATS.A_profile.dylib so check for these.
|
|
|
|
if (Lib.size() >= 3) {
|
|
|
|
Dot = Lib.slice(Lib.size()-2, Lib.size()-1);
|
|
|
|
if (Dot == ".")
|
|
|
|
Lib = Lib.slice(0, Lib.size()-2);
|
|
|
|
}
|
|
|
|
return Lib;
|
|
|
|
|
|
|
|
guess_qtx:
|
|
|
|
Qtx = Name.slice(a, Name.npos);
|
|
|
|
if (Qtx != ".qtx")
|
|
|
|
return StringRef();
|
|
|
|
b = Name.rfind('/', a);
|
|
|
|
if (b == Name.npos)
|
|
|
|
Lib = Name.slice(0, a);
|
|
|
|
else
|
|
|
|
Lib = Name.slice(b+1, a);
|
|
|
|
// There are library names of the form: QT.A.qtx so check for these.
|
|
|
|
if (Lib.size() >= 3) {
|
|
|
|
Dot = Lib.slice(Lib.size()-2, Lib.size()-1);
|
|
|
|
if (Dot == ".")
|
|
|
|
Lib = Lib.slice(0, Lib.size()-2);
|
|
|
|
}
|
|
|
|
return Lib;
|
|
|
|
}
|
|
|
|
|
|
|
|
// getLibraryShortNameByIndex() is used to get the short name of the library
|
|
|
|
// for an undefined symbol in a linked Mach-O binary that was linked with the
|
|
|
|
// normal two-level namespace default (that is MH_TWOLEVEL in the header).
|
|
|
|
// It is passed the index (0 - based) of the library as translated from
|
|
|
|
// GET_LIBRARY_ORDINAL (1 - based).
|
2014-06-13 05:46:39 +08:00
|
|
|
std::error_code MachOObjectFile::getLibraryShortNameByIndex(unsigned Index,
|
2014-08-30 08:20:14 +08:00
|
|
|
StringRef &Res) const {
|
2014-06-06 05:21:57 +08:00
|
|
|
if (Index >= Libraries.size())
|
|
|
|
return object_error::parse_failed;
|
|
|
|
|
|
|
|
// If the cache of LibrariesShortNames is not built up do that first for
|
|
|
|
// all the Libraries.
|
|
|
|
if (LibrariesShortNames.size() == 0) {
|
|
|
|
for (unsigned i = 0; i < Libraries.size(); i++) {
|
2019-06-05 00:55:30 +08:00
|
|
|
auto CommandOrErr =
|
|
|
|
getStructOrErr<MachO::dylib_command>(*this, Libraries[i]);
|
|
|
|
if (!CommandOrErr)
|
|
|
|
return object_error::parse_failed;
|
|
|
|
MachO::dylib_command D = CommandOrErr.get();
|
2014-09-17 08:25:22 +08:00
|
|
|
if (D.dylib.name >= D.cmdsize)
|
|
|
|
return object_error::parse_failed;
|
2014-06-21 02:07:34 +08:00
|
|
|
const char *P = (const char *)(Libraries[i]) + D.dylib.name;
|
2014-06-06 05:21:57 +08:00
|
|
|
StringRef Name = StringRef(P);
|
2014-09-17 08:25:22 +08:00
|
|
|
if (D.dylib.name+Name.size() >= D.cmdsize)
|
|
|
|
return object_error::parse_failed;
|
2014-06-06 05:21:57 +08:00
|
|
|
StringRef Suffix;
|
|
|
|
bool isFramework;
|
|
|
|
StringRef shortName = guessLibraryShortName(Name, isFramework, Suffix);
|
2014-09-17 08:25:22 +08:00
|
|
|
if (shortName.empty())
|
2014-06-06 05:21:57 +08:00
|
|
|
LibrariesShortNames.push_back(Name);
|
|
|
|
else
|
|
|
|
LibrariesShortNames.push_back(shortName);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
Res = LibrariesShortNames[Index];
|
2015-06-09 23:20:42 +08:00
|
|
|
return std::error_code();
|
2014-06-06 05:21:57 +08:00
|
|
|
}
|
|
|
|
|
2017-03-01 05:47:07 +08:00
|
|
|
uint32_t MachOObjectFile::getLibraryCount() const {
|
|
|
|
return Libraries.size();
|
|
|
|
}
|
|
|
|
|
Remove getRelocationAddress.
Originally added in r139314.
Back then it didn't actually get the address, it got whatever value the
relocation used: address or offset.
The values in different object formats are:
* MachO: Always an offset.
* COFF: Always an address, but when talking about the virtual address of
sections it says: "for simplicity, compilers should set this to zero".
* ELF: An offset for .o files and and address for .so files. In the case of the
.so, the relocation in not linked to any section (sh_info is 0). We can't
really compute an offset.
Some API mappings would be:
* Use getAddress for everything. It would be quite cumbersome. To compute the
address elf has to follow sh_info, which can be corrupted and therefore the
method has to return an ErrorOr. The address of the section is also the same
for every relocation in a section, so we shouldn't have to check the error
and fetch the value for every relocation.
* Use a getValue and make it up to the user to know what it is getting.
* Use a getOffset and:
* Assert for dynamic ELF objects. That is a very peculiar case and it is
probably fair to ask any tool that wants to support it to use ELF.h. The
only tool we have that reads those (llvm-readobj) already does that. The
only other use case I can think of is a dynamic linker.
* Check that COFF .obj files have sections with zero virtual address spaces. If
it turns out that some assembler/compiler produces these, we can change
COFFObjectFile::getRelocationOffset to subtract it. Given COFF format,
this can be done without the need for ErrorOr.
The getRelocationAddress method was never implemented for COFF. It also
had exactly one use in a very peculiar case: a shortcut for adding the
section value to a pcrel reloc on MachO.
Given that, I don't expect that there is any use out there of the C API. If
that is not the case, let me know and I will add it back with the implementation
inlined and do a proper deprecation.
llvm-svn: 241450
2015-07-06 22:55:37 +08:00
|
|
|
section_iterator
|
|
|
|
MachOObjectFile::getRelocationRelocatedSection(relocation_iterator Rel) const {
|
|
|
|
DataRefImpl Sec;
|
|
|
|
Sec.d.a = Rel->getRawDataRefImpl().d.a;
|
|
|
|
return section_iterator(SectionRef(Sec, this));
|
|
|
|
}
|
|
|
|
|
2016-11-22 11:38:40 +08:00
|
|
|
basic_symbol_iterator MachOObjectFile::symbol_begin() const {
|
2016-01-23 06:49:55 +08:00
|
|
|
DataRefImpl DRI;
|
|
|
|
MachO::symtab_command Symtab = getSymtabLoadCommand();
|
|
|
|
if (!SymtabLoadCmd || Symtab.nsyms == 0)
|
|
|
|
return basic_symbol_iterator(SymbolRef(DRI, this));
|
|
|
|
|
2014-05-13 05:39:59 +08:00
|
|
|
return getSymbolByIndex(0);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2016-11-22 11:38:40 +08:00
|
|
|
basic_symbol_iterator MachOObjectFile::symbol_end() const {
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl DRI;
|
2016-01-23 06:49:55 +08:00
|
|
|
MachO::symtab_command Symtab = getSymtabLoadCommand();
|
|
|
|
if (!SymtabLoadCmd || Symtab.nsyms == 0)
|
2014-02-22 04:10:59 +08:00
|
|
|
return basic_symbol_iterator(SymbolRef(DRI, this));
|
2013-04-25 03:47:55 +08:00
|
|
|
|
|
|
|
unsigned SymbolTableEntrySize = is64Bit() ?
|
2013-09-01 12:28:48 +08:00
|
|
|
sizeof(MachO::nlist_64) :
|
|
|
|
sizeof(MachO::nlist);
|
|
|
|
unsigned Offset = Symtab.symoff +
|
|
|
|
Symtab.nsyms * SymbolTableEntrySize;
|
2016-12-04 09:56:10 +08:00
|
|
|
DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
|
2014-02-22 04:10:59 +08:00
|
|
|
return basic_symbol_iterator(SymbolRef(DRI, this));
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2019-01-15 06:05:12 +08:00
|
|
|
symbol_iterator MachOObjectFile::getSymbolByIndex(unsigned Index) const {
|
2014-05-13 05:39:59 +08:00
|
|
|
MachO::symtab_command Symtab = getSymtabLoadCommand();
|
2016-01-23 06:49:55 +08:00
|
|
|
if (!SymtabLoadCmd || Index >= Symtab.nsyms)
|
2015-01-16 06:52:38 +08:00
|
|
|
report_fatal_error("Requested symbol index is out of range.");
|
2014-05-13 05:39:59 +08:00
|
|
|
unsigned SymbolTableEntrySize =
|
|
|
|
is64Bit() ? sizeof(MachO::nlist_64) : sizeof(MachO::nlist);
|
2016-01-23 06:49:55 +08:00
|
|
|
DataRefImpl DRI;
|
2016-12-04 09:56:10 +08:00
|
|
|
DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Symtab.symoff));
|
2014-05-13 05:39:59 +08:00
|
|
|
DRI.p += Index * SymbolTableEntrySize;
|
|
|
|
return basic_symbol_iterator(SymbolRef(DRI, this));
|
|
|
|
}
|
|
|
|
|
2016-04-21 05:24:34 +08:00
|
|
|
uint64_t MachOObjectFile::getSymbolIndex(DataRefImpl Symb) const {
|
|
|
|
MachO::symtab_command Symtab = getSymtabLoadCommand();
|
|
|
|
if (!SymtabLoadCmd)
|
|
|
|
report_fatal_error("getSymbolIndex() called with no symbol table symbol");
|
|
|
|
unsigned SymbolTableEntrySize =
|
|
|
|
is64Bit() ? sizeof(MachO::nlist_64) : sizeof(MachO::nlist);
|
|
|
|
DataRefImpl DRIstart;
|
2016-12-04 09:56:10 +08:00
|
|
|
DRIstart.p = reinterpret_cast<uintptr_t>(getPtr(*this, Symtab.symoff));
|
2016-04-21 05:24:34 +08:00
|
|
|
uint64_t Index = (Symb.p - DRIstart.p) / SymbolTableEntrySize;
|
|
|
|
return Index;
|
|
|
|
}
|
|
|
|
|
2014-02-11 04:24:04 +08:00
|
|
|
section_iterator MachOObjectFile::section_begin() const {
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl DRI;
|
|
|
|
return section_iterator(SectionRef(DRI, this));
|
|
|
|
}
|
|
|
|
|
2014-02-11 04:24:04 +08:00
|
|
|
section_iterator MachOObjectFile::section_end() const {
|
2013-04-19 02:08:55 +08:00
|
|
|
DataRefImpl DRI;
|
|
|
|
DRI.d.a = Sections.size();
|
|
|
|
return section_iterator(SectionRef(DRI, this));
|
|
|
|
}
|
|
|
|
|
|
|
|
uint8_t MachOObjectFile::getBytesInAddress() const {
|
2013-04-08 03:05:30 +08:00
|
|
|
return is64Bit() ? 8 : 4;
|
2011-04-22 11:19:48 +08:00
|
|
|
}
|
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
StringRef MachOObjectFile::getFileFormatName() const {
|
2016-12-04 09:56:10 +08:00
|
|
|
unsigned CPUType = getCPUType(*this);
|
2013-04-19 02:08:55 +08:00
|
|
|
if (!is64Bit()) {
|
|
|
|
switch (CPUType) {
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_I386:
|
2013-04-19 02:08:55 +08:00
|
|
|
return "Mach-O 32-bit i386";
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_ARM:
|
2013-04-19 02:08:55 +08:00
|
|
|
return "Mach-O arm";
|
2019-05-14 19:25:44 +08:00
|
|
|
case MachO::CPU_TYPE_ARM64_32:
|
|
|
|
return "Mach-O arm64 (ILP32)";
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_POWERPC:
|
2013-04-19 02:08:55 +08:00
|
|
|
return "Mach-O 32-bit ppc";
|
|
|
|
default:
|
|
|
|
return "Mach-O 32-bit unknown";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (CPUType) {
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_X86_64:
|
2013-04-19 02:08:55 +08:00
|
|
|
return "Mach-O 64-bit x86-64";
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_ARM64:
|
2014-03-29 18:18:08 +08:00
|
|
|
return "Mach-O arm64";
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_POWERPC64:
|
2013-04-19 02:08:55 +08:00
|
|
|
return "Mach-O 64-bit ppc64";
|
|
|
|
default:
|
|
|
|
return "Mach-O 64-bit unknown";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-06-18 23:03:28 +08:00
|
|
|
Triple::ArchType MachOObjectFile::getArch(uint32_t CPUType) {
|
|
|
|
switch (CPUType) {
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_I386:
|
2013-04-19 02:08:55 +08:00
|
|
|
return Triple::x86;
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_X86_64:
|
2013-04-19 02:08:55 +08:00
|
|
|
return Triple::x86_64;
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_ARM:
|
2013-04-19 02:08:55 +08:00
|
|
|
return Triple::arm;
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_ARM64:
|
2014-07-23 20:32:47 +08:00
|
|
|
return Triple::aarch64;
|
2019-05-14 19:25:44 +08:00
|
|
|
case MachO::CPU_TYPE_ARM64_32:
|
|
|
|
return Triple::aarch64_32;
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_POWERPC:
|
2013-04-19 02:08:55 +08:00
|
|
|
return Triple::ppc;
|
2017-04-22 06:03:05 +08:00
|
|
|
case MachO::CPU_TYPE_POWERPC64:
|
2013-04-19 02:08:55 +08:00
|
|
|
return Triple::ppc64;
|
|
|
|
default:
|
|
|
|
return Triple::UnknownArch;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-23 07:21:13 +08:00
|
|
|
Triple MachOObjectFile::getArchTriple(uint32_t CPUType, uint32_t CPUSubType,
|
2016-12-17 06:54:02 +08:00
|
|
|
const char **McpuDefault,
|
|
|
|
const char **ArchFlag) {
|
2014-08-19 04:21:02 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = nullptr;
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = nullptr;
|
2014-08-19 04:21:02 +08:00
|
|
|
|
2014-07-01 02:45:23 +08:00
|
|
|
switch (CPUType) {
|
|
|
|
case MachO::CPU_TYPE_I386:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_I386_ALL:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "i386";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("i386-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
case MachO::CPU_TYPE_X86_64:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_X86_64_ALL:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "x86_64";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("x86_64-apple-darwin");
|
|
|
|
case MachO::CPU_SUBTYPE_X86_64_H:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "x86_64h";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("x86_64h-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
case MachO::CPU_TYPE_ARM:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_ARM_V4T:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv4t";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv4t-apple-darwin");
|
|
|
|
case MachO::CPU_SUBTYPE_ARM_V5TEJ:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv5e";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv5e-apple-darwin");
|
2014-08-08 05:30:25 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_XSCALE:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "xscale";
|
2014-08-08 05:30:25 +08:00
|
|
|
return Triple("xscale-apple-darwin");
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_V6:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv6";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv6-apple-darwin");
|
|
|
|
case MachO::CPU_SUBTYPE_ARM_V6M:
|
2014-08-19 04:21:02 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cortex-m0";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv6m";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv6m-apple-darwin");
|
2014-08-08 05:30:25 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_V7:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv7";
|
2014-08-08 05:30:25 +08:00
|
|
|
return Triple("armv7-apple-darwin");
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_V7EM:
|
2014-08-19 04:21:02 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cortex-m4";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv7em";
|
2016-04-23 07:21:13 +08:00
|
|
|
return Triple("thumbv7em-apple-darwin");
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_V7K:
|
2017-01-25 07:41:04 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cortex-a7";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv7k";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv7k-apple-darwin");
|
|
|
|
case MachO::CPU_SUBTYPE_ARM_V7M:
|
2014-08-19 04:21:02 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cortex-m3";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv7m";
|
2016-04-23 07:21:13 +08:00
|
|
|
return Triple("thumbv7m-apple-darwin");
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_SUBTYPE_ARM_V7S:
|
2017-01-25 07:41:04 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cortex-a7";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "armv7s";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("armv7s-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
case MachO::CPU_TYPE_ARM64:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_ARM64_ALL:
|
2017-02-11 03:27:10 +08:00
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cyclone";
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "arm64";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("arm64-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
2019-05-14 19:25:44 +08:00
|
|
|
case MachO::CPU_TYPE_ARM64_32:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_ARM64_32_V8:
|
|
|
|
if (McpuDefault)
|
|
|
|
*McpuDefault = "cyclone";
|
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "arm64_32";
|
|
|
|
return Triple("arm64_32-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_TYPE_POWERPC:
|
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
|
|
|
case MachO::CPU_SUBTYPE_POWERPC_ALL:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "ppc";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("ppc-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
case MachO::CPU_TYPE_POWERPC64:
|
2014-07-01 04:12:59 +08:00
|
|
|
switch (CPUSubType & ~MachO::CPU_SUBTYPE_MASK) {
|
2014-07-01 02:45:23 +08:00
|
|
|
case MachO::CPU_SUBTYPE_POWERPC_ALL:
|
2016-12-17 06:54:02 +08:00
|
|
|
if (ArchFlag)
|
|
|
|
*ArchFlag = "ppc64";
|
2014-07-01 02:45:23 +08:00
|
|
|
return Triple("ppc64-apple-darwin");
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
return Triple();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
Triple MachOObjectFile::getHostArch() {
|
|
|
|
return Triple(sys::getDefaultTargetTriple());
|
|
|
|
}
|
|
|
|
|
2014-08-09 00:30:17 +08:00
|
|
|
bool MachOObjectFile::isValidArch(StringRef ArchFlag) {
|
2019-07-19 05:01:21 +08:00
|
|
|
auto validArchs = getValidArchs();
|
|
|
|
return llvm::find(validArchs, ArchFlag) != validArchs.end();
|
2014-07-01 02:45:23 +08:00
|
|
|
}
|
|
|
|
|
2019-07-19 05:01:21 +08:00
|
|
|
ArrayRef<StringRef> MachOObjectFile::getValidArchs() {
|
|
|
|
static const std::array<StringRef, 17> validArchs = {
|
|
|
|
"i386", "x86_64", "x86_64h", "armv4t", "arm", "armv5e",
|
|
|
|
"armv6", "armv6m", "armv7", "armv7em", "armv7k", "armv7m",
|
|
|
|
"armv7s", "arm64", "arm64_32", "ppc", "ppc64",
|
|
|
|
};
|
|
|
|
|
|
|
|
return validArchs;
|
|
|
|
}
|
2019-07-04 08:17:02 +08:00
|
|
|
|
2017-12-15 06:07:03 +08:00
|
|
|
Triple::ArchType MachOObjectFile::getArch() const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getArch(getCPUType(*this));
|
2013-06-18 23:03:28 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 07:21:13 +08:00
|
|
|
Triple MachOObjectFile::getArchTriple(const char **McpuDefault) const {
|
|
|
|
return getArchTriple(Header.cputype, Header.cpusubtype, McpuDefault);
|
2014-08-19 04:21:02 +08:00
|
|
|
}
|
|
|
|
|
2013-09-28 05:47:05 +08:00
|
|
|
relocation_iterator MachOObjectFile::section_rel_begin(unsigned Index) const {
|
2013-04-27 04:07:33 +08:00
|
|
|
DataRefImpl DRI;
|
|
|
|
DRI.d.a = Index;
|
2013-09-28 05:47:05 +08:00
|
|
|
return section_rel_begin(DRI);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-28 05:47:05 +08:00
|
|
|
relocation_iterator MachOObjectFile::section_rel_end(unsigned Index) const {
|
2013-04-27 04:07:33 +08:00
|
|
|
DataRefImpl DRI;
|
|
|
|
DRI.d.a = Index;
|
2013-09-28 05:47:05 +08:00
|
|
|
return section_rel_end(DRI);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-06-07 01:20:50 +08:00
|
|
|
dice_iterator MachOObjectFile::begin_dices() const {
|
|
|
|
DataRefImpl DRI;
|
|
|
|
if (!DataInCodeLoadCmd)
|
|
|
|
return dice_iterator(DiceRef(DRI, this));
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::linkedit_data_command DicLC = getDataInCodeLoadCommand();
|
2016-12-04 09:56:10 +08:00
|
|
|
DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, DicLC.dataoff));
|
2013-06-07 01:20:50 +08:00
|
|
|
return dice_iterator(DiceRef(DRI, this));
|
|
|
|
}
|
|
|
|
|
|
|
|
dice_iterator MachOObjectFile::end_dices() const {
|
|
|
|
DataRefImpl DRI;
|
|
|
|
if (!DataInCodeLoadCmd)
|
|
|
|
return dice_iterator(DiceRef(DRI, this));
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::linkedit_data_command DicLC = getDataInCodeLoadCommand();
|
|
|
|
unsigned Offset = DicLC.dataoff + DicLC.datasize;
|
2016-12-04 09:56:10 +08:00
|
|
|
DRI.p = reinterpret_cast<uintptr_t>(getPtr(*this, Offset));
|
2013-06-07 01:20:50 +08:00
|
|
|
return dice_iterator(DiceRef(DRI, this));
|
|
|
|
}
|
|
|
|
|
2017-07-21 07:08:41 +08:00
|
|
|
ExportEntry::ExportEntry(Error *E, const MachOObjectFile *O,
|
|
|
|
ArrayRef<uint8_t> T) : E(E), O(O), Trie(T) {}
|
2014-08-30 08:20:14 +08:00
|
|
|
|
|
|
|
void ExportEntry::moveToFirst() {
|
2017-07-21 07:08:41 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(E);
|
2014-08-30 08:20:14 +08:00
|
|
|
pushNode(0);
|
2017-07-21 07:08:41 +08:00
|
|
|
if (*E)
|
|
|
|
return;
|
2014-08-30 08:20:14 +08:00
|
|
|
pushDownUntilBottom();
|
|
|
|
}
|
|
|
|
|
|
|
|
void ExportEntry::moveToEnd() {
|
|
|
|
Stack.clear();
|
|
|
|
Done = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool ExportEntry::operator==(const ExportEntry &Other) const {
|
2015-09-22 19:14:12 +08:00
|
|
|
// Common case, one at end, other iterating from begin.
|
2014-08-30 08:20:14 +08:00
|
|
|
if (Done || Other.Done)
|
|
|
|
return (Done == Other.Done);
|
|
|
|
// Not equal if different stack sizes.
|
|
|
|
if (Stack.size() != Other.Stack.size())
|
|
|
|
return false;
|
|
|
|
// Not equal if different cumulative strings.
|
2015-03-30 23:42:36 +08:00
|
|
|
if (!CumulativeString.equals(Other.CumulativeString))
|
2014-08-30 08:20:14 +08:00
|
|
|
return false;
|
|
|
|
// Equal if all nodes in both stacks match.
|
|
|
|
for (unsigned i=0; i < Stack.size(); ++i) {
|
|
|
|
if (Stack[i].Start != Other.Stack[i].Start)
|
|
|
|
return false;
|
|
|
|
}
|
2015-09-22 19:19:03 +08:00
|
|
|
return true;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
2017-07-21 07:08:41 +08:00
|
|
|
uint64_t ExportEntry::readULEB128(const uint8_t *&Ptr, const char **error) {
|
2014-09-03 02:50:24 +08:00
|
|
|
unsigned Count;
|
2017-07-21 07:08:41 +08:00
|
|
|
uint64_t Result = decodeULEB128(Ptr, &Count, Trie.end(), error);
|
2014-09-03 02:50:24 +08:00
|
|
|
Ptr += Count;
|
2017-07-21 07:08:41 +08:00
|
|
|
if (Ptr > Trie.end())
|
2014-09-03 02:50:24 +08:00
|
|
|
Ptr = Trie.end();
|
|
|
|
return Result;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
StringRef ExportEntry::name() const {
|
2015-03-30 23:42:36 +08:00
|
|
|
return CumulativeString;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t ExportEntry::flags() const {
|
|
|
|
return Stack.back().Flags;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t ExportEntry::address() const {
|
|
|
|
return Stack.back().Address;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t ExportEntry::other() const {
|
|
|
|
return Stack.back().Other;
|
|
|
|
}
|
|
|
|
|
|
|
|
StringRef ExportEntry::otherName() const {
|
|
|
|
const char* ImportName = Stack.back().ImportName;
|
|
|
|
if (ImportName)
|
|
|
|
return StringRef(ImportName);
|
|
|
|
return StringRef();
|
|
|
|
}
|
|
|
|
|
|
|
|
uint32_t ExportEntry::nodeOffset() const {
|
|
|
|
return Stack.back().Start - Trie.begin();
|
|
|
|
}
|
|
|
|
|
2015-09-22 19:13:55 +08:00
|
|
|
ExportEntry::NodeState::NodeState(const uint8_t *Ptr)
|
2017-04-22 06:03:05 +08:00
|
|
|
: Start(Ptr), Current(Ptr) {}
|
2014-08-30 08:20:14 +08:00
|
|
|
|
|
|
|
void ExportEntry::pushNode(uint64_t offset) {
|
2017-07-21 07:08:41 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(E);
|
2014-08-30 08:20:14 +08:00
|
|
|
const uint8_t *Ptr = Trie.begin() + offset;
|
|
|
|
NodeState State(Ptr);
|
2017-07-21 07:08:41 +08:00
|
|
|
const char *error;
|
|
|
|
uint64_t ExportInfoSize = readULEB128(State.Current, &error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("export info size " + Twine(error) +
|
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
State.IsExportNode = (ExportInfoSize != 0);
|
|
|
|
const uint8_t* Children = State.Current + ExportInfoSize;
|
2017-07-21 07:08:41 +08:00
|
|
|
if (Children > Trie.end()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"export info size: 0x" + Twine::utohexstr(ExportInfoSize) +
|
|
|
|
" in export trie data at node: 0x" + Twine::utohexstr(offset) +
|
|
|
|
" too big and extends past end of trie data");
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
if (State.IsExportNode) {
|
2017-07-21 07:08:41 +08:00
|
|
|
const uint8_t *ExportStart = State.Current;
|
|
|
|
State.Flags = readULEB128(State.Current, &error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("flags " + Twine(error) +
|
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
uint64_t Kind = State.Flags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK;
|
|
|
|
if (State.Flags != 0 &&
|
|
|
|
(Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_REGULAR &&
|
|
|
|
Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_ABSOLUTE &&
|
|
|
|
Kind != MachO::EXPORT_SYMBOL_FLAGS_KIND_THREAD_LOCAL)) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"unsupported exported symbol kind: " + Twine((int)Kind) +
|
|
|
|
" in flags: 0x" + Twine::utohexstr(State.Flags) +
|
|
|
|
" in export trie data at node: 0x" + Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
if (State.Flags & MachO::EXPORT_SYMBOL_FLAGS_REEXPORT) {
|
|
|
|
State.Address = 0;
|
2017-07-21 07:08:41 +08:00
|
|
|
State.Other = readULEB128(State.Current, &error); // dylib ordinal
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("dylib ordinal of re-export " + Twine(error) +
|
2017-08-20 23:13:39 +08:00
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (O != nullptr) {
|
|
|
|
if (State.Other > O->getLibraryCount()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"bad library ordinal: " + Twine((int)State.Other) + " (max " +
|
|
|
|
Twine((int)O->getLibraryCount()) +
|
|
|
|
") in export trie data at node: 0x" + Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
State.ImportName = reinterpret_cast<const char*>(State.Current);
|
2017-07-21 07:08:41 +08:00
|
|
|
if (*State.ImportName == '\0') {
|
|
|
|
State.Current++;
|
|
|
|
} else {
|
|
|
|
const uint8_t *End = State.Current + 1;
|
|
|
|
if (End >= Trie.end()) {
|
|
|
|
*E = malformedError("import name of re-export in export trie data at "
|
2017-08-20 23:13:39 +08:00
|
|
|
"node: 0x" +
|
|
|
|
Twine::utohexstr(offset) +
|
|
|
|
" starts past end of trie data");
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
while(*End != '\0' && End < Trie.end())
|
|
|
|
End++;
|
|
|
|
if (*End != '\0') {
|
|
|
|
*E = malformedError("import name of re-export in export trie data at "
|
2017-08-20 23:13:39 +08:00
|
|
|
"node: 0x" +
|
|
|
|
Twine::utohexstr(offset) +
|
|
|
|
" extends past end of trie data");
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
State.Current = End + 1;
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
} else {
|
2017-07-21 07:08:41 +08:00
|
|
|
State.Address = readULEB128(State.Current, &error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("address " + Twine(error) +
|
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (State.Flags & MachO::EXPORT_SYMBOL_FLAGS_STUB_AND_RESOLVER) {
|
|
|
|
State.Other = readULEB128(State.Current, &error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("resolver of stub and resolver " + Twine(error) +
|
2017-08-20 23:13:39 +08:00
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
2017-07-21 07:08:41 +08:00
|
|
|
if(ExportStart + ExportInfoSize != State.Current) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"inconsistant export info size: 0x" +
|
|
|
|
Twine::utohexstr(ExportInfoSize) + " where actual size was: 0x" +
|
|
|
|
Twine::utohexstr(State.Current - ExportStart) +
|
|
|
|
" in export trie data at node: 0x" + Twine::utohexstr(offset));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2017-07-25 04:33:41 +08:00
|
|
|
State.ChildCount = *Children;
|
|
|
|
if (State.ChildCount != 0 && Children + 1 >= Trie.end()) {
|
2017-07-21 07:08:41 +08:00
|
|
|
*E = malformedError("byte for count of childern in export trie data at "
|
2017-08-20 23:13:39 +08:00
|
|
|
"node: 0x" +
|
|
|
|
Twine::utohexstr(offset) +
|
|
|
|
" extends past end of trie data");
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
State.Current = Children + 1;
|
|
|
|
State.NextChildIndex = 0;
|
|
|
|
State.ParentStringLength = CumulativeString.size();
|
|
|
|
Stack.push_back(State);
|
|
|
|
}
|
|
|
|
|
|
|
|
void ExportEntry::pushDownUntilBottom() {
|
2017-07-21 07:08:41 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(E);
|
|
|
|
const char *error;
|
2014-08-30 08:20:14 +08:00
|
|
|
while (Stack.back().NextChildIndex < Stack.back().ChildCount) {
|
|
|
|
NodeState &Top = Stack.back();
|
|
|
|
CumulativeString.resize(Top.ParentStringLength);
|
2017-07-21 07:08:41 +08:00
|
|
|
for (;*Top.Current != 0 && Top.Current < Trie.end(); Top.Current++) {
|
2014-09-03 02:50:24 +08:00
|
|
|
char C = *Top.Current;
|
|
|
|
CumulativeString.push_back(C);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
2017-07-21 07:08:41 +08:00
|
|
|
if (Top.Current >= Trie.end()) {
|
|
|
|
*E = malformedError("edge sub-string in export trie data at node: 0x" +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine::utohexstr(Top.Start - Trie.begin()) +
|
|
|
|
" for child #" + Twine((int)Top.NextChildIndex) +
|
|
|
|
" extends past end of trie data");
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
Top.Current += 1;
|
2017-07-21 07:08:41 +08:00
|
|
|
uint64_t childNodeIndex = readULEB128(Top.Current, &error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("child node offset " + Twine(error) +
|
2017-08-20 23:13:39 +08:00
|
|
|
" in export trie data at node: 0x" +
|
|
|
|
Twine::utohexstr(Top.Start - Trie.begin()));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
for (const NodeState &node : nodes()) {
|
|
|
|
if (node.Start == Trie.begin() + childNodeIndex){
|
|
|
|
*E = malformedError("loop in childern in export trie data at node: 0x" +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine::utohexstr(Top.Start - Trie.begin()) +
|
|
|
|
" back to node: 0x" +
|
|
|
|
Twine::utohexstr(childNodeIndex));
|
2017-07-21 07:08:41 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
Top.NextChildIndex += 1;
|
|
|
|
pushNode(childNodeIndex);
|
2017-07-21 07:08:41 +08:00
|
|
|
if (*E)
|
|
|
|
return;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
if (!Stack.back().IsExportNode) {
|
2017-07-21 07:08:41 +08:00
|
|
|
*E = malformedError("node is not an export node in export trie data at "
|
2017-08-20 23:13:39 +08:00
|
|
|
"node: 0x" +
|
|
|
|
Twine::utohexstr(Stack.back().Start - Trie.begin()));
|
2014-08-30 08:20:14 +08:00
|
|
|
moveToEnd();
|
2017-07-21 07:08:41 +08:00
|
|
|
return;
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// We have a trie data structure and need a way to walk it that is compatible
|
|
|
|
// with the C++ iterator model. The solution is a non-recursive depth first
|
|
|
|
// traversal where the iterator contains a stack of parent nodes along with a
|
|
|
|
// string that is the accumulation of all edge strings along the parent chain
|
|
|
|
// to this point.
|
|
|
|
//
|
2014-10-27 16:08:18 +08:00
|
|
|
// There is one "export" node for each exported symbol. But because some
|
2014-08-30 08:20:14 +08:00
|
|
|
// symbols may be a prefix of another symbol (e.g. _dup and _dup2), an export
|
2015-09-22 19:14:12 +08:00
|
|
|
// node may have child nodes too.
|
2014-08-30 08:20:14 +08:00
|
|
|
//
|
|
|
|
// The algorithm for moveNext() is to keep moving down the leftmost unvisited
|
|
|
|
// child until hitting a node with no children (which is an export node or
|
|
|
|
// else the trie is malformed). On the way down, each node is pushed on the
|
|
|
|
// stack ivar. If there is no more ways down, it pops up one and tries to go
|
|
|
|
// down a sibling path until a childless node is reached.
|
|
|
|
void ExportEntry::moveNext() {
|
2017-07-21 07:08:41 +08:00
|
|
|
assert(!Stack.empty() && "ExportEntry::moveNext() with empty node stack");
|
|
|
|
if (!Stack.back().IsExportNode) {
|
|
|
|
*E = malformedError("node is not an export node in export trie data at "
|
2017-08-20 23:13:39 +08:00
|
|
|
"node: 0x" +
|
|
|
|
Twine::utohexstr(Stack.back().Start - Trie.begin()));
|
2014-08-30 08:20:14 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
Stack.pop_back();
|
|
|
|
while (!Stack.empty()) {
|
|
|
|
NodeState &Top = Stack.back();
|
|
|
|
if (Top.NextChildIndex < Top.ChildCount) {
|
|
|
|
pushDownUntilBottom();
|
|
|
|
// Now at the next export node.
|
|
|
|
return;
|
|
|
|
} else {
|
|
|
|
if (Top.IsExportNode) {
|
|
|
|
// This node has no children but is itself an export node.
|
|
|
|
CumulativeString.resize(Top.ParentStringLength);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
Stack.pop_back();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Done = true;
|
|
|
|
}
|
|
|
|
|
2015-09-22 19:19:03 +08:00
|
|
|
iterator_range<export_iterator>
|
2017-07-21 07:08:41 +08:00
|
|
|
MachOObjectFile::exports(Error &E, ArrayRef<uint8_t> Trie,
|
|
|
|
const MachOObjectFile *O) {
|
|
|
|
ExportEntry Start(&E, O, Trie);
|
2017-04-22 06:03:05 +08:00
|
|
|
if (Trie.empty())
|
2014-12-19 10:31:01 +08:00
|
|
|
Start.moveToEnd();
|
|
|
|
else
|
|
|
|
Start.moveToFirst();
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2017-07-21 07:08:41 +08:00
|
|
|
ExportEntry Finish(&E, O, Trie);
|
2014-08-30 08:20:14 +08:00
|
|
|
Finish.moveToEnd();
|
|
|
|
|
2015-12-06 13:08:07 +08:00
|
|
|
return make_range(export_iterator(Start), export_iterator(Finish));
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
2017-07-29 08:30:45 +08:00
|
|
|
iterator_range<export_iterator> MachOObjectFile::exports(Error &Err) const {
|
|
|
|
return exports(Err, getDyldInfoExportsTrie(), this);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
MachORebaseEntry::MachORebaseEntry(Error *E, const MachOObjectFile *O,
|
|
|
|
ArrayRef<uint8_t> Bytes, bool is64Bit)
|
2017-04-22 06:03:05 +08:00
|
|
|
: E(E), O(O), Opcodes(Bytes), Ptr(Bytes.begin()),
|
|
|
|
PointerSize(is64Bit ? 8 : 4) {}
|
2014-09-13 05:34:15 +08:00
|
|
|
|
|
|
|
void MachORebaseEntry::moveToFirst() {
|
|
|
|
Ptr = Opcodes.begin();
|
|
|
|
moveNext();
|
|
|
|
}
|
|
|
|
|
|
|
|
void MachORebaseEntry::moveToEnd() {
|
|
|
|
Ptr = Opcodes.end();
|
|
|
|
RemainingLoopCount = 0;
|
|
|
|
Done = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void MachORebaseEntry::moveNext() {
|
2017-03-28 04:09:23 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(E);
|
2014-09-13 05:34:15 +08:00
|
|
|
// If in the middle of some loop, move to next rebasing in loop.
|
|
|
|
SegmentOffset += AdvanceAmount;
|
|
|
|
if (RemainingLoopCount) {
|
|
|
|
--RemainingLoopCount;
|
|
|
|
return;
|
|
|
|
}
|
2017-03-31 03:56:50 +08:00
|
|
|
// REBASE_OPCODE_DONE is only used for padding if we are not aligned to
|
|
|
|
// pointer size. Therefore it is possible to reach the end without ever having
|
|
|
|
// seen REBASE_OPCODE_DONE.
|
|
|
|
if (Ptr == Opcodes.end()) {
|
2014-09-13 05:34:15 +08:00
|
|
|
Done = true;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
bool More = true;
|
2017-03-28 04:09:23 +08:00
|
|
|
while (More) {
|
2014-09-13 05:34:15 +08:00
|
|
|
// Parse next opcode and set up next loop.
|
2017-03-28 04:09:23 +08:00
|
|
|
const uint8_t *OpcodeStart = Ptr;
|
2014-09-13 05:34:15 +08:00
|
|
|
uint8_t Byte = *Ptr++;
|
|
|
|
uint8_t ImmValue = Byte & MachO::REBASE_IMMEDIATE_MASK;
|
|
|
|
uint8_t Opcode = Byte & MachO::REBASE_OPCODE_MASK;
|
2017-03-28 04:09:23 +08:00
|
|
|
uint32_t Count, Skip;
|
|
|
|
const char *error = nullptr;
|
2014-09-13 05:34:15 +08:00
|
|
|
switch (Opcode) {
|
|
|
|
case MachO::REBASE_OPCODE_DONE:
|
|
|
|
More = false;
|
|
|
|
Done = true;
|
|
|
|
moveToEnd();
|
2017-04-22 06:03:05 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-rebase", dbgs() << "REBASE_OPCODE_DONE\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
break;
|
|
|
|
case MachO::REBASE_OPCODE_SET_TYPE_IMM:
|
|
|
|
RebaseType = ImmValue;
|
2017-03-28 04:09:23 +08:00
|
|
|
if (RebaseType > MachO::REBASE_TYPE_TEXT_PCREL32) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_SET_TYPE_IMM bad bind type: " +
|
|
|
|
Twine((int)RebaseType) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
|
|
|
moveToEnd();
|
|
|
|
return;
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_SET_TYPE_IMM: "
|
|
|
|
<< "RebaseType=" << (int) RebaseType << "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
break;
|
|
|
|
case MachO::REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB:
|
|
|
|
SegmentIndex = ImmValue;
|
2017-03-28 04:09:23 +08:00
|
|
|
SegmentOffset = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: "
|
|
|
|
<< "SegmentIndex=" << SegmentIndex << ", "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
break;
|
|
|
|
case MachO::REBASE_OPCODE_ADD_ADDR_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
SegmentOffset += readULEB128(&error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
|
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
|
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_ADD_ADDR_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X",
|
|
|
|
SegmentOffset) << "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
break;
|
|
|
|
case MachO::REBASE_OPCODE_ADD_ADDR_IMM_SCALED:
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_ADD_ADDR_IMM_SCALED " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
SegmentOffset += ImmValue * PointerSize;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E =
|
|
|
|
malformedError("for REBASE_OPCODE_ADD_ADDR_IMM_SCALED "
|
|
|
|
" (after adding immediate times the pointer size) " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_ADD_ADDR_IMM_SCALED: "
|
|
|
|
<< format("SegmentOffset=0x%06X",
|
|
|
|
SegmentOffset) << "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
break;
|
|
|
|
case MachO::REBASE_OPCODE_DO_REBASE_IMM_TIMES:
|
|
|
|
AdvanceAmount = PointerSize;
|
2017-03-28 04:09:23 +08:00
|
|
|
Skip = 0;
|
|
|
|
Count = ImmValue;
|
|
|
|
if (ImmValue != 0)
|
|
|
|
RemainingLoopCount = ImmValue - 1;
|
|
|
|
else
|
|
|
|
RemainingLoopCount = 0;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize, Count, Skip);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_IMM_TIMES " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
2017-08-28 14:47:47 +08:00
|
|
|
return;
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_DO_REBASE_IMM_TIMES: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
return;
|
|
|
|
case MachO::REBASE_OPCODE_DO_REBASE_ULEB_TIMES:
|
|
|
|
AdvanceAmount = PointerSize;
|
2017-03-28 04:09:23 +08:00
|
|
|
Skip = 0;
|
|
|
|
Count = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (Count != 0)
|
|
|
|
RemainingLoopCount = Count - 1;
|
|
|
|
else
|
|
|
|
RemainingLoopCount = 0;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize, Count, Skip);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
2017-08-28 14:47:47 +08:00
|
|
|
return;
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_DO_REBASE_ULEB_TIMES: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
return;
|
|
|
|
case MachO::REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
Skip = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
AdvanceAmount = Skip + PointerSize;
|
|
|
|
Count = 1;
|
2014-09-13 05:34:15 +08:00
|
|
|
RemainingLoopCount = 0;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize, Count, Skip);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
2017-08-28 14:47:47 +08:00
|
|
|
return;
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_DO_REBASE_ADD_ADDR_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
return;
|
|
|
|
case MachO::REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
Count = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
|
2017-08-20 23:13:39 +08:00
|
|
|
"ULEB " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (Count != 0)
|
|
|
|
RemainingLoopCount = Count - 1;
|
|
|
|
else
|
|
|
|
RemainingLoopCount = 0;
|
|
|
|
Skip = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
|
2017-08-20 23:13:39 +08:00
|
|
|
"ULEB " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
AdvanceAmount = Skip + PointerSize;
|
|
|
|
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->RebaseEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize, Count, Skip);
|
2017-03-28 04:09:23 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_"
|
2017-08-20 23:13:39 +08:00
|
|
|
"ULEB " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
2017-08-28 14:47:47 +08:00
|
|
|
return;
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2014-09-13 05:34:15 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-rebase",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "REBASE_OPCODE_DO_REBASE_ULEB_TIMES_SKIPPING_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-13 05:34:15 +08:00
|
|
|
return;
|
|
|
|
default:
|
2017-03-28 04:09:23 +08:00
|
|
|
*E = malformedError("bad rebase info (bad opcode value 0x" +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine::utohexstr(Opcode) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
2014-09-13 05:34:15 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-28 04:09:23 +08:00
|
|
|
uint64_t MachORebaseEntry::readULEB128(const char **error) {
|
2014-09-13 05:34:15 +08:00
|
|
|
unsigned Count;
|
2017-03-28 04:09:23 +08:00
|
|
|
uint64_t Result = decodeULEB128(Ptr, &Count, Opcodes.end(), error);
|
2014-09-13 05:34:15 +08:00
|
|
|
Ptr += Count;
|
2017-03-28 04:09:23 +08:00
|
|
|
if (Ptr > Opcodes.end())
|
2014-09-13 05:34:15 +08:00
|
|
|
Ptr = Opcodes.end();
|
|
|
|
return Result;
|
|
|
|
}
|
|
|
|
|
2017-03-28 04:09:23 +08:00
|
|
|
int32_t MachORebaseEntry::segmentIndex() const { return SegmentIndex; }
|
2014-09-13 05:34:15 +08:00
|
|
|
|
|
|
|
uint64_t MachORebaseEntry::segmentOffset() const { return SegmentOffset; }
|
|
|
|
|
|
|
|
StringRef MachORebaseEntry::typeName() const {
|
|
|
|
switch (RebaseType) {
|
|
|
|
case MachO::REBASE_TYPE_POINTER:
|
|
|
|
return "pointer";
|
|
|
|
case MachO::REBASE_TYPE_TEXT_ABSOLUTE32:
|
|
|
|
return "text abs32";
|
|
|
|
case MachO::REBASE_TYPE_TEXT_PCREL32:
|
|
|
|
return "text rel32";
|
|
|
|
}
|
|
|
|
return "unknown";
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
// For use with the SegIndex of a checked Mach-O Rebase entry
|
|
|
|
// to get the segment name.
|
|
|
|
StringRef MachORebaseEntry::segmentName() const {
|
|
|
|
return O->BindRebaseSegmentName(SegmentIndex);
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Rebase entry
|
|
|
|
// to get the section name.
|
|
|
|
StringRef MachORebaseEntry::sectionName() const {
|
|
|
|
return O->BindRebaseSectionName(SegmentIndex, SegmentOffset);
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Rebase entry
|
|
|
|
// to get the address.
|
|
|
|
uint64_t MachORebaseEntry::address() const {
|
|
|
|
return O->BindRebaseAddress(SegmentIndex, SegmentOffset);
|
|
|
|
}
|
|
|
|
|
2014-09-13 05:34:15 +08:00
|
|
|
bool MachORebaseEntry::operator==(const MachORebaseEntry &Other) const {
|
2017-01-09 03:14:15 +08:00
|
|
|
#ifdef EXPENSIVE_CHECKS
|
2014-09-13 05:34:15 +08:00
|
|
|
assert(Opcodes == Other.Opcodes && "compare iterators of different files");
|
2017-01-09 03:14:15 +08:00
|
|
|
#else
|
|
|
|
assert(Opcodes.data() == Other.Opcodes.data() && "compare iterators of different files");
|
|
|
|
#endif
|
2014-09-13 05:34:15 +08:00
|
|
|
return (Ptr == Other.Ptr) &&
|
|
|
|
(RemainingLoopCount == Other.RemainingLoopCount) &&
|
|
|
|
(Done == Other.Done);
|
|
|
|
}
|
|
|
|
|
|
|
|
iterator_range<rebase_iterator>
|
2017-03-21 03:46:55 +08:00
|
|
|
MachOObjectFile::rebaseTable(Error &Err, MachOObjectFile *O,
|
|
|
|
ArrayRef<uint8_t> Opcodes, bool is64) {
|
|
|
|
if (O->BindRebaseSectionTable == nullptr)
|
|
|
|
O->BindRebaseSectionTable = llvm::make_unique<BindRebaseSegInfo>(O);
|
|
|
|
MachORebaseEntry Start(&Err, O, Opcodes, is64);
|
2014-09-13 05:34:15 +08:00
|
|
|
Start.moveToFirst();
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
MachORebaseEntry Finish(&Err, O, Opcodes, is64);
|
2014-09-13 05:34:15 +08:00
|
|
|
Finish.moveToEnd();
|
|
|
|
|
2015-12-06 13:08:07 +08:00
|
|
|
return make_range(rebase_iterator(Start), rebase_iterator(Finish));
|
2014-09-13 05:34:15 +08:00
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
iterator_range<rebase_iterator> MachOObjectFile::rebaseTable(Error &Err) {
|
|
|
|
return rebaseTable(Err, this, getDyldInfoRebaseOpcodes(), is64Bit());
|
2014-09-13 05:34:15 +08:00
|
|
|
}
|
|
|
|
|
2017-03-01 05:47:07 +08:00
|
|
|
MachOBindEntry::MachOBindEntry(Error *E, const MachOObjectFile *O,
|
|
|
|
ArrayRef<uint8_t> Bytes, bool is64Bit, Kind BK)
|
2017-04-22 06:03:05 +08:00
|
|
|
: E(E), O(O), Opcodes(Bytes), Ptr(Bytes.begin()),
|
|
|
|
PointerSize(is64Bit ? 8 : 4), TableKind(BK) {}
|
2014-09-16 09:41:51 +08:00
|
|
|
|
|
|
|
void MachOBindEntry::moveToFirst() {
|
|
|
|
Ptr = Opcodes.begin();
|
|
|
|
moveNext();
|
|
|
|
}
|
|
|
|
|
|
|
|
void MachOBindEntry::moveToEnd() {
|
|
|
|
Ptr = Opcodes.end();
|
|
|
|
RemainingLoopCount = 0;
|
|
|
|
Done = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void MachOBindEntry::moveNext() {
|
2017-03-01 05:47:07 +08:00
|
|
|
ErrorAsOutParameter ErrAsOutParam(E);
|
2014-09-16 09:41:51 +08:00
|
|
|
// If in the middle of some loop, move to next binding in loop.
|
|
|
|
SegmentOffset += AdvanceAmount;
|
|
|
|
if (RemainingLoopCount) {
|
|
|
|
--RemainingLoopCount;
|
|
|
|
return;
|
|
|
|
}
|
2017-03-31 03:56:50 +08:00
|
|
|
// BIND_OPCODE_DONE is only used for padding if we are not aligned to
|
|
|
|
// pointer size. Therefore it is possible to reach the end without ever having
|
|
|
|
// seen BIND_OPCODE_DONE.
|
|
|
|
if (Ptr == Opcodes.end()) {
|
2014-09-16 09:41:51 +08:00
|
|
|
Done = true;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
bool More = true;
|
2017-03-28 04:09:23 +08:00
|
|
|
while (More) {
|
2014-09-16 09:41:51 +08:00
|
|
|
// Parse next opcode and set up next loop.
|
2017-03-01 05:47:07 +08:00
|
|
|
const uint8_t *OpcodeStart = Ptr;
|
2014-09-16 09:41:51 +08:00
|
|
|
uint8_t Byte = *Ptr++;
|
|
|
|
uint8_t ImmValue = Byte & MachO::BIND_IMMEDIATE_MASK;
|
|
|
|
uint8_t Opcode = Byte & MachO::BIND_OPCODE_MASK;
|
|
|
|
int8_t SignExtended;
|
|
|
|
const uint8_t *SymStart;
|
2017-03-21 03:46:55 +08:00
|
|
|
uint32_t Count, Skip;
|
|
|
|
const char *error = nullptr;
|
2014-09-16 09:41:51 +08:00
|
|
|
switch (Opcode) {
|
|
|
|
case MachO::BIND_OPCODE_DONE:
|
|
|
|
if (TableKind == Kind::Lazy) {
|
|
|
|
// Lazying bindings have a DONE opcode between entries. Need to ignore
|
|
|
|
// it to advance to next entry. But need not if this is last entry.
|
|
|
|
bool NotLastEntry = false;
|
|
|
|
for (const uint8_t *P = Ptr; P < Opcodes.end(); ++P) {
|
|
|
|
if (*P) {
|
|
|
|
NotLastEntry = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (NotLastEntry)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
More = false;
|
|
|
|
moveToEnd();
|
2017-04-22 06:03:05 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-bind", dbgs() << "BIND_OPCODE_DONE\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_DYLIB_ORDINAL_IMM:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Weak) {
|
|
|
|
*E = malformedError("BIND_OPCODE_SET_DYLIB_ORDINAL_IMM not allowed in "
|
2017-08-20 23:13:39 +08:00
|
|
|
"weak bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
Ordinal = ImmValue;
|
2017-03-21 03:46:55 +08:00
|
|
|
LibraryOrdinalSet = true;
|
2017-03-01 05:47:07 +08:00
|
|
|
if (ImmValue > O->getLibraryCount()) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB bad "
|
2017-08-20 23:13:39 +08:00
|
|
|
"library ordinal: " +
|
|
|
|
Twine((int)ImmValue) + " (max " +
|
|
|
|
Twine((int)O->getLibraryCount()) +
|
|
|
|
") for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-01 05:47:07 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_DYLIB_ORDINAL_IMM: "
|
|
|
|
<< "Ordinal=" << Ordinal << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Weak) {
|
|
|
|
*E = malformedError("BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB not allowed in "
|
2017-08-20 23:13:39 +08:00
|
|
|
"weak bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2017-03-21 03:46:55 +08:00
|
|
|
Ordinal = readULEB128(&error);
|
|
|
|
LibraryOrdinalSet = true;
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (Ordinal > (int)O->getLibraryCount()) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB bad "
|
2017-08-20 23:13:39 +08:00
|
|
|
"library ordinal: " +
|
|
|
|
Twine((int)Ordinal) + " (max " +
|
|
|
|
Twine((int)O->getLibraryCount()) +
|
|
|
|
") for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_DYLIB_ORDINAL_ULEB: "
|
|
|
|
<< "Ordinal=" << Ordinal << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_DYLIB_SPECIAL_IMM:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Weak) {
|
|
|
|
*E = malformedError("BIND_OPCODE_SET_DYLIB_SPECIAL_IMM not allowed in "
|
2017-08-20 23:13:39 +08:00
|
|
|
"weak bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
if (ImmValue) {
|
|
|
|
SignExtended = MachO::BIND_OPCODE_MASK | ImmValue;
|
|
|
|
Ordinal = SignExtended;
|
2017-03-21 03:46:55 +08:00
|
|
|
if (Ordinal < MachO::BIND_SPECIAL_DYLIB_FLAT_LOOKUP) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_DYLIB_SPECIAL_IMM unknown "
|
2017-08-20 23:13:39 +08:00
|
|
|
"special ordinal: " +
|
|
|
|
Twine((int)Ordinal) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
} else
|
|
|
|
Ordinal = 0;
|
2017-06-01 06:17:43 +08:00
|
|
|
LibraryOrdinalSet = true;
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_DYLIB_SPECIAL_IMM: "
|
|
|
|
<< "Ordinal=" << Ordinal << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM:
|
|
|
|
Flags = ImmValue;
|
|
|
|
SymStart = Ptr;
|
2017-03-21 03:46:55 +08:00
|
|
|
while (*Ptr && (Ptr < Opcodes.end())) {
|
2014-09-16 09:41:51 +08:00
|
|
|
++Ptr;
|
|
|
|
}
|
2017-03-21 03:46:55 +08:00
|
|
|
if (Ptr == Opcodes.end()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM "
|
|
|
|
"symbol name extends past opcodes for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
|
|
|
moveToEnd();
|
|
|
|
return;
|
2017-03-21 03:46:55 +08:00
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
SymbolName = StringRef(reinterpret_cast<const char*>(SymStart),
|
|
|
|
Ptr-SymStart);
|
2014-09-17 09:51:43 +08:00
|
|
|
++Ptr;
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM: "
|
|
|
|
<< "SymbolName=" << SymbolName << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
if (TableKind == Kind::Weak) {
|
|
|
|
if (ImmValue & MachO::BIND_SYMBOL_FLAGS_NON_WEAK_DEFINITION)
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_TYPE_IMM:
|
|
|
|
BindType = ImmValue;
|
2017-03-21 03:46:55 +08:00
|
|
|
if (ImmValue > MachO::BIND_TYPE_TEXT_PCREL32) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for BIND_OPCODE_SET_TYPE_IMM bad bind type: " +
|
|
|
|
Twine((int)ImmValue) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
|
|
|
moveToEnd();
|
|
|
|
return;
|
2017-03-21 03:46:55 +08:00
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_TYPE_IMM: "
|
|
|
|
<< "BindType=" << (int)BindType << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_ADDEND_SLEB:
|
2017-03-21 03:46:55 +08:00
|
|
|
Addend = readSLEB128(&error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for BIND_OPCODE_SET_ADDEND_SLEB " + Twine(error) +
|
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_ADDEND_SLEB: "
|
|
|
|
<< "Addend=" << Addend << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB:
|
|
|
|
SegmentIndex = ImmValue;
|
2017-03-21 03:46:55 +08:00
|
|
|
SegmentOffset = readULEB128(&error);
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB: "
|
|
|
|
<< "SegmentIndex=" << SegmentIndex << ", "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_ADD_ADDR_ULEB:
|
2017-03-21 03:46:55 +08:00
|
|
|
SegmentOffset += readULEB128(&error);
|
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
|
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB " + Twine(error) +
|
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_ADD_ADDR_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X",
|
|
|
|
SegmentOffset) << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
break;
|
|
|
|
case MachO::BIND_OPCODE_DO_BIND:
|
|
|
|
AdvanceAmount = PointerSize;
|
|
|
|
RemainingLoopCount = 0;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND " + Twine(error) +
|
2017-08-20 23:13:39 +08:00
|
|
|
" for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (SymbolName == StringRef()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND missing preceding "
|
|
|
|
"BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E =
|
|
|
|
malformedError("for BIND_OPCODE_DO_BIND missing preceding "
|
|
|
|
"BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_DO_BIND: "
|
|
|
|
<< format("SegmentOffset=0x%06X",
|
|
|
|
SegmentOffset) << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
return;
|
|
|
|
case MachO::BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Lazy) {
|
|
|
|
*E = malformedError("BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB not allowed in "
|
2017-08-20 23:13:39 +08:00
|
|
|
"lazy bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (SymbolName == StringRef()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB missing "
|
|
|
|
"preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for opcode "
|
|
|
|
"at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB missing "
|
|
|
|
"preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
AdvanceAmount = readULEB128(&error) + PointerSize;
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
// Note, this is not really an error until the next bind but make no sense
|
|
|
|
// for a BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB to not be followed by another
|
|
|
|
// bind operation.
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset +
|
|
|
|
AdvanceAmount, PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_ADD_ADDR_ULEB (after adding "
|
2017-08-20 23:13:39 +08:00
|
|
|
"ULEB) " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
RemainingLoopCount = 0;
|
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_DO_BIND_ADD_ADDR_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
return;
|
|
|
|
case MachO::BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Lazy) {
|
|
|
|
*E = malformedError("BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED not "
|
2017-08-20 23:13:39 +08:00
|
|
|
"allowed in lazy bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED " +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (SymbolName == StringRef()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
|
|
|
|
"missing preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for "
|
|
|
|
"opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
|
|
|
|
"missing preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode "
|
|
|
|
"at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-10-18 09:21:02 +08:00
|
|
|
AdvanceAmount = ImmValue * PointerSize + PointerSize;
|
2014-09-16 09:41:51 +08:00
|
|
|
RemainingLoopCount = 0;
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset +
|
|
|
|
AdvanceAmount, PointerSize);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E =
|
|
|
|
malformedError("for BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED "
|
|
|
|
" (after adding immediate times the pointer size) " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE("mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs()
|
2014-09-16 09:41:51 +08:00
|
|
|
<< "BIND_OPCODE_DO_BIND_ADD_ADDR_IMM_SCALED: "
|
2017-04-22 06:03:05 +08:00
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset) << "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
return;
|
|
|
|
case MachO::BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB:
|
2017-03-28 04:09:23 +08:00
|
|
|
if (TableKind == Kind::Lazy) {
|
|
|
|
*E = malformedError("BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB not "
|
2017-08-20 23:13:39 +08:00
|
|
|
"allowed in lazy bind table for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-28 04:09:23 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
2017-03-21 03:46:55 +08:00
|
|
|
Count = readULEB128(&error);
|
|
|
|
if (Count != 0)
|
|
|
|
RemainingLoopCount = Count - 1;
|
|
|
|
else
|
|
|
|
RemainingLoopCount = 0;
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
|
2017-08-20 23:13:39 +08:00
|
|
|
" (count value) " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
Skip = readULEB128(&error);
|
|
|
|
AdvanceAmount = Skip + PointerSize;
|
|
|
|
if (error) {
|
|
|
|
*E = malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
|
2017-08-20 23:13:39 +08:00
|
|
|
" (skip value) " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (SymbolName == StringRef()) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
|
|
|
|
"missing preceding BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM for "
|
|
|
|
"opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (!LibraryOrdinalSet && TableKind != Kind::Weak) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E = malformedError(
|
|
|
|
"for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB "
|
|
|
|
"missing preceding BIND_OPCODE_SET_DYLIB_ORDINAL_* for opcode "
|
|
|
|
"at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
|
|
|
}
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
error = O->BindEntryCheckSegAndOffsets(SegmentIndex, SegmentOffset,
|
|
|
|
PointerSize, Count, Skip);
|
2017-03-21 03:46:55 +08:00
|
|
|
if (error) {
|
2017-08-20 23:13:39 +08:00
|
|
|
*E =
|
|
|
|
malformedError("for BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB " +
|
|
|
|
Twine(error) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
2017-08-28 14:47:47 +08:00
|
|
|
return;
|
2017-03-21 03:46:55 +08:00
|
|
|
}
|
2014-09-16 09:41:51 +08:00
|
|
|
DEBUG_WITH_TYPE(
|
|
|
|
"mach-o-bind",
|
2017-04-22 06:03:05 +08:00
|
|
|
dbgs() << "BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB: "
|
|
|
|
<< format("SegmentOffset=0x%06X", SegmentOffset)
|
|
|
|
<< ", AdvanceAmount=" << AdvanceAmount
|
|
|
|
<< ", RemainingLoopCount=" << RemainingLoopCount
|
|
|
|
<< "\n");
|
2014-09-16 09:41:51 +08:00
|
|
|
return;
|
|
|
|
default:
|
2017-03-21 03:46:55 +08:00
|
|
|
*E = malformedError("bad bind info (bad opcode value 0x" +
|
2017-08-20 23:13:39 +08:00
|
|
|
Twine::utohexstr(Opcode) + " for opcode at: 0x" +
|
|
|
|
Twine::utohexstr(OpcodeStart - Opcodes.begin()));
|
2017-03-21 03:46:55 +08:00
|
|
|
moveToEnd();
|
|
|
|
return;
|
2014-09-16 09:41:51 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
uint64_t MachOBindEntry::readULEB128(const char **error) {
|
2014-09-16 09:41:51 +08:00
|
|
|
unsigned Count;
|
2017-03-21 03:46:55 +08:00
|
|
|
uint64_t Result = decodeULEB128(Ptr, &Count, Opcodes.end(), error);
|
2014-09-16 09:41:51 +08:00
|
|
|
Ptr += Count;
|
2017-03-28 04:09:23 +08:00
|
|
|
if (Ptr > Opcodes.end())
|
2014-09-16 09:41:51 +08:00
|
|
|
Ptr = Opcodes.end();
|
|
|
|
return Result;
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
int64_t MachOBindEntry::readSLEB128(const char **error) {
|
2014-09-16 09:41:51 +08:00
|
|
|
unsigned Count;
|
2017-03-21 03:46:55 +08:00
|
|
|
int64_t Result = decodeSLEB128(Ptr, &Count, Opcodes.end(), error);
|
2014-09-16 09:41:51 +08:00
|
|
|
Ptr += Count;
|
2017-03-28 04:09:23 +08:00
|
|
|
if (Ptr > Opcodes.end())
|
2014-09-16 09:41:51 +08:00
|
|
|
Ptr = Opcodes.end();
|
|
|
|
return Result;
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
int32_t MachOBindEntry::segmentIndex() const { return SegmentIndex; }
|
2014-09-16 09:41:51 +08:00
|
|
|
|
|
|
|
uint64_t MachOBindEntry::segmentOffset() const { return SegmentOffset; }
|
|
|
|
|
|
|
|
StringRef MachOBindEntry::typeName() const {
|
|
|
|
switch (BindType) {
|
|
|
|
case MachO::BIND_TYPE_POINTER:
|
|
|
|
return "pointer";
|
|
|
|
case MachO::BIND_TYPE_TEXT_ABSOLUTE32:
|
|
|
|
return "text abs32";
|
|
|
|
case MachO::BIND_TYPE_TEXT_PCREL32:
|
|
|
|
return "text rel32";
|
|
|
|
}
|
|
|
|
return "unknown";
|
|
|
|
}
|
|
|
|
|
|
|
|
StringRef MachOBindEntry::symbolName() const { return SymbolName; }
|
|
|
|
|
|
|
|
int64_t MachOBindEntry::addend() const { return Addend; }
|
|
|
|
|
|
|
|
uint32_t MachOBindEntry::flags() const { return Flags; }
|
|
|
|
|
|
|
|
int MachOBindEntry::ordinal() const { return Ordinal; }
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
// For use with the SegIndex of a checked Mach-O Bind entry
|
|
|
|
// to get the segment name.
|
|
|
|
StringRef MachOBindEntry::segmentName() const {
|
|
|
|
return O->BindRebaseSegmentName(SegmentIndex);
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind entry
|
|
|
|
// to get the section name.
|
|
|
|
StringRef MachOBindEntry::sectionName() const {
|
|
|
|
return O->BindRebaseSectionName(SegmentIndex, SegmentOffset);
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind entry
|
|
|
|
// to get the address.
|
|
|
|
uint64_t MachOBindEntry::address() const {
|
|
|
|
return O->BindRebaseAddress(SegmentIndex, SegmentOffset);
|
|
|
|
}
|
|
|
|
|
2014-09-16 09:41:51 +08:00
|
|
|
bool MachOBindEntry::operator==(const MachOBindEntry &Other) const {
|
2017-01-09 03:14:15 +08:00
|
|
|
#ifdef EXPENSIVE_CHECKS
|
2014-09-16 09:41:51 +08:00
|
|
|
assert(Opcodes == Other.Opcodes && "compare iterators of different files");
|
2017-01-09 03:14:15 +08:00
|
|
|
#else
|
|
|
|
assert(Opcodes.data() == Other.Opcodes.data() && "compare iterators of different files");
|
|
|
|
#endif
|
2014-09-16 09:41:51 +08:00
|
|
|
return (Ptr == Other.Ptr) &&
|
|
|
|
(RemainingLoopCount == Other.RemainingLoopCount) &&
|
|
|
|
(Done == Other.Done);
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
// Build table of sections so SegIndex/SegOffset pairs can be translated.
|
|
|
|
BindRebaseSegInfo::BindRebaseSegInfo(const object::MachOObjectFile *Obj) {
|
|
|
|
uint32_t CurSegIndex = Obj->hasPageZeroSegment() ? 1 : 0;
|
|
|
|
StringRef CurSegName;
|
|
|
|
uint64_t CurSegAddress;
|
|
|
|
for (const SectionRef &Section : Obj->sections()) {
|
|
|
|
SectionInfo Info;
|
2019-08-14 16:56:55 +08:00
|
|
|
Section.getName(Info.SectionName);
|
2017-03-21 03:46:55 +08:00
|
|
|
Info.Address = Section.getAddress();
|
|
|
|
Info.Size = Section.getSize();
|
|
|
|
Info.SegmentName =
|
|
|
|
Obj->getSectionFinalSegmentName(Section.getRawDataRefImpl());
|
|
|
|
if (!Info.SegmentName.equals(CurSegName)) {
|
|
|
|
++CurSegIndex;
|
|
|
|
CurSegName = Info.SegmentName;
|
|
|
|
CurSegAddress = Info.Address;
|
|
|
|
}
|
|
|
|
Info.SegmentIndex = CurSegIndex - 1;
|
|
|
|
Info.OffsetInSegment = Info.Address - CurSegAddress;
|
|
|
|
Info.SegmentStartAddress = CurSegAddress;
|
|
|
|
Sections.push_back(Info);
|
|
|
|
}
|
|
|
|
MaxSegIndex = CurSegIndex;
|
|
|
|
}
|
|
|
|
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
// For use with a SegIndex, SegOffset, and PointerSize triple in
|
|
|
|
// MachOBindEntry::moveNext() to validate a MachOBindEntry or MachORebaseEntry.
|
|
|
|
//
|
|
|
|
// Given a SegIndex, SegOffset, and PointerSize, verify a valid section exists
|
|
|
|
// that fully contains a pointer at that location. Multiple fixups in a bind
|
|
|
|
// (such as with the BIND_OPCODE_DO_BIND_ULEB_TIMES_SKIPPING_ULEB opcode) can
|
|
|
|
// be tested via the Count and Skip parameters.
|
|
|
|
const char * BindRebaseSegInfo::checkSegAndOffsets(int32_t SegIndex,
|
|
|
|
uint64_t SegOffset,
|
|
|
|
uint8_t PointerSize,
|
|
|
|
uint32_t Count,
|
|
|
|
uint32_t Skip) {
|
2017-03-21 03:46:55 +08:00
|
|
|
if (SegIndex == -1)
|
2017-03-28 04:09:23 +08:00
|
|
|
return "missing preceding *_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB";
|
2017-03-21 03:46:55 +08:00
|
|
|
if (SegIndex >= MaxSegIndex)
|
|
|
|
return "bad segIndex (too large)";
|
Fix Mach-O bind and rebase validation errors in libObject
Summary:
llvm-objdump (via libObject) validates DYLD_INFO rebase and bind
entries against the basic structure found in the Mach-O file before
evaluating the contents of those entries. Certain malformed Mach-Os can
defeat the validation check and force llvm-objdump (libObject) to crash.
The previous logic verified a rebase or bind started in a valid Mach-O
section, but did not verify that the section wholely contained the
fixup. It also generally allows rebases or binds to start immediately
after a valid section even if that range is not itself part of a valid
section. Finally, bind and rebase opcodes that indicate more than one
fixup (apply N times...) are not completely validated: only the first
and final fixups are checked.
The previous logic also rejected certain binaries as false positives.
Some bind and rebase opcodes can modify the state machine such that the
next bind or rebase will fail. libObject will reject these opcodes as
invalid in order to be helpful and print an error message associated
with the instruction that caused the problem, even though the binary is
not actually illegal until it consumes the invalid state in the state
machine. In other words, libObject may reject a Mach-O binary that
Apple's dynamic linker may consider legal. The original version of
macho-rebase-add-addr-uleb-too-big is an example of such a binary.
I have replaced the existing checkSegAndOffset and checkCountAndSkip
functions with a single function, checkSegAndOffsets, which validates
all of the fixups realized by a DYLD_INFO opcode. checkSegAndOffsets
verifies that a Mach-O section fully contains each fixup. Every fixup
realized by an opcode is validated, and some (but not all!)
inconsistencies in the state machine are allowed until a fixup is
realized. This means that libObject may fail on an opcode that realizes
a fixup, not on the opcode that introduced the arithmetic error.
Existing test cases have been modified to reflect the changes in error
messages returned by libObject. What's more, the test case for
macho-rebase-add-addr-uleb-too-big has been modified so that it actually
triggers the error condition; the new code in libObject considers the
original test binary "legal".
rdar://47797757
Reviewers: lhames, pete, ab
Reviewed By: pete
Subscribers: rupprecht, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59574
llvm-svn: 356629
2019-03-21 07:21:16 +08:00
|
|
|
for (uint32_t i = 0; i < Count; ++i) {
|
|
|
|
uint32_t Start = SegOffset + i * (PointerSize + Skip);
|
|
|
|
uint32_t End = Start + PointerSize;
|
|
|
|
bool Found = false;
|
|
|
|
for (const SectionInfo &SI : Sections) {
|
|
|
|
if (SI.SegmentIndex != SegIndex)
|
|
|
|
continue;
|
|
|
|
if ((SI.OffsetInSegment<=Start) && (Start<(SI.OffsetInSegment+SI.Size))) {
|
|
|
|
if (End <= SI.OffsetInSegment + SI.Size) {
|
|
|
|
Found = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
return "bad offset, extends beyond section boundary";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!Found)
|
|
|
|
return "bad offset, not in section";
|
2017-03-28 04:09:23 +08:00
|
|
|
}
|
2017-03-21 03:46:55 +08:00
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with the SegIndex of a checked Mach-O Bind or Rebase entry
|
|
|
|
// to get the segment name.
|
|
|
|
StringRef BindRebaseSegInfo::segmentName(int32_t SegIndex) {
|
|
|
|
for (const SectionInfo &SI : Sections) {
|
|
|
|
if (SI.SegmentIndex == SegIndex)
|
|
|
|
return SI.SegmentName;
|
|
|
|
}
|
|
|
|
llvm_unreachable("invalid SegIndex");
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
|
|
|
|
// to get the SectionInfo.
|
|
|
|
const BindRebaseSegInfo::SectionInfo &BindRebaseSegInfo::findSection(
|
|
|
|
int32_t SegIndex, uint64_t SegOffset) {
|
|
|
|
for (const SectionInfo &SI : Sections) {
|
|
|
|
if (SI.SegmentIndex != SegIndex)
|
|
|
|
continue;
|
|
|
|
if (SI.OffsetInSegment > SegOffset)
|
|
|
|
continue;
|
|
|
|
if (SegOffset >= (SI.OffsetInSegment + SI.Size))
|
|
|
|
continue;
|
|
|
|
return SI;
|
|
|
|
}
|
|
|
|
llvm_unreachable("SegIndex and SegOffset not in any section");
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
|
|
|
|
// entry to get the section name.
|
|
|
|
StringRef BindRebaseSegInfo::sectionName(int32_t SegIndex,
|
|
|
|
uint64_t SegOffset) {
|
|
|
|
return findSection(SegIndex, SegOffset).SectionName;
|
|
|
|
}
|
|
|
|
|
|
|
|
// For use with a SegIndex,SegOffset pair from a checked Mach-O Bind or Rebase
|
|
|
|
// entry to get the address.
|
|
|
|
uint64_t BindRebaseSegInfo::address(uint32_t SegIndex, uint64_t OffsetInSeg) {
|
|
|
|
const SectionInfo &SI = findSection(SegIndex, OffsetInSeg);
|
|
|
|
return SI.SegmentStartAddress + OffsetInSeg;
|
|
|
|
}
|
|
|
|
|
2014-09-16 09:41:51 +08:00
|
|
|
iterator_range<bind_iterator>
|
2017-03-21 03:46:55 +08:00
|
|
|
MachOObjectFile::bindTable(Error &Err, MachOObjectFile *O,
|
2017-03-01 05:47:07 +08:00
|
|
|
ArrayRef<uint8_t> Opcodes, bool is64,
|
2014-09-16 09:41:51 +08:00
|
|
|
MachOBindEntry::Kind BKind) {
|
2017-03-21 03:46:55 +08:00
|
|
|
if (O->BindRebaseSectionTable == nullptr)
|
|
|
|
O->BindRebaseSectionTable = llvm::make_unique<BindRebaseSegInfo>(O);
|
2017-03-01 05:47:07 +08:00
|
|
|
MachOBindEntry Start(&Err, O, Opcodes, is64, BKind);
|
2014-09-16 09:41:51 +08:00
|
|
|
Start.moveToFirst();
|
|
|
|
|
2017-03-01 05:47:07 +08:00
|
|
|
MachOBindEntry Finish(&Err, O, Opcodes, is64, BKind);
|
2014-09-16 09:41:51 +08:00
|
|
|
Finish.moveToEnd();
|
|
|
|
|
2015-12-06 13:08:07 +08:00
|
|
|
return make_range(bind_iterator(Start), bind_iterator(Finish));
|
2014-09-16 09:41:51 +08:00
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
iterator_range<bind_iterator> MachOObjectFile::bindTable(Error &Err) {
|
2017-03-01 05:47:07 +08:00
|
|
|
return bindTable(Err, this, getDyldInfoBindOpcodes(), is64Bit(),
|
2014-09-16 09:41:51 +08:00
|
|
|
MachOBindEntry::Kind::Regular);
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
iterator_range<bind_iterator> MachOObjectFile::lazyBindTable(Error &Err) {
|
2017-03-01 05:47:07 +08:00
|
|
|
return bindTable(Err, this, getDyldInfoLazyBindOpcodes(), is64Bit(),
|
2014-09-16 09:41:51 +08:00
|
|
|
MachOBindEntry::Kind::Lazy);
|
|
|
|
}
|
|
|
|
|
2017-03-21 03:46:55 +08:00
|
|
|
iterator_range<bind_iterator> MachOObjectFile::weakBindTable(Error &Err) {
|
2017-03-01 05:47:07 +08:00
|
|
|
return bindTable(Err, this, getDyldInfoWeakBindOpcodes(), is64Bit(),
|
2014-09-16 09:41:51 +08:00
|
|
|
MachOBindEntry::Kind::Weak);
|
|
|
|
}
|
|
|
|
|
2015-06-04 06:19:36 +08:00
|
|
|
MachOObjectFile::load_command_iterator
|
|
|
|
MachOObjectFile::begin_load_commands() const {
|
|
|
|
return LoadCommands.begin();
|
|
|
|
}
|
|
|
|
|
|
|
|
MachOObjectFile::load_command_iterator
|
|
|
|
MachOObjectFile::end_load_commands() const {
|
|
|
|
return LoadCommands.end();
|
|
|
|
}
|
|
|
|
|
|
|
|
iterator_range<MachOObjectFile::load_command_iterator>
|
|
|
|
MachOObjectFile::load_commands() const {
|
2015-12-06 13:08:07 +08:00
|
|
|
return make_range(begin_load_commands(), end_load_commands());
|
2015-06-04 06:19:36 +08:00
|
|
|
}
|
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
StringRef
|
|
|
|
MachOObjectFile::getSectionFinalSegmentName(DataRefImpl Sec) const {
|
|
|
|
ArrayRef<char> Raw = getSectionRawFinalSegmentName(Sec);
|
|
|
|
return parseSegmentOrSectionName(Raw.data());
|
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<char>
|
|
|
|
MachOObjectFile::getSectionRawName(DataRefImpl Sec) const {
|
2015-05-22 22:59:27 +08:00
|
|
|
assert(Sec.d.a < Sections.size() && "Should have detected this earlier");
|
2013-09-01 12:28:48 +08:00
|
|
|
const section_base *Base =
|
|
|
|
reinterpret_cast<const section_base *>(Sections[Sec.d.a]);
|
2014-08-27 13:25:25 +08:00
|
|
|
return makeArrayRef(Base->sectname);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<char>
|
|
|
|
MachOObjectFile::getSectionRawFinalSegmentName(DataRefImpl Sec) const {
|
2015-05-22 22:59:27 +08:00
|
|
|
assert(Sec.d.a < Sections.size() && "Should have detected this earlier");
|
2013-09-01 12:28:48 +08:00
|
|
|
const section_base *Base =
|
|
|
|
reinterpret_cast<const section_base *>(Sections[Sec.d.a]);
|
2014-08-27 13:25:25 +08:00
|
|
|
return makeArrayRef(Base->segname);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bool
|
2013-09-01 12:28:48 +08:00
|
|
|
MachOObjectFile::isRelocationScattered(const MachO::any_relocation_info &RE)
|
2013-04-19 02:08:55 +08:00
|
|
|
const {
|
2016-12-04 09:56:10 +08:00
|
|
|
if (getCPUType(*this) == MachO::CPU_TYPE_X86_64)
|
2013-04-19 02:08:55 +08:00
|
|
|
return false;
|
2013-09-01 12:28:48 +08:00
|
|
|
return getPlainRelocationAddress(RE) & MachO::R_SCATTERED;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
unsigned MachOObjectFile::getPlainRelocationSymbolNum(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isLittleEndian())
|
2013-09-01 12:28:48 +08:00
|
|
|
return RE.r_word1 & 0xffffff;
|
|
|
|
return RE.r_word1 >> 8;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
bool MachOObjectFile::getPlainRelocationExternal(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isLittleEndian())
|
2013-09-01 12:28:48 +08:00
|
|
|
return (RE.r_word1 >> 27) & 1;
|
|
|
|
return (RE.r_word1 >> 4) & 1;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
bool MachOObjectFile::getScatteredRelocationScattered(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
|
|
|
return RE.r_word0 >> 31;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
uint32_t MachOObjectFile::getScatteredRelocationValue(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
|
|
|
return RE.r_word1;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2014-11-04 08:43:16 +08:00
|
|
|
uint32_t MachOObjectFile::getScatteredRelocationType(
|
|
|
|
const MachO::any_relocation_info &RE) const {
|
|
|
|
return (RE.r_word0 >> 24) & 0xf;
|
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
unsigned MachOObjectFile::getAnyRelocationAddress(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isRelocationScattered(RE))
|
|
|
|
return getScatteredRelocationAddress(RE);
|
|
|
|
return getPlainRelocationAddress(RE);
|
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
unsigned MachOObjectFile::getAnyRelocationPCRel(
|
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isRelocationScattered(RE))
|
2016-12-04 09:56:10 +08:00
|
|
|
return getScatteredRelocationPCRel(RE);
|
|
|
|
return getPlainRelocationPCRel(*this, RE);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-07-23 06:25:07 +08:00
|
|
|
unsigned MachOObjectFile::getAnyRelocationLength(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isRelocationScattered(RE))
|
|
|
|
return getScatteredRelocationLength(RE);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getPlainRelocationLength(*this, RE);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
unsigned
|
2013-09-01 12:28:48 +08:00
|
|
|
MachOObjectFile::getAnyRelocationType(
|
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-19 02:08:55 +08:00
|
|
|
if (isRelocationScattered(RE))
|
|
|
|
return getScatteredRelocationType(RE);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getPlainRelocationType(*this, RE);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-04-30 23:40:54 +08:00
|
|
|
SectionRef
|
2015-05-22 05:24:32 +08:00
|
|
|
MachOObjectFile::getAnyRelocationSection(
|
2013-09-01 12:28:48 +08:00
|
|
|
const MachO::any_relocation_info &RE) const {
|
2013-04-30 23:40:54 +08:00
|
|
|
if (isRelocationScattered(RE) || getPlainRelocationExternal(RE))
|
2014-02-11 04:24:04 +08:00
|
|
|
return *section_end();
|
2015-06-19 06:38:20 +08:00
|
|
|
unsigned SecNum = getPlainRelocationSymbolNum(RE);
|
|
|
|
if (SecNum == MachO::R_ABS || SecNum > Sections.size())
|
|
|
|
return *section_end();
|
2013-04-30 23:40:54 +08:00
|
|
|
DataRefImpl DRI;
|
2015-06-19 06:38:20 +08:00
|
|
|
DRI.d.a = SecNum - 1;
|
2013-04-30 23:40:54 +08:00
|
|
|
return SectionRef(DRI, this);
|
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section MachOObjectFile::getSection(DataRefImpl DRI) const {
|
2015-05-22 23:43:00 +08:00
|
|
|
assert(DRI.d.a < Sections.size() && "Should have detected this earlier");
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::section>(*this, Sections[DRI.d.a]);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section_64 MachOObjectFile::getSection64(DataRefImpl DRI) const {
|
2015-05-22 23:43:00 +08:00
|
|
|
assert(DRI.d.a < Sections.size() && "Should have detected this earlier");
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::section_64>(*this, Sections[DRI.d.a]);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section MachOObjectFile::getSection(const LoadCommandInfo &L,
|
2013-04-27 04:07:33 +08:00
|
|
|
unsigned Index) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
const char *Sec = getSectionPtr(*this, L, Index);
|
|
|
|
return getStruct<MachO::section>(*this, Sec);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::section_64 MachOObjectFile::getSection64(const LoadCommandInfo &L,
|
|
|
|
unsigned Index) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
const char *Sec = getSectionPtr(*this, L, Index);
|
|
|
|
return getStruct<MachO::section_64>(*this, Sec);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::nlist
|
2013-04-19 02:08:55 +08:00
|
|
|
MachOObjectFile::getSymbolTableEntry(DataRefImpl DRI) const {
|
2013-04-25 03:47:55 +08:00
|
|
|
const char *P = reinterpret_cast<const char *>(DRI.p);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::nlist>(*this, P);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::nlist_64
|
2013-04-19 02:08:55 +08:00
|
|
|
MachOObjectFile::getSymbol64TableEntry(DataRefImpl DRI) const {
|
2013-04-25 03:47:55 +08:00
|
|
|
const char *P = reinterpret_cast<const char *>(DRI.p);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::nlist_64>(*this, P);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::linkedit_data_command
|
|
|
|
MachOObjectFile::getLinkeditDataLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::linkedit_data_command>(*this, L.Ptr);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::segment_command
|
2013-04-27 04:07:33 +08:00
|
|
|
MachOObjectFile::getSegmentLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::segment_command>(*this, L.Ptr);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::segment_command_64
|
2013-04-27 04:07:33 +08:00
|
|
|
MachOObjectFile::getSegment64LoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::segment_command_64>(*this, L.Ptr);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2014-12-18 08:53:40 +08:00
|
|
|
MachO::linker_option_command
|
|
|
|
MachOObjectFile::getLinkerOptionLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::linker_option_command>(*this, L.Ptr);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2014-03-19 06:09:05 +08:00
|
|
|
MachO::version_min_command
|
|
|
|
MachOObjectFile::getVersionMinLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::version_min_command>(*this, L.Ptr);
|
2017-01-20 01:36:31 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MachO::note_command
|
|
|
|
MachOObjectFile::getNoteLoadCommand(const LoadCommandInfo &L) const {
|
|
|
|
return getStruct<MachO::note_command>(*this, L.Ptr);
|
2014-03-19 06:09:05 +08:00
|
|
|
}
|
|
|
|
|
2017-01-24 04:07:55 +08:00
|
|
|
MachO::build_version_command
|
|
|
|
MachOObjectFile::getBuildVersionLoadCommand(const LoadCommandInfo &L) const {
|
|
|
|
return getStruct<MachO::build_version_command>(*this, L.Ptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
MachO::build_tool_version
|
|
|
|
MachOObjectFile::getBuildToolVersion(unsigned index) const {
|
|
|
|
return getStruct<MachO::build_tool_version>(*this, BuildTools[index]);
|
|
|
|
}
|
|
|
|
|
2014-06-30 22:40:57 +08:00
|
|
|
MachO::dylib_command
|
|
|
|
MachOObjectFile::getDylibIDLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::dylib_command>(*this, L.Ptr);
|
2014-06-30 22:40:57 +08:00
|
|
|
}
|
|
|
|
|
2014-09-05 00:54:47 +08:00
|
|
|
MachO::dyld_info_command
|
|
|
|
MachOObjectFile::getDyldInfoLoadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::dyld_info_command>(*this, L.Ptr);
|
2014-09-05 00:54:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MachO::dylinker_command
|
|
|
|
MachOObjectFile::getDylinkerCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::dylinker_command>(*this, L.Ptr);
|
2014-09-05 00:54:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MachO::uuid_command
|
|
|
|
MachOObjectFile::getUuidCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::uuid_command>(*this, L.Ptr);
|
2014-09-05 00:54:47 +08:00
|
|
|
}
|
|
|
|
|
2014-12-04 15:37:02 +08:00
|
|
|
MachO::rpath_command
|
|
|
|
MachOObjectFile::getRpathCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::rpath_command>(*this, L.Ptr);
|
2014-12-04 15:37:02 +08:00
|
|
|
}
|
|
|
|
|
2014-09-05 00:54:47 +08:00
|
|
|
MachO::source_version_command
|
|
|
|
MachOObjectFile::getSourceVersionCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::source_version_command>(*this, L.Ptr);
|
2014-09-05 00:54:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MachO::entry_point_command
|
|
|
|
MachOObjectFile::getEntryPointCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::entry_point_command>(*this, L.Ptr);
|
2014-09-05 00:54:47 +08:00
|
|
|
}
|
|
|
|
|
2014-12-17 07:25:52 +08:00
|
|
|
MachO::encryption_info_command
|
|
|
|
MachOObjectFile::getEncryptionInfoCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::encryption_info_command>(*this, L.Ptr);
|
2014-12-17 07:25:52 +08:00
|
|
|
}
|
|
|
|
|
2014-12-17 09:01:30 +08:00
|
|
|
MachO::encryption_info_command_64
|
|
|
|
MachOObjectFile::getEncryptionInfoCommand64(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::encryption_info_command_64>(*this, L.Ptr);
|
2014-12-17 09:01:30 +08:00
|
|
|
}
|
|
|
|
|
2014-12-19 03:24:35 +08:00
|
|
|
MachO::sub_framework_command
|
|
|
|
MachOObjectFile::getSubFrameworkCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::sub_framework_command>(*this, L.Ptr);
|
2014-12-19 03:24:35 +08:00
|
|
|
}
|
2014-06-30 22:40:57 +08:00
|
|
|
|
2014-12-19 07:13:26 +08:00
|
|
|
MachO::sub_umbrella_command
|
|
|
|
MachOObjectFile::getSubUmbrellaCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::sub_umbrella_command>(*this, L.Ptr);
|
2014-12-19 07:13:26 +08:00
|
|
|
}
|
|
|
|
|
2014-12-20 03:48:16 +08:00
|
|
|
MachO::sub_library_command
|
|
|
|
MachOObjectFile::getSubLibraryCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::sub_library_command>(*this, L.Ptr);
|
2014-12-20 03:48:16 +08:00
|
|
|
}
|
|
|
|
|
2014-12-20 05:06:24 +08:00
|
|
|
MachO::sub_client_command
|
|
|
|
MachOObjectFile::getSubClientCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::sub_client_command>(*this, L.Ptr);
|
2014-12-20 05:06:24 +08:00
|
|
|
}
|
|
|
|
|
2014-12-20 06:25:22 +08:00
|
|
|
MachO::routines_command
|
|
|
|
MachOObjectFile::getRoutinesCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::routines_command>(*this, L.Ptr);
|
2014-12-20 06:25:22 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
MachO::routines_command_64
|
|
|
|
MachOObjectFile::getRoutinesCommand64(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::routines_command_64>(*this, L.Ptr);
|
2014-12-20 06:25:22 +08:00
|
|
|
}
|
|
|
|
|
2014-12-24 06:56:39 +08:00
|
|
|
MachO::thread_command
|
|
|
|
MachOObjectFile::getThreadCommand(const LoadCommandInfo &L) const {
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::thread_command>(*this, L.Ptr);
|
2014-12-24 06:56:39 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::any_relocation_info
|
2013-04-19 02:08:55 +08:00
|
|
|
MachOObjectFile::getRelocation(DataRefImpl Rel) const {
|
2014-04-04 07:51:28 +08:00
|
|
|
uint32_t Offset;
|
2017-06-23 01:41:22 +08:00
|
|
|
if (getHeader().filetype == MachO::MH_OBJECT) {
|
|
|
|
DataRefImpl Sec;
|
|
|
|
Sec.d.a = Rel.d.a;
|
|
|
|
if (is64Bit()) {
|
|
|
|
MachO::section_64 Sect = getSection64(Sec);
|
|
|
|
Offset = Sect.reloff;
|
|
|
|
} else {
|
|
|
|
MachO::section Sect = getSection(Sec);
|
|
|
|
Offset = Sect.reloff;
|
|
|
|
}
|
2014-04-04 07:51:28 +08:00
|
|
|
} else {
|
2017-06-23 01:41:22 +08:00
|
|
|
MachO::dysymtab_command DysymtabLoadCmd = getDysymtabLoadCommand();
|
2017-12-16 01:57:40 +08:00
|
|
|
if (Rel.d.a == 0)
|
|
|
|
Offset = DysymtabLoadCmd.extreloff; // Offset to the external relocations
|
|
|
|
else
|
|
|
|
Offset = DysymtabLoadCmd.locreloff; // Offset to the local relocations
|
2014-04-04 07:51:28 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
auto P = reinterpret_cast<const MachO::any_relocation_info *>(
|
2016-12-04 09:56:10 +08:00
|
|
|
getPtr(*this, Offset)) + Rel.d.b;
|
2014-04-04 07:51:28 +08:00
|
|
|
return getStruct<MachO::any_relocation_info>(
|
2016-12-04 09:56:10 +08:00
|
|
|
*this, reinterpret_cast<const char *>(P));
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::data_in_code_entry
|
2013-06-07 01:20:50 +08:00
|
|
|
MachOObjectFile::getDice(DataRefImpl Rel) const {
|
|
|
|
const char *P = reinterpret_cast<const char *>(Rel.p);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::data_in_code_entry>(*this, P);
|
2013-06-07 01:20:50 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 03:22:03 +08:00
|
|
|
const MachO::mach_header &MachOObjectFile::getHeader() const {
|
2015-06-05 06:49:55 +08:00
|
|
|
return Header;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2015-06-05 03:22:03 +08:00
|
|
|
const MachO::mach_header_64 &MachOObjectFile::getHeader64() const {
|
|
|
|
assert(is64Bit());
|
|
|
|
return Header64;
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
uint32_t MachOObjectFile::getIndirectSymbolTableEntry(
|
|
|
|
const MachO::dysymtab_command &DLC,
|
|
|
|
unsigned Index) const {
|
|
|
|
uint64_t Offset = DLC.indirectsymoff + Index * sizeof(uint32_t);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<uint32_t>(*this, getPtr(*this, Offset));
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::data_in_code_entry
|
2013-04-27 04:07:33 +08:00
|
|
|
MachOObjectFile::getDataInCodeTableEntry(uint32_t DataOffset,
|
|
|
|
unsigned Index) const {
|
2013-09-01 12:28:48 +08:00
|
|
|
uint64_t Offset = DataOffset + Index * sizeof(MachO::data_in_code_entry);
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::data_in_code_entry>(*this, getPtr(*this, Offset));
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::symtab_command MachOObjectFile::getSymtabLoadCommand() const {
|
2014-10-24 03:37:31 +08:00
|
|
|
if (SymtabLoadCmd)
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::symtab_command>(*this, SymtabLoadCmd);
|
2014-10-24 03:37:31 +08:00
|
|
|
|
|
|
|
// If there is no SymtabLoadCmd return a load command with zero'ed fields.
|
|
|
|
MachO::symtab_command Cmd;
|
|
|
|
Cmd.cmd = MachO::LC_SYMTAB;
|
|
|
|
Cmd.cmdsize = sizeof(MachO::symtab_command);
|
|
|
|
Cmd.symoff = 0;
|
|
|
|
Cmd.nsyms = 0;
|
|
|
|
Cmd.stroff = 0;
|
|
|
|
Cmd.strsize = 0;
|
|
|
|
return Cmd;
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::dysymtab_command MachOObjectFile::getDysymtabLoadCommand() const {
|
2014-10-24 03:37:31 +08:00
|
|
|
if (DysymtabLoadCmd)
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::dysymtab_command>(*this, DysymtabLoadCmd);
|
2014-10-24 03:37:31 +08:00
|
|
|
|
|
|
|
// If there is no DysymtabLoadCmd return a load command with zero'ed fields.
|
|
|
|
MachO::dysymtab_command Cmd;
|
|
|
|
Cmd.cmd = MachO::LC_DYSYMTAB;
|
|
|
|
Cmd.cmdsize = sizeof(MachO::dysymtab_command);
|
|
|
|
Cmd.ilocalsym = 0;
|
|
|
|
Cmd.nlocalsym = 0;
|
|
|
|
Cmd.iextdefsym = 0;
|
|
|
|
Cmd.nextdefsym = 0;
|
|
|
|
Cmd.iundefsym = 0;
|
|
|
|
Cmd.nundefsym = 0;
|
|
|
|
Cmd.tocoff = 0;
|
|
|
|
Cmd.ntoc = 0;
|
|
|
|
Cmd.modtaboff = 0;
|
|
|
|
Cmd.nmodtab = 0;
|
|
|
|
Cmd.extrefsymoff = 0;
|
|
|
|
Cmd.nextrefsyms = 0;
|
|
|
|
Cmd.indirectsymoff = 0;
|
|
|
|
Cmd.nindirectsyms = 0;
|
|
|
|
Cmd.extreloff = 0;
|
|
|
|
Cmd.nextrel = 0;
|
|
|
|
Cmd.locreloff = 0;
|
|
|
|
Cmd.nlocrel = 0;
|
|
|
|
return Cmd;
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::linkedit_data_command
|
2013-06-07 01:20:50 +08:00
|
|
|
MachOObjectFile::getDataInCodeLoadCommand() const {
|
|
|
|
if (DataInCodeLoadCmd)
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::linkedit_data_command>(*this, DataInCodeLoadCmd);
|
2013-06-07 01:20:50 +08:00
|
|
|
|
|
|
|
// If there is no DataInCodeLoadCmd return a load command with zero'ed fields.
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::linkedit_data_command Cmd;
|
|
|
|
Cmd.cmd = MachO::LC_DATA_IN_CODE;
|
|
|
|
Cmd.cmdsize = sizeof(MachO::linkedit_data_command);
|
2015-01-28 05:28:24 +08:00
|
|
|
Cmd.dataoff = 0;
|
|
|
|
Cmd.datasize = 0;
|
|
|
|
return Cmd;
|
|
|
|
}
|
|
|
|
|
|
|
|
MachO::linkedit_data_command
|
|
|
|
MachOObjectFile::getLinkOptHintsLoadCommand() const {
|
|
|
|
if (LinkOptHintsLoadCmd)
|
2016-12-04 09:56:10 +08:00
|
|
|
return getStruct<MachO::linkedit_data_command>(*this, LinkOptHintsLoadCmd);
|
2015-01-28 05:28:24 +08:00
|
|
|
|
|
|
|
// If there is no LinkOptHintsLoadCmd return a load command with zero'ed
|
|
|
|
// fields.
|
|
|
|
MachO::linkedit_data_command Cmd;
|
|
|
|
Cmd.cmd = MachO::LC_LINKER_OPTIMIZATION_HINT;
|
|
|
|
Cmd.cmdsize = sizeof(MachO::linkedit_data_command);
|
2013-09-01 12:28:48 +08:00
|
|
|
Cmd.dataoff = 0;
|
|
|
|
Cmd.datasize = 0;
|
2013-06-07 01:20:50 +08:00
|
|
|
return Cmd;
|
|
|
|
}
|
|
|
|
|
2014-08-30 08:20:14 +08:00
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getDyldInfoRebaseOpcodes() const {
|
2015-09-22 19:19:03 +08:00
|
|
|
if (!DyldInfoLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return None;
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2015-09-22 19:13:55 +08:00
|
|
|
const uint8_t *Ptr =
|
2016-12-04 09:56:10 +08:00
|
|
|
reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.rebase_off));
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(Ptr, DyldInfo.rebase_size);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getDyldInfoBindOpcodes() const {
|
2015-09-22 19:19:03 +08:00
|
|
|
if (!DyldInfoLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return None;
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2015-09-22 19:13:55 +08:00
|
|
|
const uint8_t *Ptr =
|
2016-12-04 09:56:10 +08:00
|
|
|
reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.bind_off));
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(Ptr, DyldInfo.bind_size);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getDyldInfoWeakBindOpcodes() const {
|
2015-09-22 19:19:03 +08:00
|
|
|
if (!DyldInfoLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return None;
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2015-09-22 19:13:55 +08:00
|
|
|
const uint8_t *Ptr =
|
2016-12-04 09:56:10 +08:00
|
|
|
reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.weak_bind_off));
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(Ptr, DyldInfo.weak_bind_size);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getDyldInfoLazyBindOpcodes() const {
|
2015-09-22 19:19:03 +08:00
|
|
|
if (!DyldInfoLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return None;
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2015-09-22 19:13:55 +08:00
|
|
|
const uint8_t *Ptr =
|
2016-12-04 09:56:10 +08:00
|
|
|
reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.lazy_bind_off));
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(Ptr, DyldInfo.lazy_bind_size);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getDyldInfoExportsTrie() const {
|
2015-09-22 19:19:03 +08:00
|
|
|
if (!DyldInfoLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2019-06-05 00:55:30 +08:00
|
|
|
auto DyldInfoOrErr =
|
|
|
|
getStructOrErr<MachO::dyld_info_command>(*this, DyldInfoLoadCmd);
|
|
|
|
if (!DyldInfoOrErr)
|
|
|
|
return None;
|
|
|
|
MachO::dyld_info_command DyldInfo = DyldInfoOrErr.get();
|
2015-09-22 19:13:55 +08:00
|
|
|
const uint8_t *Ptr =
|
2016-12-04 09:56:10 +08:00
|
|
|
reinterpret_cast<const uint8_t *>(getPtr(*this, DyldInfo.export_off));
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(Ptr, DyldInfo.export_size);
|
2014-08-30 08:20:14 +08:00
|
|
|
}
|
|
|
|
|
2014-10-16 07:35:45 +08:00
|
|
|
ArrayRef<uint8_t> MachOObjectFile::getUuid() const {
|
|
|
|
if (!UuidLoadCmd)
|
2015-09-21 13:32:41 +08:00
|
|
|
return None;
|
2014-10-24 23:52:05 +08:00
|
|
|
// Returning a pointer is fine as uuid doesn't need endian swapping.
|
|
|
|
const char *Ptr = UuidLoadCmd + offsetof(MachO::uuid_command, uuid);
|
2015-09-21 13:32:41 +08:00
|
|
|
return makeArrayRef(reinterpret_cast<const uint8_t *>(Ptr), 16);
|
2014-10-16 07:35:45 +08:00
|
|
|
}
|
2014-08-30 08:20:14 +08:00
|
|
|
|
2013-04-27 04:07:33 +08:00
|
|
|
StringRef MachOObjectFile::getStringTableData() const {
|
2013-09-01 12:28:48 +08:00
|
|
|
MachO::symtab_command S = getSymtabLoadCommand();
|
|
|
|
return getData().substr(S.stroff, S.strsize);
|
2013-04-27 04:07:33 +08:00
|
|
|
}
|
|
|
|
|
2013-04-19 02:08:55 +08:00
|
|
|
bool MachOObjectFile::is64Bit() const {
|
|
|
|
return getType() == getMachOType(false, true) ||
|
2014-07-16 03:35:22 +08:00
|
|
|
getType() == getMachOType(true, true);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void MachOObjectFile::ReadULEB128s(uint64_t Index,
|
|
|
|
SmallVectorImpl<uint64_t> &Out) const {
|
|
|
|
DataExtractor extractor(ObjectFile::getData(), true, 0);
|
|
|
|
|
2019-08-06 18:49:40 +08:00
|
|
|
uint64_t offset = Index;
|
2013-04-19 02:08:55 +08:00
|
|
|
uint64_t data = 0;
|
|
|
|
while (uint64_t delta = extractor.getULEB128(&offset)) {
|
|
|
|
data += delta;
|
|
|
|
Out.push_back(data);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-08-18 03:09:37 +08:00
|
|
|
bool MachOObjectFile::isRelocatableObject() const {
|
|
|
|
return getHeader().filetype == MachO::MH_OBJECT;
|
|
|
|
}
|
|
|
|
|
2016-03-26 07:11:52 +08:00
|
|
|
Expected<std::unique_ptr<MachOObjectFile>>
|
2016-10-25 05:15:11 +08:00
|
|
|
ObjectFile::createMachOObjectFile(MemoryBufferRef Buffer,
|
|
|
|
uint32_t UniversalCputype,
|
|
|
|
uint32_t UniversalIndex) {
|
2014-08-20 02:44:46 +08:00
|
|
|
StringRef Magic = Buffer.getBuffer().slice(0, 4);
|
2016-03-26 05:59:14 +08:00
|
|
|
if (Magic == "\xFE\xED\xFA\xCE")
|
2016-10-25 05:15:11 +08:00
|
|
|
return MachOObjectFile::create(Buffer, false, false,
|
|
|
|
UniversalCputype, UniversalIndex);
|
2016-03-29 01:45:48 +08:00
|
|
|
if (Magic == "\xCE\xFA\xED\xFE")
|
2016-10-25 05:15:11 +08:00
|
|
|
return MachOObjectFile::create(Buffer, true, false,
|
|
|
|
UniversalCputype, UniversalIndex);
|
2016-03-29 01:45:48 +08:00
|
|
|
if (Magic == "\xFE\xED\xFA\xCF")
|
2016-10-25 05:15:11 +08:00
|
|
|
return MachOObjectFile::create(Buffer, false, true,
|
|
|
|
UniversalCputype, UniversalIndex);
|
2016-03-29 01:45:48 +08:00
|
|
|
if (Magic == "\xCF\xFA\xED\xFE")
|
2016-10-25 05:15:11 +08:00
|
|
|
return MachOObjectFile::create(Buffer, true, true,
|
|
|
|
UniversalCputype, UniversalIndex);
|
2016-05-07 04:16:28 +08:00
|
|
|
return make_error<GenericBinaryError>("Unrecognized MachO magic number",
|
2016-05-06 07:59:57 +08:00
|
|
|
object_error::invalid_file_type);
|
2013-04-19 02:08:55 +08:00
|
|
|
}
|
2017-06-06 09:22:34 +08:00
|
|
|
|
|
|
|
StringRef MachOObjectFile::mapDebugSectionName(StringRef Name) const {
|
|
|
|
return StringSwitch<StringRef>(Name)
|
|
|
|
.Case("debug_str_offs", "debug_str_offsets")
|
|
|
|
.Default(Name);
|
|
|
|
}
|