//===--- CodeGenTBAA.h - TBAA information for LLVM CodeGen ------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This is the code that manages TBAA information and defines the TBAA policy
// for the optimizer to use.
//
//===----------------------------------------------------------------------===//
|
|
|
|
|
2014-08-14 00:25:19 +08:00
|
|
|
#ifndef LLVM_CLANG_LIB_CODEGEN_CODEGENTBAA_H
|
|
|
|
#define LLVM_CLANG_LIB_CODEGEN_CODEGENTBAA_H
|
2010-10-15 07:06:10 +08:00
|
|
|
|
2016-02-02 22:24:21 +08:00
|
|
|
#include "clang/AST/Type.h"
|
2011-07-20 14:58:45 +08:00
|
|
|
#include "clang/Basic/LLVM.h"
|
2010-10-15 07:06:10 +08:00
|
|
|
#include "llvm/ADT/DenseMap.h"
|
2013-01-02 19:45:17 +08:00
|
|
|
#include "llvm/IR/MDBuilder.h"
|
2016-02-02 22:24:21 +08:00
|
|
|
#include "llvm/IR/Metadata.h"
|
2010-10-15 07:06:10 +08:00
|
|
|
|
|
|
|
namespace clang {
|
|
|
|
class ASTContext;
|
2012-04-24 14:57:01 +08:00
|
|
|
class CodeGenOptions;
|
2010-10-15 07:06:10 +08:00
|
|
|
class LangOptions;
|
2011-01-14 02:57:25 +08:00
|
|
|
class MangleContext;
|
2010-10-15 07:06:10 +08:00
|
|
|
class QualType;
|
|
|
|
class Type;
|
|
|
|
|
|
|
|
namespace CodeGen {
|
2017-10-03 18:52:39 +08:00
|
|
|
class CGRecordLayout;
|
|
|
|
|
2017-10-31 19:05:34 +08:00
|
|
|
// TBAAAccessKind - A kind of TBAA memory access descriptor.
//
// The underlying type is fixed to unsigned and the enumerators rely on their
// implicit values (0, 1, 2, ...); keep the order stable when adding new kinds.
enum class TBAAAccessKind : unsigned {
  Ordinary,     // An ordinary memory access.
  MayAlias,     // An access that may alias with any other accesses.
  Incomplete,   // Used to designate pointee values of incomplete types.
  UnionMember,  // An access to a direct or indirect union member.
};
|
|
|
|
|
2017-10-03 18:52:39 +08:00
|
|
|
// TBAAAccessInfo - Describes a memory access in terms of TBAA.
|
|
|
|
struct TBAAAccessInfo {
|
2017-10-31 19:05:34 +08:00
|
|
|
TBAAAccessInfo(TBAAAccessKind Kind, llvm::MDNode *BaseType,
|
2017-11-27 17:39:29 +08:00
|
|
|
llvm::MDNode *AccessType, uint64_t Offset, uint64_t Size)
|
|
|
|
: Kind(Kind), BaseType(BaseType), AccessType(AccessType),
|
|
|
|
Offset(Offset), Size(Size)
|
2017-10-31 19:05:34 +08:00
|
|
|
{}
|
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
TBAAAccessInfo(llvm::MDNode *BaseType, llvm::MDNode *AccessType,
|
2017-11-27 17:39:29 +08:00
|
|
|
uint64_t Offset, uint64_t Size)
|
|
|
|
: TBAAAccessInfo(TBAAAccessKind::Ordinary, BaseType, AccessType,
|
|
|
|
Offset, Size)
|
2017-10-03 18:52:39 +08:00
|
|
|
{}
|
|
|
|
|
2017-11-27 17:39:29 +08:00
|
|
|
explicit TBAAAccessInfo(llvm::MDNode *AccessType, uint64_t Size)
|
|
|
|
: TBAAAccessInfo(/* BaseType= */ nullptr, AccessType, /* Offset= */ 0, Size)
|
2017-10-03 18:52:39 +08:00
|
|
|
{}
|
|
|
|
|
|
|
|
TBAAAccessInfo()
|
2017-11-27 17:39:29 +08:00
|
|
|
: TBAAAccessInfo(/* AccessType= */ nullptr, /* Size= */ 0)
|
2017-10-03 18:52:39 +08:00
|
|
|
{}
|
2010-10-15 07:06:10 +08:00
|
|
|
|
2017-10-31 19:05:34 +08:00
|
|
|
static TBAAAccessInfo getMayAliasInfo() {
|
2017-11-27 17:39:29 +08:00
|
|
|
return TBAAAccessInfo(TBAAAccessKind::MayAlias,
|
|
|
|
/* BaseType= */ nullptr, /* AccessType= */ nullptr,
|
|
|
|
/* Offset= */ 0, /* Size= */ 0);
|
2017-10-31 19:05:34 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
bool isMayAlias() const { return Kind == TBAAAccessKind::MayAlias; }
|
|
|
|
|
2017-11-27 17:39:29 +08:00
|
|
|
static TBAAAccessInfo getIncompleteInfo() {
|
|
|
|
return TBAAAccessInfo(TBAAAccessKind::Incomplete,
|
|
|
|
/* BaseType= */ nullptr, /* AccessType= */ nullptr,
|
|
|
|
/* Offset= */ 0, /* Size= */ 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool isIncomplete() const { return Kind == TBAAAccessKind::Incomplete; }
|
|
|
|
|
[CodeGen] Add initial support for union members in TBAA
The basic idea behind this patch is that since in strict aliasing
mode all accesses to union members require their outermost
enclosing union objects to be specified explicitly, then for a
couple given accesses to union members of the form
p->a.b.c...
q->x.y.z...
it is known they can only alias if both p and q point to the same
union type and offset ranges of members a.b.c... and x.y.z...
overlap. Note that the actual types of the members do not matter.
Specifically, in this patch we do the following:
* Make unions to be valid TBAA base access types. This enables
generation of TBAA type descriptors for unions.
* Encode union types as structures with a single member of a
special "union member" type. Currently we do not encode
information about sizes of types, but conceptually such union
members are considered to be of the size of the whole union.
* Encode accesses to direct and indirect union members, including
member arrays, as accesses to these special members. All
accesses to members of a union thus get the same offset, which
is the offset of the union they are part of. This means the
existing LLVM TBAA machinery is able to handle such accesses
with no changes.
While this is already an improvement comparing to the current
situation, that is, representing all union accesses as may-alias
ones, there are further changes planned to complete the support
for unions. One of them is storing information about access sizes
so we can distinct accesses to non-overlapping union members,
including accesses to different elements of member arrays.
Another change is encoding type sizes in order to make it
possible to compute offsets within constant-indexed array
elements. These enhancements will be addressed with separate
patches.
Differential Revision: https://reviews.llvm.org/D39455
llvm-svn: 319413
2017-11-30 17:26:39 +08:00
|
|
|
static TBAAAccessInfo getUnionMemberInfo(llvm::MDNode *BaseType,
|
|
|
|
uint64_t Offset, uint64_t Size) {
|
|
|
|
return TBAAAccessInfo(TBAAAccessKind::UnionMember, BaseType,
|
|
|
|
/* AccessType= */ nullptr, Offset, Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool isUnionMember() const { return Kind == TBAAAccessKind::UnionMember; }
|
|
|
|
|
2017-10-17 17:12:13 +08:00
|
|
|
bool operator==(const TBAAAccessInfo &Other) const {
|
2017-10-31 19:05:34 +08:00
|
|
|
return Kind == Other.Kind &&
|
|
|
|
BaseType == Other.BaseType &&
|
2017-10-17 17:12:13 +08:00
|
|
|
AccessType == Other.AccessType &&
|
2017-11-27 17:39:29 +08:00
|
|
|
Offset == Other.Offset &&
|
|
|
|
Size == Other.Size;
|
2017-10-17 17:12:13 +08:00
|
|
|
}
|
|
|
|
|
2017-10-31 19:05:34 +08:00
|
|
|
bool operator!=(const TBAAAccessInfo &Other) const {
|
|
|
|
return !(*this == Other);
|
|
|
|
}
|
|
|
|
|
|
|
|
explicit operator bool() const {
|
|
|
|
return *this != TBAAAccessInfo();
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Kind - The kind of the access descriptor.
|
|
|
|
TBAAAccessKind Kind;
|
|
|
|
|
2017-10-03 18:52:39 +08:00
|
|
|
/// BaseType - The base/leading access type. May be null if this access
|
|
|
|
/// descriptor represents an access that is not considered to be an access
|
|
|
|
/// to an aggregate or union member.
|
2017-10-06 16:17:48 +08:00
|
|
|
llvm::MDNode *BaseType;
|
2017-10-03 18:52:39 +08:00
|
|
|
|
|
|
|
/// AccessType - The final access type. May be null if there is no TBAA
|
|
|
|
/// information available about this access.
|
|
|
|
llvm::MDNode *AccessType;
|
|
|
|
|
|
|
|
/// Offset - The byte offset of the final access within the base one. Must be
|
|
|
|
/// zero if the base access type is not specified.
|
|
|
|
uint64_t Offset;
|
2017-11-27 17:39:29 +08:00
|
|
|
|
|
|
|
/// Size - The size of access, in bytes.
|
|
|
|
uint64_t Size;
|
2017-10-03 18:52:39 +08:00
|
|
|
};
|
2013-04-05 05:53:22 +08:00
|
|
|
|
2010-10-15 07:06:10 +08:00
|
|
|
/// CodeGenTBAA - This class organizes the cross-module state that is used
|
|
|
|
/// while lowering AST types to LLVM types.
|
|
|
|
class CodeGenTBAA {
|
|
|
|
ASTContext &Context;
|
2017-11-27 17:39:29 +08:00
|
|
|
llvm::Module &Module;
|
2012-04-24 14:57:01 +08:00
|
|
|
const CodeGenOptions &CodeGenOpts;
|
2010-10-15 07:06:10 +08:00
|
|
|
const LangOptions &Features;
|
2010-10-16 04:23:12 +08:00
|
|
|
MangleContext &MContext;
|
2010-10-15 07:06:10 +08:00
|
|
|
|
2012-04-16 02:04:54 +08:00
|
|
|
// MDHelper - Helper for creating metadata.
|
|
|
|
llvm::MDBuilder MDHelper;
|
|
|
|
|
2013-04-05 05:53:22 +08:00
|
|
|
/// MetadataCache - This maps clang::Types to scalar llvm::MDNodes describing
|
|
|
|
/// them.
|
2010-10-15 07:06:10 +08:00
|
|
|
llvm::DenseMap<const Type *, llvm::MDNode *> MetadataCache;
|
2017-10-06 16:17:48 +08:00
|
|
|
/// This maps clang::Types to a base access type in the type DAG.
|
|
|
|
llvm::DenseMap<const Type *, llvm::MDNode *> BaseTypeMetadataCache;
|
|
|
|
/// This maps TBAA access descriptors to tag nodes.
|
|
|
|
llvm::DenseMap<TBAAAccessInfo, llvm::MDNode *> AccessTagMetadataCache;
|
2010-10-15 07:06:10 +08:00
|
|
|
|
2012-09-29 05:58:29 +08:00
|
|
|
/// StructMetadataCache - This maps clang::Types to llvm::MDNodes describing
|
|
|
|
/// them for struct assignments.
|
|
|
|
llvm::DenseMap<const Type *, llvm::MDNode *> StructMetadataCache;
|
|
|
|
|
2010-10-15 07:06:10 +08:00
|
|
|
llvm::MDNode *Root;
|
2010-10-26 05:48:30 +08:00
|
|
|
llvm::MDNode *Char;
|
2010-10-15 07:06:10 +08:00
|
|
|
|
2010-10-26 05:48:30 +08:00
|
|
|
/// getRoot - This is the mdnode for the root of the metadata type graph
|
|
|
|
/// for this translation unit.
|
|
|
|
llvm::MDNode *getRoot();
|
|
|
|
|
|
|
|
/// getChar - This is the mdnode for "char", which is special, and any types
|
2010-10-15 07:06:10 +08:00
|
|
|
/// considered to be equivalent to it.
|
2010-10-26 05:48:30 +08:00
|
|
|
llvm::MDNode *getChar();
|
2010-10-15 07:06:10 +08:00
|
|
|
|
[CodeGen] Add initial support for union members in TBAA
The basic idea behind this patch is that since in strict aliasing
mode all accesses to union members require their outermost
enclosing union objects to be specified explicitly, then for a
couple given accesses to union members of the form
p->a.b.c...
q->x.y.z...
it is known they can only alias if both p and q point to the same
union type and offset ranges of members a.b.c... and x.y.z...
overlap. Note that the actual types of the members do not matter.
Specifically, in this patch we do the following:
* Make unions to be valid TBAA base access types. This enables
generation of TBAA type descriptors for unions.
* Encode union types as structures with a single member of a
special "union member" type. Currently we do not encode
information about sizes of types, but conceptually such union
members are considered to be of the size of the whole union.
* Encode accesses to direct and indirect union members, including
member arrays, as accesses to these special members. All
accesses to members of a union thus get the same offset, which
is the offset of the union they are part of. This means the
existing LLVM TBAA machinery is able to handle such accesses
with no changes.
While this is already an improvement comparing to the current
situation, that is, representing all union accesses as may-alias
ones, there are further changes planned to complete the support
for unions. One of them is storing information about access sizes
so we can distinct accesses to non-overlapping union members,
including accesses to different elements of member arrays.
Another change is encoding type sizes in order to make it
possible to compute offsets within constant-indexed array
elements. These enhancements will be addressed with separate
patches.
Differential Revision: https://reviews.llvm.org/D39455
llvm-svn: 319413
2017-11-30 17:26:39 +08:00
|
|
|
/// getUnionMemberType - Get metadata that represents the type of union
|
|
|
|
/// members.
|
|
|
|
llvm::MDNode *getUnionMemberType(uint64_t Size);
|
|
|
|
|
2012-09-29 05:58:29 +08:00
|
|
|
/// CollectFields - Collect information about the fields of a type for
|
|
|
|
/// !tbaa.struct metadata formation. Return false for an unsupported type.
|
|
|
|
bool CollectFields(uint64_t BaseOffset,
|
|
|
|
QualType Ty,
|
|
|
|
SmallVectorImpl<llvm::MDBuilder::TBAAStructField> &Fields,
|
|
|
|
bool MayAlias);
|
|
|
|
|
2017-11-27 17:39:29 +08:00
|
|
|
/// createScalarTypeNode - A wrapper function to create a metadata node
|
|
|
|
/// describing a scalar type.
|
|
|
|
llvm::MDNode *createScalarTypeNode(StringRef Name, llvm::MDNode *Parent,
|
|
|
|
uint64_t Size);
|
2013-04-12 07:02:56 +08:00
|
|
|
|
2017-11-21 19:18:06 +08:00
|
|
|
/// getTypeInfoHelper - An internal helper function to generate metadata used
|
|
|
|
/// to describe accesses to objects of the given type.
|
|
|
|
llvm::MDNode *getTypeInfoHelper(const Type *Ty);
|
|
|
|
|
|
|
|
/// getBaseTypeInfoHelper - An internal helper function to generate metadata
|
|
|
|
/// used to describe accesses to objects of the given base type.
|
|
|
|
llvm::MDNode *getBaseTypeInfoHelper(const Type *Ty);
|
|
|
|
|
2010-10-15 07:06:10 +08:00
|
|
|
public:
|
2017-11-27 17:39:29 +08:00
|
|
|
CodeGenTBAA(ASTContext &Ctx, llvm::Module &M, const CodeGenOptions &CGO,
|
|
|
|
const LangOptions &Features, MangleContext &MContext);
|
2010-10-15 07:06:10 +08:00
|
|
|
~CodeGenTBAA();
|
|
|
|
|
2017-10-02 17:54:47 +08:00
|
|
|
/// getTypeInfo - Get metadata used to describe accesses to objects of the
|
|
|
|
/// given type.
|
|
|
|
llvm::MDNode *getTypeInfo(QualType QTy);
|
2012-03-27 01:03:51 +08:00
|
|
|
|
2017-10-05 19:08:17 +08:00
|
|
|
/// getVTablePtrAccessInfo - Get the TBAA information that describes an
|
|
|
|
/// access to a virtual table pointer.
|
2017-11-27 17:39:29 +08:00
|
|
|
TBAAAccessInfo getVTablePtrAccessInfo(llvm::Type *VTablePtrType);
|
2012-09-29 05:58:29 +08:00
|
|
|
|
|
|
|
/// getTBAAStructInfo - Get the TBAAStruct MDNode to be used for a memcpy of
|
|
|
|
/// the given type.
|
|
|
|
llvm::MDNode *getTBAAStructInfo(QualType QTy);
|
2013-04-05 05:53:22 +08:00
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
/// getBaseTypeInfo - Get metadata that describes the given base access type.
|
|
|
|
/// Return null if the type is not suitable for use in TBAA access tags.
|
|
|
|
llvm::MDNode *getBaseTypeInfo(QualType QTy);
|
2017-10-05 19:05:43 +08:00
|
|
|
|
2017-10-05 19:08:17 +08:00
|
|
|
/// getAccessTagInfo - Get TBAA tag for a given memory access.
|
|
|
|
llvm::MDNode *getAccessTagInfo(TBAAAccessInfo Info);
|
2013-04-12 07:02:56 +08:00
|
|
|
|
2017-10-17 17:12:13 +08:00
|
|
|
/// mergeTBAAInfoForCast - Get merged TBAA information for the purpose of
|
|
|
|
/// type casts.
|
|
|
|
TBAAAccessInfo mergeTBAAInfoForCast(TBAAAccessInfo SourceInfo,
|
|
|
|
TBAAAccessInfo TargetInfo);
|
2017-10-31 19:05:34 +08:00
|
|
|
|
|
|
|
/// mergeTBAAInfoForConditionalOperator - Get merged TBAA information for the
|
|
|
|
/// purpose of conditional operator.
|
|
|
|
TBAAAccessInfo mergeTBAAInfoForConditionalOperator(TBAAAccessInfo InfoA,
|
|
|
|
TBAAAccessInfo InfoB);
|
2010-10-15 07:06:10 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
} // end namespace CodeGen
|
|
|
|
} // end namespace clang
|
|
|
|
|
2013-04-05 05:53:22 +08:00
|
|
|
namespace llvm {
|
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
template<> struct DenseMapInfo<clang::CodeGen::TBAAAccessInfo> {
|
|
|
|
static clang::CodeGen::TBAAAccessInfo getEmptyKey() {
|
2017-10-31 19:05:34 +08:00
|
|
|
unsigned UnsignedKey = DenseMapInfo<unsigned>::getEmptyKey();
|
2017-10-06 16:17:48 +08:00
|
|
|
return clang::CodeGen::TBAAAccessInfo(
|
2017-10-31 19:05:34 +08:00
|
|
|
static_cast<clang::CodeGen::TBAAAccessKind>(UnsignedKey),
|
2017-10-06 16:17:48 +08:00
|
|
|
DenseMapInfo<MDNode *>::getEmptyKey(),
|
|
|
|
DenseMapInfo<MDNode *>::getEmptyKey(),
|
2017-11-27 17:39:29 +08:00
|
|
|
DenseMapInfo<uint64_t>::getEmptyKey(),
|
2013-04-05 05:53:22 +08:00
|
|
|
DenseMapInfo<uint64_t>::getEmptyKey());
|
|
|
|
}
|
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
static clang::CodeGen::TBAAAccessInfo getTombstoneKey() {
|
2017-10-31 19:05:34 +08:00
|
|
|
unsigned UnsignedKey = DenseMapInfo<unsigned>::getTombstoneKey();
|
2017-10-06 16:17:48 +08:00
|
|
|
return clang::CodeGen::TBAAAccessInfo(
|
2017-10-31 19:05:34 +08:00
|
|
|
static_cast<clang::CodeGen::TBAAAccessKind>(UnsignedKey),
|
2017-10-06 16:17:48 +08:00
|
|
|
DenseMapInfo<MDNode *>::getTombstoneKey(),
|
|
|
|
DenseMapInfo<MDNode *>::getTombstoneKey(),
|
2017-11-27 17:39:29 +08:00
|
|
|
DenseMapInfo<uint64_t>::getTombstoneKey(),
|
2013-04-05 05:53:22 +08:00
|
|
|
DenseMapInfo<uint64_t>::getTombstoneKey());
|
|
|
|
}
|
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
static unsigned getHashValue(const clang::CodeGen::TBAAAccessInfo &Val) {
|
2017-10-31 19:05:34 +08:00
|
|
|
auto KindValue = static_cast<unsigned>(Val.Kind);
|
|
|
|
return DenseMapInfo<unsigned>::getHashValue(KindValue) ^
|
|
|
|
DenseMapInfo<MDNode *>::getHashValue(Val.BaseType) ^
|
2017-10-06 16:17:48 +08:00
|
|
|
DenseMapInfo<MDNode *>::getHashValue(Val.AccessType) ^
|
2017-11-27 17:39:29 +08:00
|
|
|
DenseMapInfo<uint64_t>::getHashValue(Val.Offset) ^
|
|
|
|
DenseMapInfo<uint64_t>::getHashValue(Val.Size);
|
2013-04-05 05:53:22 +08:00
|
|
|
}
|
|
|
|
|
2017-10-06 16:17:48 +08:00
|
|
|
static bool isEqual(const clang::CodeGen::TBAAAccessInfo &LHS,
|
|
|
|
const clang::CodeGen::TBAAAccessInfo &RHS) {
|
2017-10-31 19:05:34 +08:00
|
|
|
return LHS == RHS;
|
2013-04-05 05:53:22 +08:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
} // end namespace llvm
|
|
|
|
|
2010-10-15 07:06:10 +08:00
|
|
|
#endif
|