forked from OSchip/llvm-project
CodeGen: Cast alloca to expected address space
Alloca always returns a pointer in alloca address space, which may be different from the type defined by the language. For example, in C++ the auto variables are in the default address space. Therefore cast alloca to the expected address space when necessary. Differential Revision: https://reviews.llvm.org/D32248 llvm-svn: 303370
This commit is contained in:
parent
b00ffd8cb7
commit
6d96f16347
|
@ -2324,8 +2324,7 @@ public:
|
|||
uint64_t getTargetNullPointerValue(QualType QT) const;
|
||||
|
||||
bool addressSpaceMapManglingFor(unsigned AS) const {
|
||||
return AddrSpaceMapMangling ||
|
||||
AS >= LangAS::Count;
|
||||
return AddrSpaceMapMangling || AS >= LangAS::FirstTargetAddressSpace;
|
||||
}
|
||||
|
||||
private:
|
||||
|
|
|
@ -333,15 +333,18 @@ public:
|
|||
|
||||
bool hasAddressSpace() const { return Mask & AddressSpaceMask; }
|
||||
unsigned getAddressSpace() const { return Mask >> AddressSpaceShift; }
|
||||
bool hasTargetSpecificAddressSpace() const {
|
||||
return getAddressSpace() >= LangAS::FirstTargetAddressSpace;
|
||||
}
|
||||
/// Get the address space attribute value to be printed by diagnostics.
|
||||
unsigned getAddressSpaceAttributePrintValue() const {
|
||||
auto Addr = getAddressSpace();
|
||||
// This function is not supposed to be used with language specific
|
||||
// address spaces. If that happens, the diagnostic message should consider
|
||||
// printing the QualType instead of the address space value.
|
||||
assert(Addr == 0 || Addr >= LangAS::Count);
|
||||
assert(Addr == 0 || hasTargetSpecificAddressSpace());
|
||||
if (Addr)
|
||||
return Addr - LangAS::Count;
|
||||
return Addr - LangAS::FirstTargetAddressSpace;
|
||||
// TODO: The diagnostic messages where Addr may be 0 should be fixed
|
||||
// since it cannot differentiate the situation where 0 denotes the default
|
||||
// address space or user specified __attribute__((address_space(0))).
|
||||
|
|
|
@ -45,13 +45,12 @@ enum ID {
|
|||
// This denotes the count of language-specific address spaces and also
|
||||
// the offset added to the target-specific address spaces, which are usually
|
||||
// specified by address space attributes __attribute__(address_space(n))).
|
||||
Count
|
||||
FirstTargetAddressSpace
|
||||
};
|
||||
|
||||
/// The type of a lookup table which maps from language-specific address spaces
|
||||
/// to target-specific ones.
|
||||
typedef unsigned Map[Count];
|
||||
|
||||
typedef unsigned Map[FirstTargetAddressSpace];
|
||||
}
|
||||
|
||||
}
|
||||
|
|
|
@ -2490,7 +2490,7 @@ def err_attribute_address_multiple_qualifiers : Error<
|
|||
def err_attribute_address_function_type : Error<
|
||||
"function type may not be qualified with an address space">;
|
||||
def err_as_qualified_auto_decl : Error<
|
||||
"automatic variable qualified with an address space">;
|
||||
"automatic variable qualified with an%select{| invalid}0 address space">;
|
||||
def err_arg_with_address_space : Error<
|
||||
"parameter may not be qualified with an address space">;
|
||||
def err_field_with_address_space : Error<
|
||||
|
|
|
@ -8730,8 +8730,8 @@ static QualType DecodeTypeFromStr(const char *&Str, const ASTContext &Context,
|
|||
char *End;
|
||||
unsigned AddrSpace = strtoul(Str, &End, 10);
|
||||
if (End != Str && AddrSpace != 0) {
|
||||
Type = Context.getAddrSpaceQualType(Type, AddrSpace +
|
||||
LangAS::Count);
|
||||
Type = Context.getAddrSpaceQualType(
|
||||
Type, AddrSpace + LangAS::FirstTargetAddressSpace);
|
||||
Str = End;
|
||||
}
|
||||
if (c == '*')
|
||||
|
@ -9546,13 +9546,8 @@ uint64_t ASTContext::getTargetNullPointerValue(QualType QT) const {
|
|||
}
|
||||
|
||||
unsigned ASTContext::getTargetAddressSpace(unsigned AS) const {
|
||||
// For OpenCL, only function local variables are not explicitly marked with
|
||||
// an address space in the AST, and these need to be the address space of
|
||||
// alloca.
|
||||
if (!AS && LangOpts.OpenCL)
|
||||
return getTargetInfo().getDataLayout().getAllocaAddrSpace();
|
||||
if (AS >= LangAS::Count)
|
||||
return AS - LangAS::Count;
|
||||
if (AS >= LangAS::FirstTargetAddressSpace)
|
||||
return AS - LangAS::FirstTargetAddressSpace;
|
||||
else
|
||||
return (*AddrSpaceMap)[AS];
|
||||
}
|
||||
|
|
|
@ -1668,9 +1668,9 @@ void Qualifiers::print(raw_ostream &OS, const PrintingPolicy& Policy,
|
|||
OS << "__shared";
|
||||
break;
|
||||
default:
|
||||
assert(addrspace >= LangAS::Count);
|
||||
assert(addrspace >= LangAS::FirstTargetAddressSpace);
|
||||
OS << "__attribute__((address_space(";
|
||||
OS << addrspace - LangAS::Count;
|
||||
OS << addrspace - LangAS::FirstTargetAddressSpace;
|
||||
OS << ")))";
|
||||
}
|
||||
}
|
||||
|
|
|
@ -2034,25 +2034,45 @@ ArrayRef<const char *> NVPTXTargetInfo::getGCCRegNames() const {
|
|||
return llvm::makeArrayRef(GCCRegNames);
|
||||
}
|
||||
|
||||
static const LangAS::Map AMDGPUPrivateIsZeroMap = {
|
||||
4, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
4, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
static const LangAS::Map AMDGPUNonOpenCLPrivateIsZeroMap = {
|
||||
4, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
4, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
};
|
||||
static const LangAS::Map AMDGPUGenericIsZeroMap = {
|
||||
0, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
0, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
static const LangAS::Map AMDGPUNonOpenCLGenericIsZeroMap = {
|
||||
0, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
0, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
};
|
||||
static const LangAS::Map AMDGPUOpenCLPrivateIsZeroMap = {
|
||||
0, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
4, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
};
|
||||
static const LangAS::Map AMDGPUOpenCLGenericIsZeroMap = {
|
||||
5, // Default
|
||||
1, // opencl_global
|
||||
3, // opencl_local
|
||||
2, // opencl_constant
|
||||
0, // opencl_generic
|
||||
1, // cuda_device
|
||||
2, // cuda_constant
|
||||
3 // cuda_shared
|
||||
};
|
||||
|
||||
// If you edit the description strings, make sure you update
|
||||
|
@ -2149,8 +2169,12 @@ public:
|
|||
: DataLayoutStringR600);
|
||||
assert(DataLayout->getAllocaAddrSpace() == AS.Private);
|
||||
|
||||
AddrSpaceMap = IsGenericZero ? &AMDGPUGenericIsZeroMap :
|
||||
&AMDGPUPrivateIsZeroMap;
|
||||
AddrSpaceMap =
|
||||
llvm::StringSwitch<const LangAS::Map *>(Triple.getEnvironmentName())
|
||||
.Case("opencl", &AMDGPUOpenCLPrivateIsZeroMap)
|
||||
.Case("amdgiz", &AMDGPUNonOpenCLGenericIsZeroMap)
|
||||
.Case("amdgizcl", &AMDGPUOpenCLGenericIsZeroMap)
|
||||
.Default(&AMDGPUNonOpenCLPrivateIsZeroMap);
|
||||
UseAddrSpaceMapMangling = true;
|
||||
}
|
||||
|
||||
|
|
|
@ -11,14 +11,15 @@
|
|||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
#include "CodeGenFunction.h"
|
||||
#include "CGBlocks.h"
|
||||
#include "CGCXXABI.h"
|
||||
#include "CGCleanup.h"
|
||||
#include "CGDebugInfo.h"
|
||||
#include "CGOpenCLRuntime.h"
|
||||
#include "CGOpenMPRuntime.h"
|
||||
#include "CodeGenFunction.h"
|
||||
#include "CodeGenModule.h"
|
||||
#include "TargetInfo.h"
|
||||
#include "clang/AST/ASTContext.h"
|
||||
#include "clang/AST/CharUnits.h"
|
||||
#include "clang/AST/Decl.h"
|
||||
|
@ -1105,6 +1106,21 @@ CodeGenFunction::EmitAutoVarAlloca(const VarDecl &D) {
|
|||
address = Address(vla, alignment);
|
||||
}
|
||||
|
||||
// Alloca always returns a pointer in alloca address space, which may
|
||||
// be different from the type defined by the language. For example,
|
||||
// in C++ the auto variables are in the default address space. Therefore
|
||||
// cast alloca to the expected address space when necessary.
|
||||
auto T = D.getType();
|
||||
assert(T.getAddressSpace() == LangAS::Default);
|
||||
if (getASTAllocaAddressSpace() != LangAS::Default) {
|
||||
auto *Addr = getTargetHooks().performAddrSpaceCast(
|
||||
*this, address.getPointer(), getASTAllocaAddressSpace(),
|
||||
T.getAddressSpace(),
|
||||
address.getElementType()->getPointerTo(
|
||||
getContext().getTargetAddressSpace(T.getAddressSpace())),
|
||||
/*non-null*/ true);
|
||||
address = Address(Addr, address.getAlignment());
|
||||
}
|
||||
setAddrOfLocalVar(&D, address);
|
||||
emission.Addr = address;
|
||||
|
||||
|
|
|
@ -1579,10 +1579,9 @@ Value *ScalarExprEmitter::VisitCastExpr(CastExpr *CE) {
|
|||
}
|
||||
// Since target may map different address spaces in AST to the same address
|
||||
// space, an address space conversion may end up as a bitcast.
|
||||
auto *Src = Visit(E);
|
||||
return CGF.CGM.getTargetCodeGenInfo().performAddrSpaceCast(CGF, Src,
|
||||
E->getType(),
|
||||
DestTy);
|
||||
return CGF.CGM.getTargetCodeGenInfo().performAddrSpaceCast(
|
||||
CGF, Visit(E), E->getType()->getPointeeType().getAddressSpace(),
|
||||
DestTy->getPointeeType().getAddressSpace(), ConvertType(DestTy));
|
||||
}
|
||||
case CK_AtomicToNonAtomic:
|
||||
case CK_NonAtomicToAtomic:
|
||||
|
|
|
@ -113,6 +113,7 @@ CodeGenModule::CodeGenModule(ASTContext &C, const HeaderSearchOptions &HSO,
|
|||
Int8PtrPtrTy = Int8PtrTy->getPointerTo(0);
|
||||
AllocaInt8PtrTy = Int8Ty->getPointerTo(
|
||||
M.getDataLayout().getAllocaAddrSpace());
|
||||
ASTAllocaAddressSpace = getTargetCodeGenInfo().getASTAllocaAddressSpace();
|
||||
|
||||
RuntimeCC = getTargetCodeGenInfo().getABIInfo().getRuntimeCC();
|
||||
BuiltinCC = getTargetCodeGenInfo().getABIInfo().getBuiltinCC();
|
||||
|
|
|
@ -94,6 +94,8 @@ struct CodeGenTypeCache {
|
|||
unsigned char SizeAlignInBytes;
|
||||
};
|
||||
|
||||
unsigned ASTAllocaAddressSpace;
|
||||
|
||||
CharUnits getSizeSize() const {
|
||||
return CharUnits::fromQuantity(SizeSizeInBytes);
|
||||
}
|
||||
|
@ -111,6 +113,8 @@ struct CodeGenTypeCache {
|
|||
llvm::CallingConv::ID getRuntimeCC() const { return RuntimeCC; }
|
||||
llvm::CallingConv::ID BuiltinCC;
|
||||
llvm::CallingConv::ID getBuiltinCC() const { return BuiltinCC; }
|
||||
|
||||
unsigned getASTAllocaAddressSpace() const { return ASTAllocaAddressSpace; }
|
||||
};
|
||||
|
||||
} // end namespace CodeGen
|
||||
|
|
|
@ -407,12 +407,11 @@ llvm::Constant *TargetCodeGenInfo::getNullPointer(const CodeGen::CodeGenModule &
|
|||
}
|
||||
|
||||
llvm::Value *TargetCodeGenInfo::performAddrSpaceCast(
|
||||
CodeGen::CodeGenFunction &CGF, llvm::Value *Src, QualType SrcTy,
|
||||
QualType DestTy) const {
|
||||
CodeGen::CodeGenFunction &CGF, llvm::Value *Src, unsigned SrcAddr,
|
||||
unsigned DestAddr, llvm::Type *DestTy, bool isNonNull) const {
|
||||
// Since target may map different address spaces in AST to the same address
|
||||
// space, an address space conversion may end up as a bitcast.
|
||||
return CGF.Builder.CreatePointerBitCastOrAddrSpaceCast(Src,
|
||||
CGF.ConvertType(DestTy));
|
||||
return CGF.Builder.CreatePointerBitCastOrAddrSpaceCast(Src, DestTy);
|
||||
}
|
||||
|
||||
static bool isEmptyRecord(ASTContext &Context, QualType T, bool AllowArrays);
|
||||
|
@ -7292,6 +7291,11 @@ public:
|
|||
|
||||
llvm::Constant *getNullPointer(const CodeGen::CodeGenModule &CGM,
|
||||
llvm::PointerType *T, QualType QT) const override;
|
||||
|
||||
unsigned getASTAllocaAddressSpace() const override {
|
||||
return LangAS::FirstTargetAddressSpace +
|
||||
getABIInfo().getDataLayout().getAllocaAddrSpace();
|
||||
}
|
||||
};
|
||||
}
|
||||
|
||||
|
|
|
@ -229,13 +229,20 @@ public:
|
|||
virtual llvm::Constant *getNullPointer(const CodeGen::CodeGenModule &CGM,
|
||||
llvm::PointerType *T, QualType QT) const;
|
||||
|
||||
/// Get the AST address space for alloca.
|
||||
virtual unsigned getASTAllocaAddressSpace() const { return LangAS::Default; }
|
||||
|
||||
/// Perform address space cast of an expression of pointer type.
|
||||
/// \param V is the LLVM value to be casted to another address space.
|
||||
/// \param SrcTy is the QualType of \p V.
|
||||
/// \param DestTy is the destination QualType.
|
||||
/// \param SrcAddr is the language address space of \p V.
|
||||
/// \param DestAddr is the targeted language address space.
|
||||
/// \param DestTy is the destination LLVM pointer type.
|
||||
/// \param IsNonNull is the flag indicating \p V is known to be non null.
|
||||
virtual llvm::Value *performAddrSpaceCast(CodeGen::CodeGenFunction &CGF,
|
||||
llvm::Value *V, QualType SrcTy, QualType DestTy) const;
|
||||
|
||||
llvm::Value *V, unsigned SrcAddr,
|
||||
unsigned DestAddr,
|
||||
llvm::Type *DestTy,
|
||||
bool IsNonNull = false) const;
|
||||
};
|
||||
|
||||
} // namespace CodeGen
|
||||
|
|
|
@ -7191,7 +7191,7 @@ void Sema::CheckVariableDeclarationType(VarDecl *NewVD) {
|
|||
// ISO/IEC TR 18037 S5.1.2
|
||||
if (!getLangOpts().OpenCL
|
||||
&& NewVD->hasLocalStorage() && T.getAddressSpace() != 0) {
|
||||
Diag(NewVD->getLocation(), diag::err_as_qualified_auto_decl);
|
||||
Diag(NewVD->getLocation(), diag::err_as_qualified_auto_decl) << 0;
|
||||
NewVD->setInvalidDecl();
|
||||
return;
|
||||
}
|
||||
|
@ -7271,6 +7271,11 @@ void Sema::CheckVariableDeclarationType(VarDecl *NewVD) {
|
|||
NewVD->setInvalidDecl();
|
||||
return;
|
||||
}
|
||||
} else if (T.getAddressSpace() != LangAS::Default) {
|
||||
// Do not allow other address spaces on automatic variable.
|
||||
Diag(NewVD->getLocation(), diag::err_as_qualified_auto_decl) << 1;
|
||||
NewVD->setInvalidDecl();
|
||||
return;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
|
@ -5531,14 +5531,15 @@ static void HandleAddressSpaceTypeAttribute(QualType &Type,
|
|||
addrSpace.setIsSigned(false);
|
||||
}
|
||||
llvm::APSInt max(addrSpace.getBitWidth());
|
||||
max = Qualifiers::MaxAddressSpace - LangAS::Count;
|
||||
max = Qualifiers::MaxAddressSpace - LangAS::FirstTargetAddressSpace;
|
||||
if (addrSpace > max) {
|
||||
S.Diag(Attr.getLoc(), diag::err_attribute_address_space_too_high)
|
||||
<< (unsigned)max.getZExtValue() << ASArgExpr->getSourceRange();
|
||||
Attr.setInvalid();
|
||||
return;
|
||||
}
|
||||
ASIdx = static_cast<unsigned>(addrSpace.getZExtValue()) + LangAS::Count;
|
||||
ASIdx = static_cast<unsigned>(addrSpace.getZExtValue()) +
|
||||
LangAS::FirstTargetAddressSpace;
|
||||
} else {
|
||||
// The keyword-based type attributes imply which address space to use.
|
||||
switch (Attr.getKind()) {
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
// RUN: %clang_cc1 -triple x86_64-apple-darwin -emit-llvm < %s | FileCheck -check-prefixes=CHECK,GIZ %s
|
||||
// RUN: %clang_cc1 -triple amdgcn -emit-llvm < %s | FileCheck -check-prefixes=CHECK,PIZ %s
|
||||
// RUN: %clang_cc1 -triple amdgcn---amdgiz -emit-llvm < %s | FileCheck -check-prefixes=CHeCK,GIZ %s
|
||||
// RUN: %clang_cc1 -triple amdgcn---amdgiz -emit-llvm < %s | FileCheck -check-prefixes=CHECK,GIZ %s
|
||||
|
||||
// CHECK: @foo = common addrspace(1) global
|
||||
int foo __attribute__((address_space(1)));
|
||||
|
@ -40,8 +40,10 @@ typedef struct {
|
|||
} MyStruct;
|
||||
|
||||
// CHECK-LABEL: define void @test4(
|
||||
// CHECK: call void @llvm.memcpy.p0i8.p2i8
|
||||
// CHECK: call void @llvm.memcpy.p2i8.p0i8
|
||||
// GIZ: call void @llvm.memcpy.p0i8.p2i8
|
||||
// GIZ: call void @llvm.memcpy.p2i8.p0i8
|
||||
// PIZ: call void @llvm.memcpy.p4i8.p2i8
|
||||
// PIZ: call void @llvm.memcpy.p2i8.p4i8
|
||||
void test4(MyStruct __attribute__((address_space(2))) *pPtr) {
|
||||
MyStruct s = pPtr[0];
|
||||
pPtr[0] = s;
|
||||
|
|
|
@ -0,0 +1,72 @@
|
|||
// RUN: %clang_cc1 -O0 -triple amdgcn---amdgiz -emit-llvm %s -o - | FileCheck %s
|
||||
|
||||
// CHECK-LABEL: define void @_Z5func1Pi(i32* %x)
|
||||
void func1(int *x) {
|
||||
// CHECK: %[[x_addr:.*]] = alloca i32*{{.*}}addrspace(5)
|
||||
// CHECK: store i32* %x, i32* addrspace(5)* %[[x_addr]]
|
||||
// CHECK: %[[r0:.*]] = load i32*, i32* addrspace(5)* %[[x_addr]]
|
||||
// CHECK: store i32 1, i32* %[[r0]]
|
||||
*x = 1;
|
||||
}
|
||||
|
||||
// CHECK-LABEL: define void @_Z5func2v()
|
||||
void func2(void) {
|
||||
// CHECK: %lv1 = alloca i32, align 4, addrspace(5)
|
||||
// CHECK: %lv2 = alloca i32, align 4, addrspace(5)
|
||||
// CHECK: %la = alloca [100 x i32], align 4, addrspace(5)
|
||||
// CHECK: %lp1 = alloca i32*, align 4, addrspace(5)
|
||||
// CHECK: %lp2 = alloca i32*, align 4, addrspace(5)
|
||||
// CHECK: %lvc = alloca i32, align 4, addrspace(5)
|
||||
|
||||
// CHECK: %[[r0:.*]] = addrspacecast i32 addrspace(5)* %lv1 to i32*
|
||||
// CHECK: store i32 1, i32* %[[r0]]
|
||||
int lv1;
|
||||
lv1 = 1;
|
||||
// CHECK: %[[r1:.*]] = addrspacecast i32 addrspace(5)* %lv2 to i32*
|
||||
// CHECK: store i32 2, i32* %[[r1]]
|
||||
int lv2 = 2;
|
||||
|
||||
// CHECK: %[[r2:.*]] = addrspacecast [100 x i32] addrspace(5)* %la to [100 x i32]*
|
||||
// CHECK: %[[arrayidx:.*]] = getelementptr inbounds [100 x i32], [100 x i32]* %[[r2]], i64 0, i64 0
|
||||
// CHECK: store i32 3, i32* %[[arrayidx]], align 4
|
||||
int la[100];
|
||||
la[0] = 3;
|
||||
|
||||
// CHECK: %[[r3:.*]] = addrspacecast i32* addrspace(5)* %lp1 to i32**
|
||||
// CHECK: store i32* %[[r0]], i32** %[[r3]], align 4
|
||||
int *lp1 = &lv1;
|
||||
|
||||
// CHECK: %[[r4:.*]] = addrspacecast i32* addrspace(5)* %lp2 to i32**
|
||||
// CHECK: %[[arraydecay:.*]] = getelementptr inbounds [100 x i32], [100 x i32]* %[[r2]], i32 0, i32 0
|
||||
// CHECK: store i32* %[[arraydecay]], i32** %[[r4]], align 4
|
||||
int *lp2 = la;
|
||||
|
||||
// CHECK: call void @_Z5func1Pi(i32* %[[r0]])
|
||||
func1(&lv1);
|
||||
|
||||
// CHECK: %[[r5:.*]] = addrspacecast i32 addrspace(5)* %lvc to i32*
|
||||
// CHECK: store i32 4, i32* %[[r5]]
|
||||
// CHECK: store i32 4, i32* %[[r0]]
|
||||
const int lvc = 4;
|
||||
lv1 = lvc;
|
||||
}
|
||||
|
||||
void destroy(int x);
|
||||
|
||||
class A {
|
||||
int x;
|
||||
public:
|
||||
A():x(0) {}
|
||||
~A() {
|
||||
destroy(x);
|
||||
}
|
||||
};
|
||||
|
||||
// CHECK-LABEL: define void @_Z5func3v
|
||||
void func3() {
|
||||
// CHECK: %[[a:.*]] = alloca %class.A, align 4, addrspace(5)
|
||||
// CHECK: %[[r0:.*]] = addrspacecast %class.A addrspace(5)* %[[a]] to %class.A*
|
||||
// CHECK: call void @_ZN1AC1Ev(%class.A* %[[r0]])
|
||||
// CHECK: call void @_ZN1AD1Ev(%class.A* %[[r0]])
|
||||
A a;
|
||||
}
|
|
@ -0,0 +1,60 @@
|
|||
// RUN: %clang_cc1 -O0 -cl-std=CL1.2 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL12 %s
|
||||
// RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn---amdgizcl -emit-llvm %s -o - | FileCheck -check-prefixes=CHECK,CL20 %s
|
||||
|
||||
// CL12-LABEL: define void @func1(i32 addrspace(5)* %x)
|
||||
// CL20-LABEL: define void @func1(i32* %x)
|
||||
void func1(int *x) {
|
||||
// CL12: %[[x_addr:.*]] = alloca i32 addrspace(5)*{{.*}}addrspace(5)
|
||||
// CL12: store i32 addrspace(5)* %x, i32 addrspace(5)* addrspace(5)* %[[x_addr]]
|
||||
// CL12: %[[r0:.*]] = load i32 addrspace(5)*, i32 addrspace(5)* addrspace(5)* %[[x_addr]]
|
||||
// CL12: store i32 1, i32 addrspace(5)* %[[r0]]
|
||||
// CL20: %[[x_addr:.*]] = alloca i32*{{.*}}addrspace(5)
|
||||
// CL20: store i32* %x, i32* addrspace(5)* %[[x_addr]]
|
||||
// CL20: %[[r0:.*]] = load i32*, i32* addrspace(5)* %[[x_addr]]
|
||||
// CL20: store i32 1, i32* %[[r0]]
|
||||
*x = 1;
|
||||
}
|
||||
|
||||
// CHECK-LABEL: define void @func2()
|
||||
void func2(void) {
|
||||
// CHECK: %lv1 = alloca i32, align 4, addrspace(5)
|
||||
// CHECK: %lv2 = alloca i32, align 4, addrspace(5)
|
||||
// CHECK: %la = alloca [100 x i32], align 4, addrspace(5)
|
||||
// CL12: %lp1 = alloca i32 addrspace(5)*, align 4, addrspace(5)
|
||||
// CL12: %lp2 = alloca i32 addrspace(5)*, align 4, addrspace(5)
|
||||
// CL20: %lp1 = alloca i32*, align 4, addrspace(5)
|
||||
// CL20: %lp2 = alloca i32*, align 4, addrspace(5)
|
||||
// CHECK: %lvc = alloca i32, align 4, addrspace(5)
|
||||
|
||||
// CHECK: store i32 1, i32 addrspace(5)* %lv1
|
||||
int lv1;
|
||||
lv1 = 1;
|
||||
// CHECK: store i32 2, i32 addrspace(5)* %lv2
|
||||
int lv2 = 2;
|
||||
|
||||
// CHECK: %[[arrayidx:.*]] = getelementptr inbounds [100 x i32], [100 x i32] addrspace(5)* %la, i64 0, i64 0
|
||||
// CHECK: store i32 3, i32 addrspace(5)* %[[arrayidx]], align 4
|
||||
int la[100];
|
||||
la[0] = 3;
|
||||
|
||||
// CL12: store i32 addrspace(5)* %lv1, i32 addrspace(5)* addrspace(5)* %lp1, align 4
|
||||
// CL20: %[[r0:.*]] = addrspacecast i32 addrspace(5)* %lv1 to i32*
|
||||
// CL20: store i32* %[[r0]], i32* addrspace(5)* %lp1, align 4
|
||||
int *lp1 = &lv1;
|
||||
|
||||
// CHECK: %[[arraydecay:.*]] = getelementptr inbounds [100 x i32], [100 x i32] addrspace(5)* %la, i32 0, i32 0
|
||||
// CL12: store i32 addrspace(5)* %[[arraydecay]], i32 addrspace(5)* addrspace(5)* %lp2, align 4
|
||||
// CL20: %[[r1:.*]] = addrspacecast i32 addrspace(5)* %[[arraydecay]] to i32*
|
||||
// CL20: store i32* %[[r1]], i32* addrspace(5)* %lp2, align 4
|
||||
int *lp2 = la;
|
||||
|
||||
// CL12: call void @func1(i32 addrspace(5)* %lv1)
|
||||
// CL20: %[[r2:.*]] = addrspacecast i32 addrspace(5)* %lv1 to i32*
|
||||
// CL20: call void @func1(i32* %[[r2]])
|
||||
func1(&lv1);
|
||||
|
||||
// CHECK: store i32 4, i32 addrspace(5)* %lvc
|
||||
// CHECK: store i32 4, i32 addrspace(5)* %lv1
|
||||
const int lvc = 4;
|
||||
lv1 = lvc;
|
||||
}
|
|
@ -1,5 +1,5 @@
|
|||
// REQUIRES: amdgpu-registered-target
|
||||
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -S -disable-llvm-passes -emit-llvm -o - %s | FileCheck %s
|
||||
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown-opencl -S -disable-llvm-passes -emit-llvm -o - %s | FileCheck %s
|
||||
|
||||
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
|
||||
#pragma OPENCL EXTENSION cl_khr_fp16 : enable
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
// RUN: %clang -cl-std=CL2.0 -emit-llvm -g -O0 -S -target amdgcn-amd-amdhsa -mcpu=fiji -o - %s | FileCheck %s
|
||||
// RUN: %clang -cl-std=CL2.0 -emit-llvm -g -O0 -S -target amdgcn-amd-amdhsa-opencl -mcpu=fiji -o - %s | FileCheck %s
|
||||
|
||||
// CHECK-DAG: ![[DWARF_ADDRESS_SPACE_NONE:[0-9]+]] = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !{{[0-9]+}}, size: {{[0-9]+}})
|
||||
// CHECK-DAG: ![[DWARF_ADDRESS_SPACE_LOCAL:[0-9]+]] = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !{{[0-9]+}}, size: {{[0-9]+}}, dwarfAddressSpace: 2)
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
// RUN: %clang -cl-std=CL2.0 -emit-llvm -g -O0 -S -target amdgcn-amd-amdhsa -mcpu=fiji -o - %s | FileCheck %s
|
||||
// RUN: %clang -cl-std=CL2.0 -emit-llvm -g -O0 -S -target amdgcn-amd-amdhsa-opencl -mcpu=fiji -o - %s | FileCheck %s
|
||||
|
||||
// CHECK-DAG: ![[LOCAL:[0-9]+]] = !DIExpression(DW_OP_constu, 2, DW_OP_swap, DW_OP_xderef)
|
||||
// CHECK-DAG: ![[PRIVATE:[0-9]+]] = !DIExpression(DW_OP_constu, 1, DW_OP_swap, DW_OP_xderef)
|
||||
|
|
|
@ -1,5 +1,5 @@
|
|||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -include opencl-c.h -triple amdgcn -emit-llvm -o - | FileCheck %s
|
||||
// RUN: %clang_cc1 %s -O0 -cl-std=CL2.0 -include opencl-c.h -triple amdgcn -emit-llvm -o - | FileCheck --check-prefix=NOOPT %s
|
||||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -include opencl-c.h -triple amdgcn---opencl -emit-llvm -o - | FileCheck %s
|
||||
// RUN: %clang_cc1 %s -O0 -cl-std=CL2.0 -include opencl-c.h -triple amdgcn---opencl -emit-llvm -o - | FileCheck --check-prefix=NOOPT %s
|
||||
|
||||
typedef struct {
|
||||
private char *p1;
|
||||
|
|
|
@ -1,5 +1,5 @@
|
|||
// REQUIRES: amdgpu-registered-target
|
||||
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -S -emit-llvm -o - %s | FileCheck %s
|
||||
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown-opencl -S -emit-llvm -o - %s | FileCheck %s
|
||||
|
||||
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
|
||||
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
// RUN: %clang_cc1 -emit-llvm -o - -triple amdgcn %s | FileCheck %s
|
||||
// RUN: %clang_cc1 -emit-llvm -o - -triple amdgcn---opencl %s | FileCheck %s
|
||||
// RUN: %clang_cc1 -emit-llvm -o - -triple amdgcn---amdgizcl %s | FileCheck %s -check-prefix=AMDGIZ
|
||||
|
||||
struct A {
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -finclude-default-header -emit-llvm -O0 -triple spir-unknown-unknown -o - | FileCheck --check-prefix=SZ32 %s
|
||||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -finclude-default-header -emit-llvm -O0 -triple spir64-unknown-unknown -o - | FileCheck --check-prefix=SZ64 --check-prefix=SZ64ONLY %s
|
||||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -finclude-default-header -emit-llvm -O0 -triple amdgcn-- -o - | FileCheck --check-prefix=SZ64 --check-prefix=AMDONLY %s
|
||||
// RUN: %clang_cc1 %s -cl-std=CL2.0 -finclude-default-header -emit-llvm -O0 -triple amdgcn---opencl -o - | FileCheck --check-prefix=SZ64 --check-prefix=AMDONLY %s
|
||||
|
||||
//SZ32: define{{.*}} i32 @test_ptrtoint_private(i8* %x)
|
||||
//SZ32: ptrtoint i8* %{{.*}} to i32
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
// RUN: %clang_cc1 -verify -fsyntax-only -triple amdgcn -target-cpu verde -S -emit-llvm -o - %s
|
||||
// RUN: %clang_cc1 -verify -fsyntax-only -triple amdgcn--opencl -target-cpu verde -S -emit-llvm -o - %s
|
||||
// expected-no-diagnostics
|
||||
|
||||
// Record lowering was crashing on SI and newer targets, because it
|
||||
|
|
|
@ -12,7 +12,9 @@ void kernel foo() {
|
|||
|
||||
constant int L1 = 0;
|
||||
local int L2;
|
||||
global int L3; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
global int L3; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
generic int L4; // expected-error{{automatic variable qualified with an invalid address space}}
|
||||
__attribute__((address_space(100))) int L5; // expected-error{{automatic variable qualified with an invalid address space}}
|
||||
|
||||
extern global int G5;
|
||||
extern int G6; // expected-error{{extern variable must reside in global or constant address space}}
|
||||
|
|
|
@ -13,29 +13,37 @@ void kernel foo(int x) {
|
|||
constant int L1 = 0;
|
||||
local int L2;
|
||||
|
||||
auto int L3 = 7; // expected-error{{OpenCL version 1.2 does not support the 'auto' storage class specifier}}
|
||||
global int L4; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
auto int L3 = 7; // expected-error{{OpenCL version 1.2 does not support the 'auto' storage class specifier}}
|
||||
global int L4; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
__attribute__((address_space(100))) int L5; // expected-error{{automatic variable qualified with an invalid address space}}
|
||||
|
||||
constant int L5 = x; // expected-error {{initializer element is not a compile-time constant}}
|
||||
global int *constant L6 = &G4;
|
||||
private int *constant L7 = &x; // expected-error {{initializer element is not a compile-time constant}}
|
||||
constant int *constant L8 = &L1;
|
||||
local int *constant L9 = &L2; // expected-error {{initializer element is not a compile-time constant}}
|
||||
constant int L6 = x; // expected-error {{initializer element is not a compile-time constant}}
|
||||
global int *constant L7 = &G4;
|
||||
private int *constant L8 = &x; // expected-error {{initializer element is not a compile-time constant}}
|
||||
constant int *constant L9 = &L1;
|
||||
local int *constant L10 = &L2; // expected-error {{initializer element is not a compile-time constant}}
|
||||
}
|
||||
|
||||
static void kernel bar() { // expected-error{{kernel functions cannot be declared static}}
|
||||
}
|
||||
|
||||
void f() {
|
||||
constant int L1 = 0; // expected-error{{non-kernel function variable cannot be declared in constant address space}}
|
||||
local int L2; // expected-error{{non-kernel function variable cannot be declared in local address space}}
|
||||
constant int L1 = 0; // expected-error{{non-kernel function variable cannot be declared in constant address space}}
|
||||
local int L2; // expected-error{{non-kernel function variable cannot be declared in local address space}}
|
||||
global int L3; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
__attribute__((address_space(100))) int L4; // expected-error{{automatic variable qualified with an invalid address space}}
|
||||
|
||||
{
|
||||
constant int L1 = 0; // expected-error{{non-kernel function variable cannot be declared in constant address space}}
|
||||
local int L2; // expected-error{{non-kernel function variable cannot be declared in local address space}}
|
||||
constant int L1 = 0; // expected-error{{non-kernel function variable cannot be declared in constant address space}}
|
||||
local int L2; // expected-error{{non-kernel function variable cannot be declared in local address space}}
|
||||
global int L3; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
__attribute__((address_space(100))) int L4; // expected-error{{automatic variable qualified with an invalid address space}}
|
||||
}
|
||||
global int L3; // expected-error{{function scope variable cannot be declared in global address space}}
|
||||
extern constant float L4;
|
||||
extern local float L5; // expected-error{{extern variable must reside in constant address space}}
|
||||
static int L6 = 0; // expected-error{{variables in function scope cannot be declared static}}
|
||||
static int L7; // expected-error{{variables in function scope cannot be declared static}}
|
||||
|
||||
|
||||
extern constant float L5;
|
||||
extern local float L6; // expected-error{{extern variable must reside in constant address space}}
|
||||
|
||||
static int L7 = 0; // expected-error{{variables in function scope cannot be declared static}}
|
||||
static int L8; // expected-error{{variables in function scope cannot be declared static}}
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue