forked from OSchip/llvm-project
[CUDA][HIP] Enable kernel function return type deduction.
Summary: - Even though only `void` is still accepted as the deduced return type, enabling deduction/instantiation on the return type allows more consistent coding. Reviewers: tra, jlebar Subscribers: cfe-commits, yaxunl Tags: #clang Differential Revision: https://reviews.llvm.org/D68031 llvm-svn: 372898
This commit is contained in:
parent
8535a8672e
commit
24337db616
|
@ -4223,7 +4223,9 @@ static void handleGlobalAttr(Sema &S, Decl *D, const ParsedAttr &AL) {
|
|||
return;
|
||||
}
|
||||
const auto *FD = cast<FunctionDecl>(D);
|
||||
if (!FD->getReturnType()->isVoidType()) {
|
||||
if (!FD->getReturnType()->isVoidType() &&
|
||||
!FD->getReturnType()->getAs<AutoType>() &&
|
||||
!FD->getReturnType()->isInstantiationDependentType()) {
|
||||
SourceRange RTRange = FD->getReturnTypeSourceRange();
|
||||
S.Diag(FD->getTypeSpecStartLoc(), diag::err_kern_type_not_void_return)
|
||||
<< FD->getType()
|
||||
|
|
|
@ -5891,7 +5891,9 @@ ExprResult Sema::BuildResolvedCallExpr(Expr *Fn, NamedDecl *NDecl,
|
|||
<< FDecl << Fn->getSourceRange());
|
||||
|
||||
// CUDA: Kernel function must have 'void' return type
|
||||
if (!FuncT->getReturnType()->isVoidType())
|
||||
if (!FuncT->getReturnType()->isVoidType() &&
|
||||
!FuncT->getReturnType()->getAs<AutoType>() &&
|
||||
!FuncT->getReturnType()->isInstantiationDependentType())
|
||||
return ExprError(Diag(LParenLoc, diag::err_kern_type_not_void_return)
|
||||
<< Fn->getType() << Fn->getSourceRange());
|
||||
} else {
|
||||
|
|
|
@ -3500,6 +3500,14 @@ bool Sema::DeduceFunctionTypeFromReturnExpr(FunctionDecl *FD,
|
|||
return true;
|
||||
}
|
||||
|
||||
// CUDA: Kernel function must have 'void' return type.
|
||||
if (getLangOpts().CUDA)
|
||||
if (FD->hasAttr<CUDAGlobalAttr>() && !Deduced->isVoidType()) {
|
||||
Diag(FD->getLocation(), diag::err_kern_type_not_void_return)
|
||||
<< FD->getType() << FD->getSourceRange();
|
||||
return true;
|
||||
}
|
||||
|
||||
// If a function with a declared return type that contains a placeholder type
|
||||
// has multiple return statements, the return type is deduced for each return
|
||||
// statement. [...] if the type deduced is not the same in each deduction,
|
||||
|
|
|
@ -3093,6 +3093,13 @@ Sema::SubstituteExplicitTemplateArguments(
|
|||
Function->getTypeSpecStartLoc(), Function->getDeclName());
|
||||
if (ResultType.isNull() || Trap.hasErrorOccurred())
|
||||
return TDK_SubstitutionFailure;
|
||||
// CUDA: Kernel function must have 'void' return type.
|
||||
if (getLangOpts().CUDA)
|
||||
if (Function->hasAttr<CUDAGlobalAttr>() && !ResultType->isVoidType()) {
|
||||
Diag(Function->getLocation(), diag::err_kern_type_not_void_return)
|
||||
<< Function->getType() << Function->getSourceRange();
|
||||
return TDK_SubstitutionFailure;
|
||||
}
|
||||
}
|
||||
|
||||
// Instantiate the types of each of the function parameters given the
|
||||
|
|
|
@ -0,0 +1,44 @@
|
|||
// RUN: %clang_cc1 -std=c++14 -fsyntax-only -verify %s
|
||||
|
||||
#include "Inputs/cuda.h"
|
||||
|
||||
template <typename T>
|
||||
__global__ T foo() {
|
||||
// expected-note@-1 {{kernel function type 'T ()' must have void return type}}
|
||||
}
|
||||
|
||||
void f0() {
|
||||
foo<void><<<0, 0>>>();
|
||||
foo<int><<<0, 0>>>();
|
||||
// expected-error@-1 {{no matching function for call to 'foo'}}
|
||||
}
|
||||
|
||||
__global__ auto f1() {
|
||||
}
|
||||
|
||||
__global__ auto f2(int x) {
|
||||
return x + 1;
|
||||
// expected-error@-2 {{kernel function type 'auto (int)' must have void return type}}
|
||||
}
|
||||
|
||||
template <bool Cond, typename T = void> struct enable_if { typedef T type; };
|
||||
template <typename T> struct enable_if<false, T> {};
|
||||
|
||||
template <int N>
|
||||
__global__
|
||||
auto bar() -> typename enable_if<N == 1>::type {
|
||||
// expected-note@-1 {{requirement '3 == 1' was not satisfied [with N = 3]}}
|
||||
}
|
||||
|
||||
template <int N>
|
||||
__global__
|
||||
auto bar() -> typename enable_if<N == 2>::type {
|
||||
// expected-note@-1 {{requirement '3 == 2' was not satisfied [with N = 3]}}
|
||||
}
|
||||
|
||||
void f3() {
|
||||
bar<1><<<0, 0>>>();
|
||||
bar<2><<<0, 0>>>();
|
||||
bar<3><<<0, 0>>>();
|
||||
// expected-error@-1 {{no matching function for call to 'bar'}}
|
||||
}
|
Loading…
Reference in New Issue