[CUDA][HIP] Enable kernel function return type deduction.

Summary:
- Even though only `void` is still accepted as the deduced return type,
  enabling deduction/instantiation on the return type allows more
  consistent coding.

Reviewers: tra, jlebar

Subscribers: cfe-commits, yaxunl

Tags: #clang

Differential Revision: https://reviews.llvm.org/D68031

llvm-svn: 372898
This commit is contained in:
Michael Liao 2019-09-25 16:51:45 +00:00
parent 8535a8672e
commit 24337db616
5 changed files with 65 additions and 2 deletions

View File

@ -4223,7 +4223,9 @@ static void handleGlobalAttr(Sema &S, Decl *D, const ParsedAttr &AL) {
return;
}
const auto *FD = cast<FunctionDecl>(D);
if (!FD->getReturnType()->isVoidType()) {
if (!FD->getReturnType()->isVoidType() &&
!FD->getReturnType()->getAs<AutoType>() &&
!FD->getReturnType()->isInstantiationDependentType()) {
SourceRange RTRange = FD->getReturnTypeSourceRange();
S.Diag(FD->getTypeSpecStartLoc(), diag::err_kern_type_not_void_return)
<< FD->getType()

View File

@ -5891,7 +5891,9 @@ ExprResult Sema::BuildResolvedCallExpr(Expr *Fn, NamedDecl *NDecl,
<< FDecl << Fn->getSourceRange());
// CUDA: Kernel function must have 'void' return type
if (!FuncT->getReturnType()->isVoidType())
if (!FuncT->getReturnType()->isVoidType() &&
!FuncT->getReturnType()->getAs<AutoType>() &&
!FuncT->getReturnType()->isInstantiationDependentType())
return ExprError(Diag(LParenLoc, diag::err_kern_type_not_void_return)
<< Fn->getType() << Fn->getSourceRange());
} else {

View File

@ -3500,6 +3500,14 @@ bool Sema::DeduceFunctionTypeFromReturnExpr(FunctionDecl *FD,
return true;
}
// CUDA: Kernel function must have 'void' return type.
if (getLangOpts().CUDA)
if (FD->hasAttr<CUDAGlobalAttr>() && !Deduced->isVoidType()) {
Diag(FD->getLocation(), diag::err_kern_type_not_void_return)
<< FD->getType() << FD->getSourceRange();
return true;
}
// If a function with a declared return type that contains a placeholder type
// has multiple return statements, the return type is deduced for each return
// statement. [...] if the type deduced is not the same in each deduction,

View File

@ -3093,6 +3093,13 @@ Sema::SubstituteExplicitTemplateArguments(
Function->getTypeSpecStartLoc(), Function->getDeclName());
if (ResultType.isNull() || Trap.hasErrorOccurred())
return TDK_SubstitutionFailure;
// CUDA: Kernel function must have 'void' return type.
if (getLangOpts().CUDA)
if (Function->hasAttr<CUDAGlobalAttr>() && !ResultType->isVoidType()) {
Diag(Function->getLocation(), diag::err_kern_type_not_void_return)
<< Function->getType() << Function->getSourceRange();
return TDK_SubstitutionFailure;
}
}
// Instantiate the types of each of the function parameters given the

View File

@ -0,0 +1,44 @@
// RUN: %clang_cc1 -std=c++14 -fsyntax-only -verify %s
#include "Inputs/cuda.h"
template <typename T>
__global__ T foo() {
// expected-note@-1 {{kernel function type 'T ()' must have void return type}}
}
void f0() {
foo<void><<<0, 0>>>();
foo<int><<<0, 0>>>();
// expected-error@-1 {{no matching function for call to 'foo'}}
}
__global__ auto f1() {
}
__global__ auto f2(int x) {
return x + 1;
// expected-error@-2 {{kernel function type 'auto (int)' must have void return type}}
}
template <bool Cond, typename T = void> struct enable_if { typedef T type; };
template <typename T> struct enable_if<false, T> {};
template <int N>
__global__
auto bar() -> typename enable_if<N == 1>::type {
// expected-note@-1 {{requirement '3 == 1' was not satisfied [with N = 3]}}
}
template <int N>
__global__
auto bar() -> typename enable_if<N == 2>::type {
// expected-note@-1 {{requirement '3 == 2' was not satisfied [with N = 3]}}
}
void f3() {
bar<1><<<0, 0>>>();
bar<2><<<0, 0>>>();
bar<3><<<0, 0>>>();
// expected-error@-1 {{no matching function for call to 'bar'}}
}