forked from OSchip/llvm-project
[OPENMP] Improved codegen for outlined functions for 'parallel' directives.
llvm-svn: 213927
This commit is contained in:
parent
94bd553eb8
commit
d6c57554f9
|
@ -127,6 +127,24 @@ llvm::Value *CGOpenMPRuntime::GetOpenMPGlobalThreadNum(CodeGenFunction &CGF,
|
|||
OpenMPGtidMapTy::iterator I = OpenMPGtidMap.find(CGF.CurFn);
|
||||
if (I != OpenMPGtidMap.end()) {
|
||||
GTid = I->second;
|
||||
} else {
|
||||
// Check if current function is a function which has first parameter
|
||||
// with type pointer to int32 and name ".global_tid.".
|
||||
if (!CGF.CurFn->arg_empty() &&
|
||||
CGF.CurFn->arg_begin()->getType()->isPointerTy() &&
|
||||
CGF.CurFn->arg_begin()
|
||||
->getType()
|
||||
->getPointerElementType()
|
||||
->isIntegerTy() &&
|
||||
CGF.CurFn->arg_begin()
|
||||
->getType()
|
||||
->getPointerElementType()
|
||||
->getIntegerBitWidth() == 32 &&
|
||||
CGF.CurFn->arg_begin()->hasName() &&
|
||||
CGF.CurFn->arg_begin()->getName() == ".global_tid.") {
|
||||
CGBuilderTy::InsertPointGuard IPG(CGF.Builder);
|
||||
CGF.Builder.SetInsertPoint(CGF.AllocaInsertPt);
|
||||
GTid = CGF.Builder.CreateLoad(CGF.CurFn->arg_begin());
|
||||
} else {
|
||||
// Generate "int32 .kmpc_global_thread_num.addr;"
|
||||
CGBuilderTy::InsertPointGuard IPG(CGF.Builder);
|
||||
|
@ -134,6 +152,7 @@ llvm::Value *CGOpenMPRuntime::GetOpenMPGlobalThreadNum(CodeGenFunction &CGF,
|
|||
llvm::Value *Args[] = {EmitOpenMPUpdateLocation(CGF, Loc)};
|
||||
GTid = CGF.EmitRuntimeCall(
|
||||
CreateRuntimeFunction(OMPRTL__kmpc_global_thread_num), Args);
|
||||
}
|
||||
OpenMPGtidMap[CGF.CurFn] = GTid;
|
||||
}
|
||||
return GTid;
|
||||
|
|
Loading…
Reference in New Issue