forked from OSchip/llvm-project
[OpenMP] Initialize data sharing stack for SPMD case
Summary: In the SPMD case, we need to initialize the data sharing and globalization infrastructure. This covers the case when an SPMD region calls a function in a different compilation unit.
Reviewers: ABataev, carlo.bertolli, caomhin
Reviewed By: ABataev
Subscribers: Hahnfeld, jholewinski, guansong, cfe-commits
Differential Revision: https://reviews.llvm.org/D49188
llvm-svn: 337015
This commit is contained in:
parent
b64e74feed
commit
ad4e579407
|
@ -81,6 +81,8 @@ enum OpenMPRTLFunctionNVPTX {
|
|||
OMPRTL_NVPTX__kmpc_end_reduce_nowait,
|
||||
/// Call to void __kmpc_data_sharing_init_stack();
|
||||
OMPRTL_NVPTX__kmpc_data_sharing_init_stack,
|
||||
/// Call to void __kmpc_data_sharing_init_stack_spmd();
|
||||
OMPRTL_NVPTX__kmpc_data_sharing_init_stack_spmd,
|
||||
/// Call to void* __kmpc_data_sharing_push_stack(size_t size,
|
||||
/// int16_t UseSharedMemory);
|
||||
OMPRTL_NVPTX__kmpc_data_sharing_push_stack,
|
||||
|
@ -1025,6 +1027,12 @@ void CGOpenMPRuntimeNVPTX::emitSPMDEntryHeader(
|
|||
/*RequiresDataSharing=*/Bld.getInt16(1)};
|
||||
CGF.EmitRuntimeCall(
|
||||
createNVPTXRuntimeFunction(OMPRTL_NVPTX__kmpc_spmd_kernel_init), Args);
|
||||
|
||||
// For data sharing, we need to initialize the stack.
|
||||
CGF.EmitRuntimeCall(
|
||||
createNVPTXRuntimeFunction(
|
||||
OMPRTL_NVPTX__kmpc_data_sharing_init_stack_spmd));
|
||||
|
||||
CGF.EmitBranch(ExecuteBB);
|
||||
|
||||
CGF.EmitBlock(ExecuteBB);
|
||||
|
@ -1107,11 +1115,6 @@ void CGOpenMPRuntimeNVPTX::emitWorkerLoop(CodeGenFunction &CGF,
|
|||
// Wait for parallel work
|
||||
syncCTAThreads(CGF);
|
||||
|
||||
// For data sharing, we need to initialize the stack for workers.
|
||||
CGF.EmitRuntimeCall(
|
||||
createNVPTXRuntimeFunction(
|
||||
OMPRTL_NVPTX__kmpc_data_sharing_init_stack));
|
||||
|
||||
Address WorkFn =
|
||||
CGF.CreateDefaultAlignTempAlloca(CGF.Int8PtrTy, /*Name=*/"work_fn");
|
||||
Address ExecStatus =
|
||||
|
@ -1417,6 +1420,13 @@ CGOpenMPRuntimeNVPTX::createNVPTXRuntimeFunction(unsigned Function) {
|
|||
RTLFn = CGM.CreateRuntimeFunction(FnTy, "__kmpc_data_sharing_init_stack");
|
||||
break;
|
||||
}
|
||||
case OMPRTL_NVPTX__kmpc_data_sharing_init_stack_spmd: {
|
||||
/// Build void __kmpc_data_sharing_init_stack_spmd();
|
||||
auto *FnTy =
|
||||
llvm::FunctionType::get(CGM.VoidTy, llvm::None, /*isVarArg*/ false);
|
||||
RTLFn = CGM.CreateRuntimeFunction(FnTy, "__kmpc_data_sharing_init_stack_spmd");
|
||||
break;
|
||||
}
|
||||
case OMPRTL_NVPTX__kmpc_data_sharing_push_stack: {
|
||||
// Build void *__kmpc_data_sharing_push_stack(size_t size,
|
||||
// int16_t UseSharedMemory);
|
||||
|
|
|
@ -30,7 +30,7 @@ void test_ds(){
|
|||
/// ========= In the worker function ========= ///
|
||||
// CK1: {{.*}}define internal void @__omp_offloading{{.*}}test_ds{{.*}}_worker()
|
||||
// CK1: call void @llvm.nvvm.barrier0()
|
||||
// CK1: call void @__kmpc_data_sharing_init_stack
|
||||
// CK1-NOT: call void @__kmpc_data_sharing_init_stack
|
||||
|
||||
/// ========= In the kernel function ========= ///
|
||||
|
||||
|
|
|
@ -60,6 +60,7 @@ int bar(int n){
|
|||
// CHECK: [[AA:%.+]] = load i16*, i16** [[AA_ADDR]], align
|
||||
// CHECK: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXEC:.+]]
|
||||
//
|
||||
// CHECK: [[EXEC]]
|
||||
|
@ -102,6 +103,7 @@ int bar(int n){
|
|||
// CHECK: [[B:%.+]] = load [10 x i32]*, [10 x i32]** [[B_ADDR]], align
|
||||
// CHECK: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXEC:.+]]
|
||||
//
|
||||
// CHECK: [[EXEC]]
|
||||
|
|
|
@ -48,6 +48,7 @@ int bar(int n){
|
|||
|
||||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+template.+l22}}(
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXEC:.+]]
|
||||
//
|
||||
// CHECK: [[EXEC]]
|
||||
|
@ -69,6 +70,7 @@ int bar(int n){
|
|||
|
||||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+template.+l26}}(
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXEC:.+]]
|
||||
//
|
||||
// CHECK: [[EXEC]]
|
||||
|
@ -89,6 +91,7 @@ int bar(int n){
|
|||
|
||||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+template.+l31}}(
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXEC:.+]]
|
||||
//
|
||||
// CHECK: [[EXEC]]
|
||||
|
|
|
@ -55,6 +55,7 @@ int bar(int n){
|
|||
// CHECK: define {{.*}}void {{@__omp_offloading_.+template.+l27}}(
|
||||
//
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXECUTE:.+]]
|
||||
//
|
||||
// CHECK: [[EXECUTE]]
|
||||
|
@ -242,6 +243,7 @@ int bar(int n){
|
|||
// CHECK: define {{.*}}void {{@__omp_offloading_.+template.+l32}}(
|
||||
//
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXECUTE:.+]]
|
||||
//
|
||||
// CHECK: [[EXECUTE]]
|
||||
|
@ -519,6 +521,7 @@ int bar(int n){
|
|||
// CHECK: define {{.*}}void {{@__omp_offloading_.+template.+l38}}(
|
||||
//
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: br label {{%?}}[[EXECUTE:.+]]
|
||||
//
|
||||
// CHECK: [[EXECUTE]]
|
||||
|
|
|
@ -228,6 +228,7 @@ int bar(int n){
|
|||
|
||||
// CHECK: define weak void @__omp_offloading_{{.*}}ftemplate{{.*}}_l37(
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call i8* @__kmpc_data_sharing_push_stack(
|
||||
// CHECK-NOT: call void @__kmpc_serialized_parallel(
|
||||
// CHECK: call void [[L0:@.+]](i32* %{{.+}}, i32* %{{.+}}, i16* %{{.*}})
|
||||
|
|
|
@ -70,6 +70,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 91,
|
||||
// CHECK: {{call|invoke}} void [[OUTL1:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -84,6 +85,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92,
|
||||
// CHECK: {{call|invoke}} void [[OUTL2:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -98,6 +100,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92,
|
||||
// CHECK: {{call|invoke}} void [[OUTL3:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -113,6 +116,7 @@ int bar(int n){
|
|||
// CHECK: store {{.+}} [[F_IN]], {{.+}}* {{.+}},
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: store {{.+}} 99, {{.+}}* [[COMB_UB:%.+]], align
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92, {{.+}}, {{.+}}, {{.+}}* [[COMB_UB]],
|
||||
// CHECK: {{call|invoke}} void [[OUTL4:@.+]](
|
||||
|
|
|
@ -22,7 +22,7 @@ tx ftemplate(int n) {
|
|||
tx a[N];
|
||||
short aa[N];
|
||||
tx b[10];
|
||||
tx c[M][M];
|
||||
tx c[M][M];
|
||||
tx f = n;
|
||||
tx l;
|
||||
int k;
|
||||
|
@ -47,7 +47,7 @@ tx ftemplate(int n) {
|
|||
for(int i = 0; i < M; i++) {
|
||||
for(int j = 0; j < M; j++) {
|
||||
k = M;
|
||||
c[i][j] = i+j*f+k;
|
||||
c[i][j] = i+j*f+k;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -65,6 +65,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 91,
|
||||
// CHECK: {{call|invoke}} void [[OUTL1:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -79,6 +80,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92,
|
||||
// CHECK: {{call|invoke}} void [[OUTL2:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -93,6 +95,7 @@ int bar(int n){
|
|||
// CHECK-LABEL: define {{.*}}void {{@__omp_offloading_.+}}(
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92,
|
||||
// CHECK: {{call|invoke}} void [[OUTL3:@.+]](
|
||||
// CHECK: call void @__kmpc_for_static_fini(
|
||||
|
@ -108,6 +111,7 @@ int bar(int n){
|
|||
// CHECK: store {{.+}} [[F_IN]], {{.+}}* {{.+}},
|
||||
// CHECK-DAG: [[THREAD_LIMIT:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
|
||||
// CHECK: call void @__kmpc_spmd_kernel_init(i32 [[THREAD_LIMIT]],
|
||||
// CHECK: call void @__kmpc_data_sharing_init_stack_spmd
|
||||
// CHECK: store {{.+}} 99, {{.+}}* [[COMB_UB:%.+]], align
|
||||
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, {{.+}} 92, {{.+}}, {{.+}}, {{.+}}* [[COMB_UB]],
|
||||
// CHECK: {{call|invoke}} void [[OUTL4:@.+]](
|
||||
|
|
Loading…
Reference in New Issue