[libomptarget] Update device pointer only if needed

Currently, libomptarget will always perform a host-to-device memory transfer in
order to update the device pointer of a PTR_AND_OBJ entry. This is not always
necessary because the device pointer may have been set to the correct pointee
address already, so we can eliminate the redundant memory transfer.
This commit is contained in:
George Rokos 2021-07-10 04:14:44 -07:00
parent b205f2bb89
commit bb0166dc72
2 changed files with 70 additions and 13 deletions

View File

@ -556,22 +556,35 @@ int targetDataBegin(ident_t *loc, DeviceTy &Device, int32_t arg_num,
} }
if (arg_types[i] & OMP_TGT_MAPTYPE_PTR_AND_OBJ && !IsHostPtr) { if (arg_types[i] & OMP_TGT_MAPTYPE_PTR_AND_OBJ && !IsHostPtr) {
DP("Update pointer (" DPxMOD ") -> [" DPxMOD "]\n", // Check whether we need to update the pointer on the device
DPxPTR(PointerTgtPtrBegin), DPxPTR(TgtPtrBegin)); bool UpdateDevPtr = false;
uint64_t Delta = (uint64_t)HstPtrBegin - (uint64_t)HstPtrBase; uint64_t Delta = (uint64_t)HstPtrBegin - (uint64_t)HstPtrBase;
void *&TgtPtrBase = AsyncInfo.getVoidPtrLocation(); void *ExpectedTgtPtrBase = (void *)((uint64_t)TgtPtrBegin - Delta);
TgtPtrBase = (void *)((uint64_t)TgtPtrBegin - Delta);
int rt = Device.submitData(PointerTgtPtrBegin, &TgtPtrBase,
sizeof(void *), AsyncInfo);
if (rt != OFFLOAD_SUCCESS) {
REPORT("Copying data to device failed.\n");
return OFFLOAD_FAIL;
}
// create shadow pointers for this entry
Device.ShadowMtx.lock(); Device.ShadowMtx.lock();
Device.ShadowPtrMap[Pointer_HstPtrBegin] = { auto Entry = Device.ShadowPtrMap.find(Pointer_HstPtrBegin);
HstPtrBase, PointerTgtPtrBegin, TgtPtrBase}; // If this pointer is not in the map we need to insert it.
if (Entry == Device.ShadowPtrMap.end()) {
// create shadow pointers for this entry
Device.ShadowPtrMap[Pointer_HstPtrBegin] = {
HstPtrBase, PointerTgtPtrBegin, ExpectedTgtPtrBase};
UpdateDevPtr = true;
}
Device.ShadowMtx.unlock(); Device.ShadowMtx.unlock();
if (UpdateDevPtr) {
DP("Update pointer (" DPxMOD ") -> [" DPxMOD "]\n",
DPxPTR(PointerTgtPtrBegin), DPxPTR(TgtPtrBegin));
void *&TgtPtrBase = AsyncInfo.getVoidPtrLocation();
TgtPtrBase = ExpectedTgtPtrBase;
int rt = Device.submitData(PointerTgtPtrBegin, &TgtPtrBase,
sizeof(void *), AsyncInfo);
if (rt != OFFLOAD_SUCCESS) {
REPORT("Copying data to device failed.\n");
return OFFLOAD_FAIL;
}
}
} }
} }

View File

@ -0,0 +1,44 @@
// RUN: %libomptarget-compile-generic
// RUN: env LIBOMPTARGET_DEBUG=1 %libomptarget-run-generic 2>&1 \
// RUN: | %fcheck-generic -check-prefix=DEBUG -check-prefix=CHECK
// REQUIRES: libomptarget-debug
#include <stdio.h>
struct S {
int *p;
};
int main(void) {
int A[10];
struct S s1;
s1.p = A;
// DEBUG: Update pointer ([[DEV_PTR:0x[^ ]+]]) -> {{\[}}[[DEV_OBJ_A:0x[^ ]+]]{{\]}}
#pragma omp target enter data map(alloc : s1.p [0:10])
// DEBUG-NOT: Update pointer ([[DEV_PTR]]) -> {{\[}}[[DEV_OBJ_A]]{{\]}}
#pragma omp target map(alloc : s1.p [0:10])
{
for (int i = 0; i < 10; ++i)
s1.p[i] = i;
}
#pragma omp target exit data map(from : s1.p [0:10])
int fail_A = 0;
for (int i = 0; i < 10; ++i) {
if (A[i] != i) {
fail_A = 1;
break;
}
}
// CHECK-NOT: Test A failed
if (fail_A) {
printf("Test A failed\n");
}
return fail_A;
}