GPU dump - input bins lag behind by 1 iteration

This commit is contained in:
John Tzanakakis 2020-07-23 12:54:18 -04:00
parent b1fae868ba
commit 96744f087e
1 changed file with 4 additions and 4 deletions

View File

@@ -616,10 +616,6 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, De
#ifdef ENABLE_DEBUGGER
bool dump_enabled = GPUKernelRuntime::DumpDataEnabledIteration();
if (!mock) {
// collect weights and bias
LoadParameters(graph, debugger, dump_enabled);
}
#endif
auto &kernels = graph->execution_order();
int exec_order = 1;
@@ -665,6 +661,10 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, De
}
}
if (!mock) {
#ifdef ENABLE_DEBUGGER
// collect weights and bias
LoadParameters(graph, debugger, dump_enabled);
#endif
CHECK_OP_RET_WITH_EXCEPT(SyncStream(), "SyncStream failed.");
}
ClearSwapInfo(mock);