!3397 GPU dump: fix input bins lagging behind by one iteration
Merge pull request !3397 from john_tzanakakis/master_ms1
This commit is contained in:
commit
252c6aa788
|
@ -616,10 +616,6 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, De
|
|||
|
||||
#ifdef ENABLE_DEBUGGER
|
||||
bool dump_enabled = GPUKernelRuntime::DumpDataEnabledIteration();
|
||||
if (!mock) {
|
||||
// collect weights and bias
|
||||
LoadParameters(graph, debugger, dump_enabled);
|
||||
}
|
||||
#endif
|
||||
auto &kernels = graph->execution_order();
|
||||
int exec_order = 1;
|
||||
|
@ -665,6 +661,10 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, De
|
|||
}
|
||||
}
|
||||
if (!mock) {
|
||||
#ifdef ENABLE_DEBUGGER
|
||||
// collect weights and bias
|
||||
LoadParameters(graph, debugger, dump_enabled);
|
||||
#endif
|
||||
CHECK_OP_RET_WITH_EXCEPT(SyncStream(), "SyncStream failed.");
|
||||
}
|
||||
ClearSwapInfo(mock);
|
||||
|
|
Loading…
Reference in New Issue