forked from mindspore-Ecosystem/mindspore
fix bug when add atomic clean for getnext's output
This commit is contained in:
parent
4b5ed8dc86
commit
dbc6147e9b
|
@ -234,10 +234,15 @@ std::map<AnfNodePtr, std::vector<size_t>> GetCommunicationOpInputInfo(
|
||||||
for (size_t i = 0; i < input_num; i++) {
|
for (size_t i = 0; i < input_num; i++) {
|
||||||
auto input_node = kernel->input(i + 1);
|
auto input_node = kernel->input(i + 1);
|
||||||
auto kernel_input = AnfAlgo::VisitKernelWithReturnType(input_node, 0, true);
|
auto kernel_input = AnfAlgo::VisitKernelWithReturnType(input_node, 0, true);
|
||||||
if (AnfAlgo::IsCommunicationOp(kernel_input.first)) {
|
if (!kernel_input.first->isa<CNode>()) {
|
||||||
// no need to add atomic for communication op's output
|
continue;
|
||||||
MS_LOG(INFO) << "No need to add atomic clean for communication op "
|
}
|
||||||
<< kernel_input.first->fullname_with_scope() << "'s output";
|
auto cnode = kernel_input.first->cast<CNodePtr>();
|
||||||
|
if (AnfAlgo::IsCommunicationOp(cnode) || AnfAlgo::IsIndependentNode(cnode) ||
|
||||||
|
AnfAlgo::GetCNodeName(cnode) == kGetNextOpName) {
|
||||||
|
// no need to add atomic for communication/independent/getnext op 's output
|
||||||
|
MS_LOG(INFO) << "No need to add atomic clean for op " << kernel_input.first->fullname_with_scope()
|
||||||
|
<< "'s output";
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
MS_LOG(INFO) << "Add atomic clean for single communication op input, comm:" << kernel->fullname_with_scope()
|
MS_LOG(INFO) << "Add atomic clean for single communication op input, comm:" << kernel->fullname_with_scope()
|
||||||
|
|
|
@ -280,6 +280,12 @@ void KernelAdjust::InsertSwitchLoop(const std::shared_ptr<session::KernelGraph>
|
||||||
for (size_t idx = i + 1; idx < orders.size(); idx++) {
|
for (size_t idx = i + 1; idx < orders.size(); idx++) {
|
||||||
cur_cnode = orders[idx];
|
cur_cnode = orders[idx];
|
||||||
if (AnfAlgo::HasNodeAttr(kAttrLabelForInsertStreamActive, cur_cnode)) {
|
if (AnfAlgo::HasNodeAttr(kAttrLabelForInsertStreamActive, cur_cnode)) {
|
||||||
|
auto pre_node = orders[idx - 1];
|
||||||
|
auto pre_kernel_name = AnfAlgo::GetCNodeName(pre_node);
|
||||||
|
if (pre_kernel_name == kAtomicAddrCleanOpName) {
|
||||||
|
other_list.pop_back();
|
||||||
|
memcpy_list.push_back(pre_node);
|
||||||
|
}
|
||||||
memcpy_list.emplace_back(cur_cnode);
|
memcpy_list.emplace_back(cur_cnode);
|
||||||
} else {
|
} else {
|
||||||
other_list.emplace_back(cur_cnode);
|
other_list.emplace_back(cur_cnode);
|
||||||
|
|
Loading…
Reference in New Issue