forked from mindspore-Ecosystem/mindspore
!750 refresh parameter format
Merge pull request !750 from liubuyu/master
This commit is contained in:
commit
0fbec0f55a
|
@ -38,6 +38,7 @@
|
|||
#include "pre_activate/ascend/ir_fusion/adam_apply_one_fusion.h"
|
||||
#include "pre_activate/ascend/ir_fusion/adam_apply_one_with_decay_rule.h"
|
||||
#include "pre_activate/ascend/ir_fusion/parameter_and_transop_fusion.h"
|
||||
#include "pre_activate/ascend/ir_fusion/refresh_parameter_format.h"
|
||||
#include "pre_activate/ascend/ir_fusion/transpose_transdata_fusion.h"
|
||||
#include "pre_activate/ascend/ir_fission/transdata_split.h"
|
||||
#include "pre_activate/ascend/ir_fission/topk_split.h"
|
||||
|
@ -265,6 +266,7 @@ void AscendBackendOptimization(const std::shared_ptr<session::KernelGraph> &kern
|
|||
other_pm->AddPass(std::make_shared<AllReduceFusion>());
|
||||
other_pm->AddPass(std::make_shared<AllGatherFusion>());
|
||||
other_pm->AddPass(std::make_shared<ParameterTransOpFusion>());
|
||||
other_pm->AddPass(std::make_shared<RefreshParameterFormat>());
|
||||
other_pm->AddPass(std::make_shared<BufferFusion>());
|
||||
other_pm->AddPass(std::make_shared<GetitemTuple>());
|
||||
other_pm->AddPass(std::make_shared<CommonSubexpressionElimination>());
|
||||
|
|
|
@ -0,0 +1,71 @@
|
|||
/**
|
||||
* Copyright 2020 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "pre_activate/ascend/ir_fusion/refresh_parameter_format.h"
|
||||
#include "session/anf_runtime_algorithm.h"
|
||||
#include "utils/utils.h"
|
||||
#include "operator/ops.h"
|
||||
#include "device/kernel_info.h"
|
||||
#include "pre_activate/common/helper.h"
|
||||
#include "pre_activate/common/optimizer.h"
|
||||
#include "pre_activate/ascend/ascend_helper.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace opt {
|
||||
void DoRefresh(const CNodePtr &cnode) {
|
||||
if (cnode == nullptr) {
|
||||
MS_LOG(EXCEPTION) << "node is nullptr";
|
||||
}
|
||||
for (size_t input_index = 0; input_index < AnfAlgo::GetInputTensorNum(cnode); input_index++) {
|
||||
auto input_kernel_node = AnfAlgo::GetInputNode(cnode, input_index);
|
||||
if (input_kernel_node->isa<Parameter>()) {
|
||||
std::shared_ptr<kernel::KernelBuildInfo::KernelBuildInfoBuilder> builder =
|
||||
std::make_shared<kernel::KernelBuildInfo::KernelBuildInfoBuilder>();
|
||||
auto cnode_input_format = AnfAlgo::GetInputFormat(cnode, input_index);
|
||||
auto kernel_node_format = AnfAlgo::GetOutputFormat(input_kernel_node, 0);
|
||||
auto dtype = AnfAlgo::GetOutputDeviceDataType(input_kernel_node, 0);
|
||||
if (kernel_node_format != cnode_input_format) {
|
||||
builder->SetOutputsFormat({cnode_input_format});
|
||||
builder->SetOutputsDeviceType({dtype});
|
||||
AnfAlgo::SetSelectKernelBuildInfo(builder->Build(), input_kernel_node.get());
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
bool RefreshParameterFormat::Run(const FuncGraphPtr &func_graph) {
|
||||
if (func_graph == nullptr) {
|
||||
MS_LOG(ERROR) << "func_graph is nullptr.";
|
||||
return false;
|
||||
}
|
||||
std::vector<AnfNodePtr> node_list = TopoSort(func_graph->get_return());
|
||||
for (auto node : node_list) {
|
||||
if (node == nullptr || !node->isa<CNode>()) {
|
||||
continue;
|
||||
}
|
||||
auto cnode = node->cast<CNodePtr>();
|
||||
if (cnode == nullptr) {
|
||||
continue;
|
||||
}
|
||||
auto node_name = AnfAlgo::GetCNodeName(cnode);
|
||||
if (node_name == kBNTrainingUpdateOpName) {
|
||||
DoRefresh(cnode);
|
||||
}
|
||||
}
|
||||
return true;
|
||||
}
|
||||
} // namespace opt
|
||||
} // namespace mindspore
|
|
@ -0,0 +1,40 @@
|
|||
/**
|
||||
* Copyright 2020 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_
|
||||
#define MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_
|
||||
|
||||
#include <vector>
|
||||
#include <memory>
|
||||
#include <utility>
|
||||
#include "ir/anf.h"
|
||||
#include "pre_activate/common/pass.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace opt {
|
||||
class RefreshParameterFormat : public Pass {
|
||||
public:
|
||||
explicit RefreshParameterFormat(size_t groups = 1) : Pass("refresh_parameter_format"), groups_(groups) {}
|
||||
~RefreshParameterFormat() override = default;
|
||||
bool Run(const FuncGraphPtr &graph) override;
|
||||
|
||||
private:
|
||||
size_t groups_ = 1;
|
||||
};
|
||||
} // namespace opt
|
||||
} // namespace mindspore
|
||||
|
||||
#endif // MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_
|
Loading…
Reference in New Issue