forked from OSSInnovation/mindspore
commit
0c2e7f5092
|
@ -27,6 +27,5 @@ MS_REG_GPU_KERNEL_ONE(CTCLossV2,
|
||||||
.AddOutputAttr(kNumberTypeFloat32)
|
.AddOutputAttr(kNumberTypeFloat32)
|
||||||
.AddOutputAttr(kNumberTypeFloat32),
|
.AddOutputAttr(kNumberTypeFloat32),
|
||||||
CtcLossGpuKernel, float)
|
CtcLossGpuKernel, float)
|
||||||
|
|
||||||
} // namespace kernel
|
} // namespace kernel
|
||||||
} // namespace mindspore
|
} // namespace mindspore
|
||||||
|
|
|
@ -110,7 +110,6 @@ void ReplaceOutput(const FuncGraphPtr &graph, const AnfNodePtr &bn_grad, const A
|
||||||
manager->Replace(relu_grad, bn_add_relu_grad_output[kBNAddReluGradOutputNum - 1]);
|
manager->Replace(relu_grad, bn_add_relu_grad_output[kBNAddReluGradOutputNum - 1]);
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
const BaseRef BatchNormAddReluGradFusion::DefinePattern() const {
|
const BaseRef BatchNormAddReluGradFusion::DefinePattern() const {
|
||||||
|
|
|
@ -81,8 +81,6 @@ void GPUSession::Optimize(const std::shared_ptr<KernelGraph> &kernel_graph) {
|
||||||
auto pm = std::make_shared<opt::PassManager>();
|
auto pm = std::make_shared<opt::PassManager>();
|
||||||
pm->AddPass(std::make_shared<opt::AdamWeightDecayFusion>());
|
pm->AddPass(std::make_shared<opt::AdamWeightDecayFusion>());
|
||||||
pm->AddPass(std::make_shared<opt::AdamFusion>());
|
pm->AddPass(std::make_shared<opt::AdamFusion>());
|
||||||
// pm->AddPass(std::make_shared<opt::ApplyMomentumWeightDecayScaleFusion>());
|
|
||||||
// pm->AddPass(std::make_shared<opt::ApplyMomentumScaleFusion>());
|
|
||||||
pm->AddPass(std::make_shared<opt::ReplaceBNCastFusion>());
|
pm->AddPass(std::make_shared<opt::ReplaceBNCastFusion>());
|
||||||
pm->AddPass(std::make_shared<opt::ReplaceBNGradCastFusion>());
|
pm->AddPass(std::make_shared<opt::ReplaceBNGradCastFusion>());
|
||||||
pm->AddPass(std::make_shared<opt::ReplaceMomentumCastFusion>());
|
pm->AddPass(std::make_shared<opt::ReplaceMomentumCastFusion>());
|
||||||
|
@ -98,7 +96,6 @@ void GPUSession::HardwareOptimize(const std::shared_ptr<KernelGraph> &kernel_gra
|
||||||
pm->AddPass(std::make_shared<opt::BatchNormReluFusion>());
|
pm->AddPass(std::make_shared<opt::BatchNormReluFusion>());
|
||||||
pm->AddPass(std::make_shared<opt::BatchNormReluGradFusion>());
|
pm->AddPass(std::make_shared<opt::BatchNormReluGradFusion>());
|
||||||
pm->AddPass(std::make_shared<opt::BatchNormAddReluFusion>());
|
pm->AddPass(std::make_shared<opt::BatchNormAddReluFusion>());
|
||||||
// pm->AddPass(std::make_shared<opt::BatchNormAddReluGradFusion>());
|
|
||||||
pm->AddPass(std::make_shared<opt::InsertFormatTransformOp>());
|
pm->AddPass(std::make_shared<opt::InsertFormatTransformOp>());
|
||||||
pm->AddPass(std::make_shared<opt::RemoveFormatTransformPair>());
|
pm->AddPass(std::make_shared<opt::RemoveFormatTransformPair>());
|
||||||
pm->AddPass(std::make_shared<opt::RemoveRedundantFormatTransform>());
|
pm->AddPass(std::make_shared<opt::RemoveRedundantFormatTransform>());
|
||||||
|
|
Loading…
Reference in New Issue