forked from mindspore-Ecosystem/mindspore
!7004 [MSLITE][Develop] fix bug of arm fp16 cpu op: reopen deconv depthwise
Merge pull request !7004 from yangruoqi713/lite
This commit is contained in:
commit
d51099abf5
|
@ -176,6 +176,7 @@ int DeconvolutionDepthwiseFp16CPUKernel::Run() {
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!need_align_) {
|
if (!need_align_) {
|
||||||
|
memset(execute_output_, 0, out_tensors_.at(kOutputIndex)->ElementsNum() * sizeof(float16_t));
|
||||||
packed_output_ = execute_output_;
|
packed_output_ = execute_output_;
|
||||||
}
|
}
|
||||||
ret = ParallelLaunch(this->context_->thread_pool_, DeconvDwFp16Run, this, conv_param_->thread_num_);
|
ret = ParallelLaunch(this->context_->thread_pool_, DeconvDwFp16Run, this, conv_param_->thread_num_);
|
||||||
|
@ -243,4 +244,6 @@ kernel::LiteKernel *CpuDeconvDwFp16KernelCreator(const std::vector<lite::Tensor
|
||||||
}
|
}
|
||||||
return kernel;
|
return kernel;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
REG_KERNEL(kCPU, kNumberTypeFloat16, PrimitiveType_DeDepthwiseConv2D, CpuDeconvDwFp16KernelCreator)
|
||||||
} // namespace mindspore::kernel
|
} // namespace mindspore::kernel
|
||||||
|
|
Loading…
Reference in New Issue