!14400 【MS】【LITE】【GPU】 optimize opencl performance on mate40

From: @wangdongxu6
Reviewed-by: @ddwsky,@hangangqiang
Signed-off-by: @ddwsky
This commit is contained in:
mindspore-ci-bot 2021-03-31 09:22:27 +08:00 committed by Gitee
commit afde4e3bf9
1 changed file with 3 additions and 0 deletions

View File

@@ -350,6 +350,9 @@ void Conv2DOpenCLKernel::SetGlobalLocal() {
size_t global_w = UP_DIV(OW_, block_size_.W);
size_t global_c = UP_DIV(CO_SLICES_, block_size_.C);
int local_max = filter_type_ == MemType::IMG ? 64 : 128;
if (ocl_runtime_->DeviceComputeUnits() > 16) {
local_max = 256;
}
const int local_c_max = 16;
const int OH_threshold = 100;
const int OW_threshold = 100;