!48792 Fix the precision problem for TruncateDiv

Merge pull request !48792 from zhanzhan/truncatediv
2023-02-14 02:52:12 +00:00 · 2023-02-14 02:52:12 +00:00 · 5b6ffcf7ce
parent 13b0afac51 931a0b254e
commit 5b6ffcf7ce
1 changed files with 2 additions and 2 deletions
--- a/mindspore/ccsrc/plugin/device/gpu/kernel/cuda_impl/cuda_ops/broadcast_impl.cu
+++ b/mindspore/ccsrc/plugin/device/gpu/kernel/cuda_impl/cuda_ops/broadcast_impl.cu
@@ -1123,8 +1123,8 @@ struct TruncateDivFunc {
 // Explicit specialization of TruncateDivFunc for CUDA `half` operands.
 // The device-side call operator takes two half values by const reference
 // and returns their quotient as a half.
 template <>
 struct TruncateDivFunc<half> {
  __device__ __forceinline__ half operator()(const half &lhs, const half &rhs) {
     // Removed by this change: both operands were widened to float, divided,
     // the quotient was passed through truncf, and the result was converted
     // back to half with __float2half_rn.
-    float res = truncf(__half2float(lhs) / __half2float(rhs));
-    return __float2half_rn(res);
     // Added by this change: the division is done directly on the half
     // operands with __hdiv and the result is returned unchanged.
     // NOTE(review): this path has no truncf (or equivalent) call, so the
     // quotient is no longer truncated here. Presumably intended to match the
     // primary TruncateDivFunc template, which is not visible in this hunk;
     // confirm against the operator's documented semantics.
+    half res = __hdiv(lhs, rhs);
+    return res;
  }
 };