From f16a78e553f65991bfd8c3397b704f5e8e81539a Mon Sep 17 00:00:00 2001 From: Radomir Djogo Date: Thu, 18 Jul 2024 21:37:14 +0000 Subject: [PATCH] Recip round fp32->fp16b if dest in 16bit mode --- common/inc/sfpu/ckernel_sfpu_recip.h | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/common/inc/sfpu/ckernel_sfpu_recip.h b/common/inc/sfpu/ckernel_sfpu_recip.h index 41c8603..c0f22f8 100644 --- a/common/inc/sfpu/ckernel_sfpu_recip.h +++ b/common/inc/sfpu/ckernel_sfpu_recip.h @@ -55,7 +55,7 @@ sfpi_inline vFloat _sfpu_reciprocal_(const vFloat in) return setexp(result, new_exp); } -template +template inline void _calculate_reciprocal_(const int iterations) { #pragma GCC unroll 8 @@ -70,7 +70,11 @@ inline void _calculate_reciprocal_(const int iterations) } v_endif; - dst_reg[0] = out; + if constexpr (is_fp32_dest_acc_en) { + dst_reg[0] = out; + } else { + dst_reg[0] = reinterpret(float_to_fp16b(out, 0)); + } dst_reg++; }