[3/9] target/arm: Fix float16 to/from int16

Message ID	20180425012300.14698-4-richard.henderson@linaro.org
State	Superseded
Headers	show Delivered-To: patch@linaro.org Received-SPF: pass (google.com: domain of qemu-devel-bounces+patch=linaro.org@nongnu.org designates 2001:4830:134:3::11 as permitted sender) client-ip=2001:4830:134:3::11; From: Richard Henderson <richard.henderson@linaro.org> To: qemu-devel@nongnu.org Date: Tue, 24 Apr 2018 15:22:54 -1000 Message-Id: <20180425012300.14698-4-richard.henderson@linaro.org> In-Reply-To: <20180425012300.14698-1-richard.henderson@linaro.org> References: <20180425012300.14698-1-richard.henderson@linaro.org> Subject: [Qemu-devel] [PATCH 3/9] target/arm: Fix float16 to/from int16 Precedence: list Cc: peter.maydell@linaro.org, alex.bennee@linaro.org Errors-To: qemu-devel-bounces+patch=linaro.org@nongnu.org Sender: "Qemu-devel" <qemu-devel-bounces+patch=linaro.org@nongnu.org>
Series	target/arm: Fixups for ARM_FEATURE_V8_FP16 \| expand [0/9] target/arm: Fixups for ARM_FEATURE_V8_FP16 [1/9] target/arm: Implement vector shifted SCVF/UCVF for fp16 [2/9] target/arm: Implement vector shifted FCVT for fp16 [3/9] target/arm: Fix float16 to/from int16 [4/9] target/arm: Clear SVE high bits for FMOV [5/9] target/arm: Implement FMOV (general) for fp16 [6/9] target/arm: Implement FCVT (scalar, integer) for fp16 [7/9] target/arm: Implement FCVT (scalar, fixed-point) for fp16 [8/9] target/arm: Implement FP data-processing (2 source) for fp16 [9/9] target/arm: Implement FP data-processing (3 source) for fp16

Message ID

20180425012300.14698-4-richard.henderson@linaro.org

State

Superseded

Headers

Received-SPF: pass (google.com: domain of
	qemu-devel-bounces+patch=linaro.org@nongnu.org designates
	2001:4830:134:3::11 as permitted sender)
	client-ip=2001:4830:134:3::11; 
From: Richard Henderson <richard.henderson@linaro.org>
To: qemu-devel@nongnu.org
Date: Tue, 24 Apr 2018 15:22:54 -1000
Message-Id: <20180425012300.14698-4-richard.henderson@linaro.org>
In-Reply-To: <20180425012300.14698-1-richard.henderson@linaro.org>
References: <20180425012300.14698-1-richard.henderson@linaro.org>
Subject: [Qemu-devel] [PATCH 3/9] target/arm: Fix float16 to/from int16
Precedence: list
Cc: peter.maydell@linaro.org, alex.bennee@linaro.org
Errors-To: qemu-devel-bounces+patch=linaro.org@nongnu.org
Sender: "Qemu-devel" <qemu-devel-bounces+patch=linaro.org@nongnu.org>

Series

target/arm: Fixups for ARM_FEATURE_V8_FP16 | expand

Commit Message

Richard Henderson April 25, 2018, 1:22 a.m. UTC

The instruction "ucvtf v0.4h, v04h, #2", with input 0x8000u,
overflows the intermediate float16 to infinity before we have a
chance to scale the output.  Use float64 as the intermediate type
so that no input argument (uint32_t in this case) can overflow
or round before scaling.  Given the declared argument, the signed
int32_t function has the same problem.

When converting from float16 to integer, using u/int32_t instead
of u/int16_t means that the bounding is incorrect.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>

---
 target/arm/helper.h        |  4 ++--
 target/arm/helper.c        | 53 ++++++++++++++++++++++++++++++++++++++++++++--
 target/arm/translate-a64.c |  4 ++--
 3 files changed, 55 insertions(+), 6 deletions(-)

-- 
2.14.3

Comments

Alex Bennée May 1, 2018, 10:10 a.m. UTC | #1

Richard Henderson <richard.henderson@linaro.org> writes:

> The instruction "ucvtf v0.4h, v04h, #2", with input 0x8000u,

> overflows the intermediate float16 to infinity before we have a

> chance to scale the output.  Use float64 as the intermediate type

> so that no input argument (uint32_t in this case) can overflow

> or round before scaling.  Given the declared argument, the signed

> int32_t function has the same problem.

>

> When converting from float16 to integer, using u/int32_t instead

> of u/int16_t means that the bounding is incorrect.

>

> Signed-off-by: Richard Henderson <richard.henderson@linaro.org>


Reviewed-by: Alex Bennée <alex.bennee@linaro.org>


> ---

>  target/arm/helper.h        |  4 ++--

>  target/arm/helper.c        | 53 ++++++++++++++++++++++++++++++++++++++++++++--

>  target/arm/translate-a64.c |  4 ++--

>  3 files changed, 55 insertions(+), 6 deletions(-)

>

> diff --git a/target/arm/helper.h b/target/arm/helper.h

> index b3ae394b4f..eafd5d746b 100644

> --- a/target/arm/helper.h

> +++ b/target/arm/helper.h

> @@ -149,8 +149,8 @@ DEF_HELPER_3(vfp_toshd_round_to_zero, i64, f64, i32, ptr)

>  DEF_HELPER_3(vfp_tosld_round_to_zero, i64, f64, i32, ptr)

>  DEF_HELPER_3(vfp_touhd_round_to_zero, i64, f64, i32, ptr)

>  DEF_HELPER_3(vfp_tould_round_to_zero, i64, f64, i32, ptr)

> -DEF_HELPER_3(vfp_toulh, i32, f16, i32, ptr)

> -DEF_HELPER_3(vfp_toslh, i32, f16, i32, ptr)

> +DEF_HELPER_3(vfp_touhh, i32, f16, i32, ptr)

> +DEF_HELPER_3(vfp_toshh, i32, f16, i32, ptr)

>  DEF_HELPER_3(vfp_toshs, i32, f32, i32, ptr)

>  DEF_HELPER_3(vfp_tosls, i32, f32, i32, ptr)

>  DEF_HELPER_3(vfp_tosqs, i64, f32, i32, ptr)

> diff --git a/target/arm/helper.c b/target/arm/helper.c

> index ea09510599..743f34bd0a 100644

> --- a/target/arm/helper.c

> +++ b/target/arm/helper.c

> @@ -11409,11 +11409,60 @@ VFP_CONV_FIX_A64(sq, s, 32, 64, int64)

>  VFP_CONV_FIX(uh, s, 32, 32, uint16)

>  VFP_CONV_FIX(ul, s, 32, 32, uint32)

>  VFP_CONV_FIX_A64(uq, s, 32, 64, uint64)

> -VFP_CONV_FIX_A64(sl, h, 16, 32, int32)

> -VFP_CONV_FIX_A64(ul, h, 16, 32, uint32)

> +

>  #undef VFP_CONV_FIX

>  #undef VFP_CONV_FIX_FLOAT

>  #undef VFP_CONV_FLOAT_FIX_ROUND

> +#undef VFP_CONV_FIX_A64

> +

> +/* Conversion to/from f16 can overflow to infinity before/after scaling.

> + * Therefore we convert to f64 (which does not round), scale,

> + * and then convert f64 to f16 (which may round).

> + */

> +

> +static float16 do_postscale_fp16(float64 f, int shift, float_status *fpst)

> +{

> +    return float64_to_float16(float64_scalbn(f, -shift, fpst), true, fpst);

> +}

> +

> +float16 HELPER(vfp_sltoh)(uint32_t x, uint32_t shift, void *fpst)

> +{

> +    return do_postscale_fp16(int32_to_float64(x, fpst), shift, fpst);

> +}

> +

> +float16 HELPER(vfp_ultoh)(uint32_t x, uint32_t shift, void *fpst)

> +{

> +    return do_postscale_fp16(uint32_to_float64(x, fpst), shift, fpst);

> +}

> +

> +static float64 do_prescale_fp16(float16 f, int shift, float_status *fpst)

> +{

> +    if (unlikely(float16_is_any_nan(f))) {

> +        float_raise(float_flag_invalid, fpst);

> +        return 0;

> +    } else {

> +        int old_exc_flags = get_float_exception_flags(fpst);

> +        float64 ret;

> +

> +        ret = float16_to_float64(f, true, fpst);

> +        ret = float64_scalbn(ret, shift, fpst);

> +        old_exc_flags |= get_float_exception_flags(fpst)

> +            & float_flag_input_denormal;

> +        set_float_exception_flags(old_exc_flags, fpst);

> +

> +        return ret;

> +    }

> +}

> +

> +uint32_t HELPER(vfp_toshh)(float16 x, uint32_t shift, void *fpst)

> +{

> +    return float64_to_int16(do_prescale_fp16(x, shift, fpst), fpst);

> +}

> +

> +uint32_t HELPER(vfp_touhh)(float16 x, uint32_t shift, void *fpst)

> +{

> +    return float64_to_uint16(do_prescale_fp16(x, shift, fpst), fpst);

> +}

>

>  /* Set the current fp rounding mode and return the old one.

>   * The argument is a softfloat float_round_ value.

> diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c

> index e2d11998bd..b27892d971 100644

> --- a/target/arm/translate-a64.c

> +++ b/target/arm/translate-a64.c

> @@ -7181,9 +7181,9 @@ static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,

>          switch (size) {

>          case MO_16:

>              if (is_u) {

> -                fn = gen_helper_vfp_toulh;

> +                fn = gen_helper_vfp_touhh;

>              } else {

> -                fn = gen_helper_vfp_toslh;

> +                fn = gen_helper_vfp_toshh;

>              }

>              break;

>          case MO_32:



--
Alex Bennée

diff --git a/target/arm/helper.h b/target/arm/helper.h
index b3ae394b4f..eafd5d746b 100644
--- a/target/arm/helper.h
+++ b/target/arm/helper.h
@@ -149,8 +149,8 @@  DEF_HELPER_3(vfp_toshd_round_to_zero, i64, f64, i32, ptr)
 DEF_HELPER_3(vfp_tosld_round_to_zero, i64, f64, i32, ptr)
 DEF_HELPER_3(vfp_touhd_round_to_zero, i64, f64, i32, ptr)
 DEF_HELPER_3(vfp_tould_round_to_zero, i64, f64, i32, ptr)
-DEF_HELPER_3(vfp_toulh, i32, f16, i32, ptr)
-DEF_HELPER_3(vfp_toslh, i32, f16, i32, ptr)
+DEF_HELPER_3(vfp_touhh, i32, f16, i32, ptr)
+DEF_HELPER_3(vfp_toshh, i32, f16, i32, ptr)
 DEF_HELPER_3(vfp_toshs, i32, f32, i32, ptr)
 DEF_HELPER_3(vfp_tosls, i32, f32, i32, ptr)
 DEF_HELPER_3(vfp_tosqs, i64, f32, i32, ptr)
diff --git a/target/arm/helper.c b/target/arm/helper.c
index ea09510599..743f34bd0a 100644
--- a/target/arm/helper.c
+++ b/target/arm/helper.c
@@ -11409,11 +11409,60 @@  VFP_CONV_FIX_A64(sq, s, 32, 64, int64)
 VFP_CONV_FIX(uh, s, 32, 32, uint16)
 VFP_CONV_FIX(ul, s, 32, 32, uint32)
 VFP_CONV_FIX_A64(uq, s, 32, 64, uint64)
-VFP_CONV_FIX_A64(sl, h, 16, 32, int32)
-VFP_CONV_FIX_A64(ul, h, 16, 32, uint32)
+
 #undef VFP_CONV_FIX
 #undef VFP_CONV_FIX_FLOAT
 #undef VFP_CONV_FLOAT_FIX_ROUND
+#undef VFP_CONV_FIX_A64
+
+/* Conversion to/from f16 can overflow to infinity before/after scaling.
+ * Therefore we convert to f64 (which does not round), scale,
+ * and then convert f64 to f16 (which may round).
+ */
+
+static float16 do_postscale_fp16(float64 f, int shift, float_status *fpst)
+{
+    return float64_to_float16(float64_scalbn(f, -shift, fpst), true, fpst);
+}
+
+float16 HELPER(vfp_sltoh)(uint32_t x, uint32_t shift, void *fpst)
+{
+    return do_postscale_fp16(int32_to_float64(x, fpst), shift, fpst);
+}
+
+float16 HELPER(vfp_ultoh)(uint32_t x, uint32_t shift, void *fpst)
+{
+    return do_postscale_fp16(uint32_to_float64(x, fpst), shift, fpst);
+}
+
+static float64 do_prescale_fp16(float16 f, int shift, float_status *fpst)
+{
+    if (unlikely(float16_is_any_nan(f))) {
+        float_raise(float_flag_invalid, fpst);
+        return 0;
+    } else {
+        int old_exc_flags = get_float_exception_flags(fpst);
+        float64 ret;
+
+        ret = float16_to_float64(f, true, fpst);
+        ret = float64_scalbn(ret, shift, fpst);
+        old_exc_flags |= get_float_exception_flags(fpst)
+            & float_flag_input_denormal;
+        set_float_exception_flags(old_exc_flags, fpst);
+
+        return ret;
+    }
+}
+
+uint32_t HELPER(vfp_toshh)(float16 x, uint32_t shift, void *fpst)
+{
+    return float64_to_int16(do_prescale_fp16(x, shift, fpst), fpst);
+}
+
+uint32_t HELPER(vfp_touhh)(float16 x, uint32_t shift, void *fpst)
+{
+    return float64_to_uint16(do_prescale_fp16(x, shift, fpst), fpst);
+}
 
 /* Set the current fp rounding mode and return the old one.
  * The argument is a softfloat float_round_ value.
diff --git a/target/arm/translate-a64.c b/target/arm/translate-a64.c
index e2d11998bd..b27892d971 100644
--- a/target/arm/translate-a64.c
+++ b/target/arm/translate-a64.c
@@ -7181,9 +7181,9 @@  static void handle_simd_shift_fpint_conv(DisasContext *s, bool is_scalar,
         switch (size) {
         case MO_16:
             if (is_u) {
-                fn = gen_helper_vfp_toulh;
+                fn = gen_helper_vfp_touhh;
             } else {
-                fn = gen_helper_vfp_toslh;
+                fn = gen_helper_vfp_toshh;
             }
             break;
         case MO_32:

[3/9] target/arm: Fix float16 to/from int16

Commit Message

Comments

Patch