From nobody Mon Feb  9 20:18:31 2026
Delivered-To: importer@patchew.org
Received-SPF: pass (zoho.com: domain of gnu.org designates 208.118.235.17 as
 permitted sender) client-ip=208.118.235.17;
 envelope-from=qemu-devel-bounces+importer=patchew.org@nongnu.org;
 helo=lists.gnu.org;
Authentication-Results: mx.zohomail.com;
	dkim=fail;
	spf=pass (zoho.com: domain of gnu.org designates 208.118.235.17 as permitted
 sender)  smtp.mailfrom=qemu-devel-bounces+importer=patchew.org@nongnu.org
Return-Path: <qemu-devel-bounces+importer=patchew.org@nongnu.org>
Received: from lists.gnu.org (lists.gnu.org [208.118.235.17]) by
 mx.zohomail.com
	with SMTPS id 15348267892341003.898888228161;
 Mon, 20 Aug 2018 21:46:29 -0700 (PDT)
Received: from localhost ([::1]:50708 helo=lists.gnu.org)
	by lists.gnu.org with esmtp (Exim 4.71)
	(envelope-from <qemu-devel-bounces+importer=patchew.org@nongnu.org>)
	id 1fryYl-00006G-V7
	for importer@patchew.org; Tue, 21 Aug 2018 00:46:28 -0400
Received: from eggs.gnu.org ([2001:4830:134:3::10]:56520)
	by lists.gnu.org with esmtp (Exim 4.71)
	(envelope-from <dgibson@ozlabs.org>) id 1fryMt-0004C7-Tn
	for qemu-devel@nongnu.org; Tue, 21 Aug 2018 00:34:15 -0400
Received: from Debian-exim by eggs.gnu.org with spam-scanned (Exim 4.71)
	(envelope-from <dgibson@ozlabs.org>) id 1fryMp-0000MW-03
	for qemu-devel@nongnu.org; Tue, 21 Aug 2018 00:34:11 -0400
Received: from ozlabs.org ([203.11.71.1]:39101)
	by eggs.gnu.org with esmtps (TLS1.0:DHE_RSA_AES_256_CBC_SHA1:32)
	(Exim 4.71) (envelope-from <dgibson@ozlabs.org>)
	id 1fryMk-0000Gk-Ss; Tue, 21 Aug 2018 00:34:05 -0400
Received: by ozlabs.org (Postfix, from userid 1007)
	id 41vd9F4ql2z9sCh; Tue, 21 Aug 2018 14:33:51 +1000 (AEST)
DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/simple;
	d=gibson.dropbear.id.au; s=201602; t=1534826033;
	bh=nvjBLhRZ4TSfC5LLasaHiomTJbRKh1sOGnFknL/Leqk=;
	h=From:To:Cc:Subject:Date:In-Reply-To:References:From;
	b=LmbYxYXh7cnN0e7JbnhbY/ciVQnLmoeG/Z/5ZuRVJ1FQy8bFejq+vxWq3NKFBCKqu
	PLtt8bQbTjxxNO2jB6hgi7vEev7fqwRorwlhGKSFAdr6VPuSMCqwYAL0BHs8J9fWvS
	Njx1GtoivABIrTWfpKqGpYqgTk0VfrhvK5Kg0NRc=
From: David Gibson <david@gibson.dropbear.id.au>
To: peter.maydell@linaro.org
Date: Tue, 21 Aug 2018 14:33:26 +1000
Message-Id: <20180821043343.7514-10-david@gibson.dropbear.id.au>
X-Mailer: git-send-email 2.17.1
In-Reply-To: <20180821043343.7514-1-david@gibson.dropbear.id.au>
References: <20180821043343.7514-1-david@gibson.dropbear.id.au>
X-detected-operating-system: by eggs.gnu.org: GNU/Linux 2.2.x-3.x [generic]
X-Received-From: 203.11.71.1
Subject: [Qemu-devel] [PULL 09/26] target/ppc: Use non-arithmetic
 conversions for fp load/store
X-BeenThere: qemu-devel@nongnu.org
X-Mailman-Version: 2.1.21
Precedence: list
List-Id: <qemu-devel.nongnu.org>
List-Unsubscribe: <https://lists.nongnu.org/mailman/options/qemu-devel>,
	<mailto:qemu-devel-request@nongnu.org?subject=unsubscribe>
List-Archive: <http://lists.nongnu.org/archive/html/qemu-devel/>
List-Post: <mailto:qemu-devel@nongnu.org>
List-Help: <mailto:qemu-devel-request@nongnu.org?subject=help>
List-Subscribe: <https://lists.nongnu.org/mailman/listinfo/qemu-devel>,
	<mailto:qemu-devel-request@nongnu.org?subject=subscribe>
Cc: lvivier@redhat.com, aik@ozlabs.ru,
	Richard Henderson <richard.henderson@linaro.org>, groug@kaod.org,
	qemu-devel@nongnu.org, qemu-ppc@nongnu.org, clg@kaod.org,
	David Gibson <david@gibson.dropbear.id.au>
Errors-To: qemu-devel-bounces+importer=patchew.org@nongnu.org
Sender: "Qemu-devel" <qemu-devel-bounces+importer=patchew.org@nongnu.org>
X-ZohoMail-DKIM: fail (Header signature does not verify)
X-ZohoMail: RDKM_2  RSF_0  Z_629925259 SPT_0
Content-Transfer-Encoding: quoted-printable
MIME-Version: 1.0
Content-Type: text/plain; charset="utf-8"

From: Richard Henderson <richard.henderson@linaro.org>

Memory operations have no side effects on fp state.
The use of "real" conversions between float64 and float32
would raise exceptions for SNaN and out-of-range inputs.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
---
 target/ppc/fpu_helper.c            | 61 ++++++++++++++++++++++++------
 target/ppc/helper.h                |  4 +-
 target/ppc/translate/fp-impl.inc.c | 26 +++++--------
 3 files changed, 61 insertions(+), 30 deletions(-)

diff --git a/target/ppc/fpu_helper.c b/target/ppc/fpu_helper.c
index 5af5241ab0..b9bb1b856e 100644
--- a/target/ppc/fpu_helper.c
+++ b/target/ppc/fpu_helper.c
@@ -47,24 +47,61 @@ static inline bool fp_exceptions_enabled(CPUPPCState *e=
nv)
=20
 /*************************************************************************=
****/
 /* Floating point operations helpers */
-uint64_t helper_float32_to_float64(CPUPPCState *env, uint32_t arg)
+
+/*
+ * This is the non-arithmetic conversion that happens e.g. on loads.
+ * In the Power ISA pseudocode, this is called DOUBLE.
+ */
+uint64_t helper_todouble(uint32_t arg)
 {
-    CPU_FloatU f;
-    CPU_DoubleU d;
+    uint32_t abs_arg =3D arg & 0x7fffffff;
+    uint64_t ret;
=20
-    f.l =3D arg;
-    d.d =3D float32_to_float64(f.f, &env->fp_status);
-    return d.ll;
+    if (likely(abs_arg >=3D 0x00800000)) {
+        /* Normalized operand, or Inf, or NaN.  */
+        ret  =3D (uint64_t)extract32(arg, 30, 2) << 62;
+        ret |=3D ((extract32(arg, 30, 1) ^ 1) * (uint64_t)7) << 59;
+        ret |=3D (uint64_t)extract32(arg, 0, 30) << 29;
+    } else {
+        /* Zero or Denormalized operand.  */
+        ret =3D (uint64_t)extract32(arg, 31, 1) << 63;
+        if (unlikely(abs_arg !=3D 0)) {
+            /* Denormalized operand.  */
+            int shift =3D clz32(abs_arg) - 9;
+            int exp =3D -126 - shift + 1023;
+            ret |=3D (uint64_t)exp << 52;
+            ret |=3D abs_arg << (shift + 29);
+        }
+    }
+    return ret;
 }
=20
-uint32_t helper_float64_to_float32(CPUPPCState *env, uint64_t arg)
+/*
+ * This is the non-arithmetic conversion that happens e.g. on stores.
+ * In the Power ISA pseudocode, this is called SINGLE.
+ */
+uint32_t helper_tosingle(uint64_t arg)
 {
-    CPU_FloatU f;
-    CPU_DoubleU d;
+    int exp =3D extract64(arg, 52, 11);
+    uint32_t ret;
=20
-    d.ll =3D arg;
-    f.f =3D float64_to_float32(d.d, &env->fp_status);
-    return f.l;
+    if (likely(exp > 896)) {
+        /* No denormalization required (includes Inf, NaN).  */
+        ret  =3D extract64(arg, 62, 2) << 30;
+        ret |=3D extract64(arg, 29, 30);
+    } else {
+        /* Zero or Denormal result.  If the exponent is in bounds for
+         * a single-precision denormal result, extract the proper bits.
+         * If the input is not zero, and the exponent is out of bounds,
+         * then the result is undefined; this underflows to zero.
+         */
+        ret =3D extract64(arg, 63, 1) << 31;
+        if (unlikely(exp >=3D 874)) {
+            /* Denormal result.  */
+            ret |=3D ((1ULL << 52) | extract64(arg, 0, 52)) >> (896 + 30 -=
 exp);
+        }
+    }
+    return ret;
 }
=20
 static inline int ppc_float32_get_unbiased_exp(float32 f)
diff --git a/target/ppc/helper.h b/target/ppc/helper.h
index 7ed72c2337..ef64248bc4 100644
--- a/target/ppc/helper.h
+++ b/target/ppc/helper.h
@@ -61,8 +61,8 @@ DEF_HELPER_2(compute_fprf_float64, void, env, i64)
 DEF_HELPER_3(store_fpscr, void, env, i64, i32)
 DEF_HELPER_2(fpscr_clrbit, void, env, i32)
 DEF_HELPER_2(fpscr_setbit, void, env, i32)
-DEF_HELPER_2(float64_to_float32, i32, env, i64)
-DEF_HELPER_2(float32_to_float64, i64, env, i32)
+DEF_HELPER_FLAGS_1(todouble, TCG_CALL_NO_RWG_SE, i64, i32)
+DEF_HELPER_FLAGS_1(tosingle, TCG_CALL_NO_RWG_SE, i32, i64)
=20
 DEF_HELPER_4(fcmpo, void, env, i64, i64, i32)
 DEF_HELPER_4(fcmpu, void, env, i64, i64, i32)
diff --git a/target/ppc/translate/fp-impl.inc.c b/target/ppc/translate/fp-i=
mpl.inc.c
index 2fbd4d4f38..a6f522b85c 100644
--- a/target/ppc/translate/fp-impl.inc.c
+++ b/target/ppc/translate/fp-impl.inc.c
@@ -660,15 +660,12 @@ GEN_LDUF(name, ldop, op | 0x21, type);               =
                         \
 GEN_LDUXF(name, ldop, op | 0x01, type);                                   =
    \
 GEN_LDXF(name, ldop, 0x17, op | 0x00, type)
=20
-static inline void gen_qemu_ld32fs(DisasContext *ctx, TCGv_i64 arg1, TCGv =
arg2)
+static void gen_qemu_ld32fs(DisasContext *ctx, TCGv_i64 dest, TCGv addr)
 {
-    TCGv t0 =3D tcg_temp_new();
-    TCGv_i32 t1 =3D tcg_temp_new_i32();
-    gen_qemu_ld32u(ctx, t0, arg2);
-    tcg_gen_trunc_tl_i32(t1, t0);
-    tcg_temp_free(t0);
-    gen_helper_float32_to_float64(arg1, cpu_env, t1);
-    tcg_temp_free_i32(t1);
+    TCGv_i32 tmp =3D tcg_temp_new_i32();
+    tcg_gen_qemu_ld_i32(tmp, addr, ctx->mem_idx, DEF_MEMOP(MO_UL));
+    gen_helper_todouble(dest, tmp);
+    tcg_temp_free_i32(tmp);
 }
=20
  /* lfd lfdu lfdux lfdx */
@@ -836,15 +833,12 @@ GEN_STUF(name, stop, op | 0x21, type);               =
                         \
 GEN_STUXF(name, stop, op | 0x01, type);                                   =
    \
 GEN_STXF(name, stop, 0x17, op | 0x00, type)
=20
-static inline void gen_qemu_st32fs(DisasContext *ctx, TCGv_i64 arg1, TCGv =
arg2)
+static void gen_qemu_st32fs(DisasContext *ctx, TCGv_i64 src, TCGv addr)
 {
-    TCGv_i32 t0 =3D tcg_temp_new_i32();
-    TCGv t1 =3D tcg_temp_new();
-    gen_helper_float64_to_float32(t0, cpu_env, arg1);
-    tcg_gen_extu_i32_tl(t1, t0);
-    tcg_temp_free_i32(t0);
-    gen_qemu_st32(ctx, t1, arg2);
-    tcg_temp_free(t1);
+    TCGv_i32 tmp =3D tcg_temp_new_i32();
+    gen_helper_tosingle(tmp, src);
+    tcg_gen_qemu_st_i32(tmp, addr, ctx->mem_idx, DEF_MEMOP(MO_UL));
+    tcg_temp_free_i32(tmp);
 }
=20
 /* stfd stfdu stfdux stfdx */
--=20
2.17.1