AArch64: Fix SVE powf routine [BZ #33299]

author Pierre Blanchard <pierre.blanchard@arm.com>
Wed, 20 Aug 2025 17:41:50 +0000 (17:41 +0000)
committer Wilco Dijkstra <wilco.dijkstra@arm.com>
Wed, 20 Aug 2025 17:45:21 +0000 (17:45 +0000)
diff --git a/sysdeps/aarch64/fpu/powf_sve.c b/sysdeps/aarch64/fpu/powf_sve.c
index 7046990aa118504a01183c7474020aa6fd83145b..65e9bd29d9bcca51666c6672beee7ee7f13e5a18 100644
--- a/sysdeps/aarch64/fpu/powf_sve.c
+++ b/sysdeps/aarch64/fpu/powf_sve.c
@@ -223,15 +223,15 @@ sv_powf_core (const svbool_t pg, svuint32_t i, svuint32_t iz, svint32_t k,
    const svbool_t ptrue = svptrue_b64 ();
  
    /* Unpack and promote input vectors (pg, y, z, i, k and sign_bias) into two
-   * in order to perform core computation in double precision.  */
+     in order to perform core computation in double precision.  */
    const svbool_t pg_lo = svunpklo (pg);
    const svbool_t pg_hi = svunpkhi (pg);
-  svfloat64_t y_lo
-      = svcvt_f64_x (pg, svreinterpret_f32 (svunpklo (svreinterpret_u32 (y))));
-  svfloat64_t y_hi
-      = svcvt_f64_x (pg, svreinterpret_f32 (svunpkhi (svreinterpret_u32 (y))));
-  svfloat64_t z_lo = svcvt_f64_x (pg, svreinterpret_f32 (svunpklo (iz)));
-  svfloat64_t z_hi = svcvt_f64_x (pg, svreinterpret_f32 (svunpkhi (iz)));
+  svfloat64_t y_lo = svcvt_f64_x (
+      ptrue, svreinterpret_f32 (svunpklo (svreinterpret_u32 (y))));
+  svfloat64_t y_hi = svcvt_f64_x (
+      ptrue, svreinterpret_f32 (svunpkhi (svreinterpret_u32 (y))));
+  svfloat64_t z_lo = svcvt_f64_x (ptrue, svreinterpret_f32 (svunpklo (iz)));
+  svfloat64_t z_hi = svcvt_f64_x (ptrue, svreinterpret_f32 (svunpkhi (iz)));
    svuint64_t i_lo = svunpklo (i);
    svuint64_t i_hi = svunpkhi (i);
    svint64_t k_lo = svunpklo (k);
@@ -312,7 +312,7 @@ svfloat32_t SV_NAME_F2 (pow) (svfloat32_t x, svfloat32_t y, const svbool_t pg)
                          (23 - V_POWF_EXP2_TABLE_BITS));
  
    /* Compute core in extended precision and return intermediate ylogx results
-   * to handle cases of underflow and underflow in exp.  */
+     to handle cases of underflow and overflow in exp.  */
    svfloat32_t ylogx;
    svfloat32_t ret
        = sv_powf_core (yint_or_xpos, i, iz, k, y, sign_bias, &ylogx, d);
author	Pierre Blanchard <pierre.blanchard@arm.com>
	Wed, 20 Aug 2025 17:41:50 +0000 (17:41 +0000)
committer	Wilco Dijkstra <wilco.dijkstra@arm.com>
	Wed, 20 Aug 2025 17:45:21 +0000 (17:45 +0000)