aarch64: Force vector in SVE gimple_folder::fold_active_lanes_to.

author Jennifer Schmitz <jschmitz@nvidia.com>
Thu, 28 Aug 2025 10:10:27 +0000 (03:10 -0700)
committer Jennifer Schmitz <jschmitz@nvidia.com>
Tue, 16 Sep 2025 14:06:24 +0000 (16:06 +0200)
diff --git a/gcc/config/aarch64/aarch64-sve-builtins.cc b/gcc/config/aarch64/aarch64-sve-builtins.cc

index 909d9e524e1e0a77f60459c3e58a5f1246aee01a..3facc42843e331169a704dcf821eec21072e026b 100644 (file)
--- a/gcc/config/aarch64/aarch64-sve-builtins.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins.cc
@@ -3799,6 +3799,7 @@ gimple_folder::fold_active_lanes_to (tree x)
  
    gimple_seq stmts = NULL;
    tree pred = convert_pred (stmts, vector_type (0), 0);
+  x = force_vector (stmts, TREE_TYPE (lhs), x);
    gsi_insert_seq_before (gsi, stmts, GSI_SAME_STMT);
    return gimple_build_assign (lhs, VEC_COND_EXPR, pred, x, vec_inactive);
  }
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s16.c

index e9b6bf83b032e8751019026faa80e7f1d76ba04a..4148097cc63cb0bce6326e6bb4cae3d28364a407 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s16.c
@@ -331,6 +331,16 @@ TEST_UNIFORM_Z (mul_1op1_s16_z_tied2, svint16_t,
                 z0 = svmul_s16_z (p0, svdup_s16 (1), z0),
                 z0 = svmul_z (p0, svdup_s16 (1), z0))
  
+/*
+** mul_1op1n_s16_z:
+**     movprfx z0\.h, p0/z, z0\.h
+**     mov     z0\.h, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_s16_z, svint16_t, int16_t,
+       z0 = svmul_n_s16_z (p0, svdup_s16 (1), x0),
+       z0 = svmul_z (p0, svdup_s16 (1), x0))
+
  /*
  ** mul_3_s16_z_tied1:
  **     mov     (z[0-9]+\.h), #3
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s32.c

index 71c476f48ca36297ce62f59aeb348d1f51b9318b..2c53e3f14d64710fd663a76cb2a2721ea4e254c3 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s32.c
@@ -341,6 +341,16 @@ TEST_UNIFORM_Z (mul_1op1_s32_z_tied2, svint32_t,
                 z0 = svmul_s32_z (p0, svdup_s32 (1), z0),
                 z0 = svmul_z (p0, svdup_s32 (1), z0))
  
+/*
+** mul_1op1n_s32_z:
+**     movprfx z0\.s, p0/z, z0\.s
+**     mov     z0\.s, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_s32_z, svint32_t, int32_t,
+       z0 = svmul_n_s32_z (p0, svdup_s32 (1), x0),
+       z0 = svmul_z (p0, svdup_s32 (1), x0))
+
  /*
  ** mul_3_s32_z_tied1:
  **     mov     (z[0-9]+\.s), #3
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s64.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s64.c

index a34dc27740a811bc41271ccaa5b2121f108ba2df..55342a13f8bd623103abbda13377f25ce6b9a8b8 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s64.c
@@ -340,6 +340,16 @@ TEST_UNIFORM_Z (mul_1op1_s64_z_tied2, svint64_t,
                 z0 = svmul_s64_z (p0, svdup_s64 (1), z0),
                 z0 = svmul_z (p0, svdup_s64 (1), z0))
  
+/*
+** mul_1op1n_s64_z:
+**     movprfx z0\.d, p0/z, z0\.d
+**     mov     z0\.d, p0/m, x0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_s64_z, svint64_t, int64_t,
+       z0 = svmul_n_s64_z (p0, svdup_s64 (1), x0),
+       z0 = svmul_z (p0, svdup_s64 (1), x0))
+
  /*
  ** mul_2_s64_z_tied1:
  **     movprfx z0.d, p0/z, z0.d
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s8.c

index 683e15eccecb8a43cc03a2b9a417f0aad7a26f7d..786a424eeead9f1eb767e57a9ef932effbda4288 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s8.c
@@ -331,6 +331,16 @@ TEST_UNIFORM_Z (mul_1op1_s8_z_tied2, svint8_t,
                 z0 = svmul_s8_z (p0, svdup_s8 (1), z0),
                 z0 = svmul_z (p0, svdup_s8 (1), z0))
  
+/*
+** mul_1op1n_s8_z:
+**     movprfx z0\.b, p0/z, z0\.b
+**     mov     z0\.b, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_s8_z, svint8_t, int8_t,
+       z0 = svmul_n_s8_z (p0, svdup_s8 (1), x0),
+       z0 = svmul_z (p0, svdup_s8 (1), x0))
+
  /*
  ** mul_3_s8_z_tied1:
  **     mov     (z[0-9]+\.b), #3
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u16.c

index e228dc5995dfe43d3634127421f4935664a1646b..ed08635382d51cceb7e3f519b5398d09bd75eaae 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u16.c
@@ -312,6 +312,16 @@ TEST_UNIFORM_Z (mul_1op1_u16_z_tied2, svuint16_t,
                 z0 = svmul_u16_z (p0, svdup_u16 (1), z0),
                 z0 = svmul_z (p0, svdup_u16 (1), z0))
  
+/*
+** mul_1op1n_u16_z:
+**     movprfx z0\.h, p0/z, z0\.h
+**     mov     z0\.h, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_u16_z, svuint16_t, uint16_t,
+       z0 = svmul_n_u16_z (p0, svdup_u16 (1), x0),
+       z0 = svmul_z (p0, svdup_u16 (1), x0))
+
  /*
  ** mul_3_u16_z_tied1:
  **     mov     (z[0-9]+\.h), #3
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u32.c

index e8f52c9d7854b31e8c4438f13957ae1c05964552..f82ac4269e8fd37e9c9455f6f1e0d028e7457c97 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u32.c
@@ -312,6 +312,16 @@ TEST_UNIFORM_Z (mul_1op1_u32_z_tied2, svuint32_t,
                 z0 = svmul_u32_z (p0, svdup_u32 (1), z0),
                 z0 = svmul_z (p0, svdup_u32 (1), z0))
  
+/*
+** mul_1op1n_u32_z:
+**     movprfx z0\.s, p0/z, z0\.s
+**     mov     z0\.s, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_u32_z, svuint32_t, uint32_t,
+       z0 = svmul_n_u32_z (p0, svdup_u32 (1), x0),
+       z0 = svmul_z (p0, svdup_u32 (1), x0))
+
  /*
  ** mul_3_u32_z_tied1:
  **     mov     (z[0-9]+\.s), #3
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u64.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u64.c

index 2ccdc3642c52085f5c0035af1a4c32341c013f50..9f1bfff5fd2fd0a4f9d09d962f8ad9dd81eb1e49 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u64.c
@@ -333,6 +333,16 @@ TEST_UNIFORM_Z (mul_1op1_u64_z_tied2, svuint64_t,
                 z0 = svmul_u64_z (p0, svdup_u64 (1), z0),
                 z0 = svmul_z (p0, svdup_u64 (1), z0))
  
+/*
+** mul_1op1n_u64_z:
+**     movprfx z0\.d, p0/z, z0\.d
+**     mov     z0\.d, p0/m, x0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_u64_z, svuint64_t, uint64_t,
+       z0 = svmul_n_u64_z (p0, svdup_u64 (1), x0),
+       z0 = svmul_z (p0, svdup_u64 (1), x0))
+
  /*
  ** mul_2_u64_z_tied1:
  **     movprfx z0.d, p0/z, z0.d
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u8.c

index 8e53a4821f05d19bf1e950ea40ef8ea0f80ab764..b2c1edf5ff8245dc8ec08a11493571f7d01aabac 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u8.c
@@ -312,6 +312,16 @@ TEST_UNIFORM_Z (mul_1op1_u8_z_tied2, svuint8_t,
                 z0 = svmul_u8_z (p0, svdup_u8 (1), z0),
                 z0 = svmul_z (p0, svdup_u8 (1), z0))
  
+/*
+** mul_1op1n_u8_z:
+**     movprfx z0\.b, p0/z, z0\.b
+**     mov     z0\.b, p0/m, w0
+**     ret
+*/
+TEST_UNIFORM_ZX (mul_1op1n_u8_z, svuint8_t, uint8_t,
+       z0 = svmul_n_u8_z (p0, svdup_u8 (1), x0),
+       z0 = svmul_z (p0, svdup_u8 (1), x0))
+
  /*
  ** mul_3_u8_z_tied1:
  **     mov     (z[0-9]+\.b), #3
author	Jennifer Schmitz <jschmitz@nvidia.com>
	Thu, 28 Aug 2025 10:10:27 +0000 (03:10 -0700)
committer	Jennifer Schmitz <jschmitz@nvidia.com>
	Tue, 16 Sep 2025 14:06:24 +0000 (16:06 +0200)
gcc/config/aarch64/aarch64-sve-builtins.cc		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s16.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s32.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s64.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_s8.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u16.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u32.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u64.c		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/sve/acle/asm/mul_u8.c		patch | blob | blame | history