From: Saurabh Jha <saurabh.jha@arm.com>
Date: Wed, 11 Mar 2026 10:30:04 +0000 (+0000)
Subject: aarch64: mingw: Add more tests for variadic hva
X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=f9d51409f978afa569cf6a9bc145f9c8d31ddda2;p=thirdparty%2Fgcc.git

aarch64: mingw: Add more tests for variadic hva

The test gcc.target/aarch64/mingw/variadic_hva.c started failing after
this commit:
b67918fddab42c434c10bedff6c210c55ed907a0

This commit replaces the test with three variants, each compiled with an
option that makes code generation more predictable, so that these tests
are less likely to break with future changes. The options used are:
1. -fno-section-anchors
2. -mcmodel=tiny
3. -mcmodel=small.

gcc/testsuite/ChangeLog:

	* gcc.target/aarch64/mingw/variadic_hva.c: Deleted and created
	three variants.
	* gcc.target/aarch64/mingw/variadic_hva1.c: Derived from
	variadic_hva.c and compiled with option -fno-section-anchors.
	* gcc.target/aarch64/mingw/variadic_hva2.c: Derived from
	variadic_hva.c and compiled with option -mcmodel=tiny.
	* gcc.target/aarch64/mingw/variadic_hva3.c: Derived from
	variadic_hva.c and compiled with option -mcmodel=small.
---

diff --git a/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva1.c b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva1.c
new file mode 100644
index 00000000000..65a230445f8
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva1.c
@@ -0,0 +1,93 @@
+/* { dg-do compile } */
+/* { dg-options "-fno-section-anchors" } */
+/* { dg-final { check-function-bodies "**" "" } } */
+
+#include <arm_neon.h>
+#include <stdarg.h>
+
+typedef struct {  /* Aggregate of four float32x4_t NEON vectors; used as the variadic argument type below. */
+  float32x4_t a;
+  float32x4_t b;
+  float32x4_t c;
+  float32x4_t d;
+} mat4x4;
+
+mat4x4 accumulate(int count, ...) {  /* Field-wise sum of `count` mat4x4 values read from the variadic list. */
+    va_list va;
+    va_start(va, count);  /* Variadic arguments begin after `count`. */
+
+    mat4x4 result = {  /* Every lane of every field starts at 0.0f. */
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f)
+    };
+
+    for (int i = 0; i < count; ++i) {
+        mat4x4 v = va_arg(va, mat4x4);  /* Each iteration consumes one whole mat4x4 argument. */
+        result.a = vaddq_f32(result.a, v.a);
+        result.b = vaddq_f32(result.b, v.b);
+        result.c = vaddq_f32(result.c, v.c);
+        result.d = vaddq_f32(result.d, v.d);
+    }
+
+    va_end(va);
+    return result;  /* The accumulated aggregate is returned by value. */
+}
+
+
+/**
+ * For aarch64-w64-mingw32 target, the Homogeneous Vector Aggregate (HVA) types
+ * are not treated specially.
+ *
+ * This is in contrast to the aarch64-linux-gnu target where float32x4n args
+ * would be loaded into 128 bit Q registers.
+ */
+
+
+/*
+** main:
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**	...
+*/
+int main()  /* Caller whose generated assembly is matched by the check-function-bodies pattern above. */
+{
+  float32x4_t x = {1.0, 2.0, 3.0, 4.0};
+  float32x4_t y = {2.0, 3.0, 4.0, 5.0};
+  float32x4_t z = {3.0, 4.0, 5.0, 6.0};
+  float32x4_t w = {4.0, 5.0, 6.0, 7.0};
+
+  accumulate (4, x, y, z, w);  /* Result is discarded. NOTE(review): passes four float32x4_t values while accumulate reads each argument as mat4x4; the test is compile-only (dg-do compile), but confirm this is intended. */
+  return 0;
+}
diff --git a/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva.c b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva2.c
similarity index 84%
rename from gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva.c
rename to gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva2.c
index 7c690d38472..f7a6dbafa47 100644
--- a/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva.c
+++ b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva2.c
@@ -1,5 +1,5 @@
 /* { dg-do compile } */
-/* { dg-additional-options "-std=c99" } */
+/* { dg-options "-mcmodel=tiny" } */
 /* { dg-final { check-function-bodies "**" "" } } */
 
 #include <arm_neon.h>
@@ -48,34 +48,34 @@ mat4x4 accumulate(int count, ...) {
 /*
 ** main:
 **	...
-** 	ldr	q\d+, \[x\d+, #:lo\d+:\.LC\d+\]
+** 	ldr	q\d+, \.LC\d+
 ** 	str	q\d+, \[sp, \d+\]
 **	...
-** 	ldr	q\d+, \[x\d+, #:lo\d+:\.LC\d+\]
+** 	ldr	q\d+, \.LC\d+
 ** 	str	q\d+, \[sp, \d+\]
 **	...
-** 	ldr	q\d+, \[x\d+, #:lo\d+:\.LC\d+\]
+** 	ldr	q\d+, \.LC\d+
 ** 	str	q\d+, \[sp, \d+\]
 **	...
-** 	ldr	q\d+, \[x\d+, #:lo\d+:\.LC\d+\]
+** 	ldr	q\d+, \.LC\d+
 ** 	str	q\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 ** 	ldr	x\d+, \[sp, \d+\]
-**  ...
+**  	...
 */
 int main()
 {
@@ -86,4 +86,4 @@ int main()
 
   accumulate (4, x, y, z, w);
   return 0;
-}
\ No newline at end of file
+}
diff --git a/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva3.c b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva3.c
new file mode 100644
index 00000000000..64971b2cc93
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/mingw/variadic_hva3.c
@@ -0,0 +1,93 @@
+/* { dg-do compile } */
+/* { dg-options "-mcmodel=small" } */
+/* { dg-final { check-function-bodies "**" "" } } */
+
+#include <arm_neon.h>
+#include <stdarg.h>
+
+typedef struct {  /* Aggregate of four float32x4_t NEON vectors; used as the variadic argument type below. */
+  float32x4_t a;
+  float32x4_t b;
+  float32x4_t c;
+  float32x4_t d;
+} mat4x4;
+
+mat4x4 accumulate(int count, ...) {  /* Field-wise sum of `count` mat4x4 values read from the variadic list. */
+    va_list va;
+    va_start(va, count);  /* Variadic arguments begin after `count`. */
+
+    mat4x4 result = {  /* Every lane of every field starts at 0.0f. */
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f),
+      vdupq_n_f32(0.0f)
+    };
+
+    for (int i = 0; i < count; ++i) {
+        mat4x4 v = va_arg(va, mat4x4);  /* Each iteration consumes one whole mat4x4 argument. */
+        result.a = vaddq_f32(result.a, v.a);
+        result.b = vaddq_f32(result.b, v.b);
+        result.c = vaddq_f32(result.c, v.c);
+        result.d = vaddq_f32(result.d, v.d);
+    }
+
+    va_end(va);
+    return result;  /* The accumulated aggregate is returned by value. */
+}
+
+
+/**
+ * For aarch64-w64-mingw32 target, the Homogeneous Vector Aggregate (HVA) types
+ * are not treated specially.
+ *
+ * This is in contrast to the aarch64-linux-gnu target where float32x4n args
+ * would be loaded into 128 bit Q registers.
+ */
+
+
+/*
+** main:
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**	...
+**	add	x\d+, x\d+, :lo\d+:\.LC\d+
+**	ldr	q\d+, \[x\d+\]
+**	str	q\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+** 	ldr	x\d+, \[sp, \d+\]
+**  	...
+*/
+int main()  /* Caller whose generated assembly is matched by the check-function-bodies pattern above. */
+{
+  float32x4_t x = {1.0, 2.0, 3.0, 4.0};
+  float32x4_t y = {2.0, 3.0, 4.0, 5.0};
+  float32x4_t z = {3.0, 4.0, 5.0, 6.0};
+  float32x4_t w = {4.0, 5.0, 6.0, 7.0};
+
+  accumulate (4, x, y, z, w);  /* Result is discarded. NOTE(review): passes four float32x4_t values while accumulate reads each argument as mat4x4; the test is compile-only (dg-do compile), but confirm this is intended. */
+  return 0;
+}