Support vec_fmaddsub/vec_fmsubadd for vector HFmode.

author liuhongt <hongtao.liu@intel.com>

Mon, 31 Jul 2023 08:03:45 +0000 (16:03 +0800)

committer liuhongt <hongtao.liu@intel.com>

Wed, 2 Aug 2023 06:50:03 +0000 (14:50 +0800)
author liuhongt <hongtao.liu@intel.com>
Mon, 31 Jul 2023 08:03:45 +0000 (16:03 +0800)
committer liuhongt <hongtao.liu@intel.com>
Wed, 2 Aug 2023 06:50:03 +0000 (14:50 +0800)
diff --git a/gcc/config/i386/sse.md b/gcc/config/i386/sse.md
index 8dea05703569f893d955ac9c2799e7eb3d405cc2..43afcfdc7502a76b8b939d0af72541b0cc6c17fc 100644
--- a/gcc/config/i386/sse.md
+++ b/gcc/config/i386/sse.md
@@ -5803,21 +5803,21 @@
  ;; But this doesn't seem useful in practice.
  
  (define_expand "vec_fmaddsub<mode>4"
-  [(set (match_operand:VF 0 "register_operand")
-       (unspec:VF
-         [(match_operand:VF 1 "nonimmediate_operand")
-          (match_operand:VF 2 "nonimmediate_operand")
-          (match_operand:VF 3 "nonimmediate_operand")]
+  [(set (match_operand:VFH 0 "register_operand")
+       (unspec:VFH
+         [(match_operand:VFH 1 "nonimmediate_operand")
+          (match_operand:VFH 2 "nonimmediate_operand")
+          (match_operand:VFH 3 "nonimmediate_operand")]
           UNSPEC_FMADDSUB))]
    "TARGET_FMA || TARGET_FMA4 || (<MODE_SIZE> == 64 || TARGET_AVX512VL)")
  
  (define_expand "vec_fmsubadd<mode>4"
-  [(set (match_operand:VF 0 "register_operand")
-       (unspec:VF
-         [(match_operand:VF 1 "nonimmediate_operand")
-          (match_operand:VF 2 "nonimmediate_operand")
-          (neg:VF
-            (match_operand:VF 3 "nonimmediate_operand"))]
+  [(set (match_operand:VFH 0 "register_operand")
+       (unspec:VFH
+         [(match_operand:VFH 1 "nonimmediate_operand")
+          (match_operand:VFH 2 "nonimmediate_operand")
+          (neg:VFH
+            (match_operand:VFH 3 "nonimmediate_operand"))]
           UNSPEC_FMADDSUB))]
    "TARGET_FMA || TARGET_FMA4 || (<MODE_SIZE> == 64 || TARGET_AVX512VL)")
  
@@ -5877,11 +5877,11 @@
     (set_attr "mode" "<MODE>")])
  
  (define_insn "<sd_mask_codefor>fma_fmaddsub_<mode><sd_maskz_name><round_name>"
-  [(set (match_operand:VFH_SF_AVX512VL 0 "register_operand" "=v,v,v")
-       (unspec:VFH_SF_AVX512VL
-         [(match_operand:VFH_SF_AVX512VL 1 "<round_nimm_predicate>" "%0,0,v")
-          (match_operand:VFH_SF_AVX512VL 2 "<round_nimm_predicate>" "<round_constraint>,v,<round_constraint>")
-          (match_operand:VFH_SF_AVX512VL 3 "<round_nimm_predicate>" "v,<round_constraint>,0")]
+  [(set (match_operand:VFH_AVX512VL 0 "register_operand" "=v,v,v")
+       (unspec:VFH_AVX512VL
+         [(match_operand:VFH_AVX512VL 1 "<round_nimm_predicate>" "%0,0,v")
+          (match_operand:VFH_AVX512VL 2 "<round_nimm_predicate>" "<round_constraint>,v,<round_constraint>")
+          (match_operand:VFH_AVX512VL 3 "<round_nimm_predicate>" "v,<round_constraint>,0")]
           UNSPEC_FMADDSUB))]
    "TARGET_AVX512F && <sd_mask_mode512bit_condition> && <round_mode512bit_condition>"
    "@
@@ -5943,12 +5943,12 @@
     (set_attr "mode" "<MODE>")])
  
  (define_insn "<sd_mask_codefor>fma_fmsubadd_<mode><sd_maskz_name><round_name>"
-  [(set (match_operand:VFH_SF_AVX512VL 0 "register_operand" "=v,v,v")
-       (unspec:VFH_SF_AVX512VL
-         [(match_operand:VFH_SF_AVX512VL   1 "<round_nimm_predicate>" "%0,0,v")
-          (match_operand:VFH_SF_AVX512VL   2 "<round_nimm_predicate>" "<round_constraint>,v,<round_constraint>")
-          (neg:VFH_SF_AVX512VL
-            (match_operand:VFH_SF_AVX512VL 3 "<round_nimm_predicate>" "v,<round_constraint>,0"))]
+  [(set (match_operand:VFH_AVX512VL 0 "register_operand" "=v,v,v")
+       (unspec:VFH_AVX512VL
+         [(match_operand:VFH_AVX512VL   1 "<round_nimm_predicate>" "%0,0,v")
+          (match_operand:VFH_AVX512VL   2 "<round_nimm_predicate>" "<round_constraint>,v,<round_constraint>")
+          (neg:VFH_AVX512VL
+            (match_operand:VFH_AVX512VL 3 "<round_nimm_predicate>" "v,<round_constraint>,0"))]
           UNSPEC_FMADDSUB))]
    "TARGET_AVX512F && <sd_mask_mode512bit_condition> && <round_mode512bit_condition>"
    "@
diff --git a/gcc/testsuite/gcc.target/i386/pr81904.c b/gcc/testsuite/gcc.target/i386/pr81904.c
new file mode 100644
index 0000000..9f5ad0b
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr81904.c
@@ -0,0 +1,22 @@
+/* { dg-do compile } */
+/* { dg-options "-mavx512fp16 -mavx512vl -O2 -mprefer-vector-width=512" } */
+/* { dg-final { scan-assembler-times "vfmaddsub...ph\[ \t\]+\[^\n\]*%zmm\[0-9\]" 1 } } */
+/* { dg-final { scan-assembler-times "vfmsubadd...ph\[ \t\]+\[^\n\]*%zmm\[0-9\]" 1 } } */
+
+void vec_fmaddsub_fp16(int n, _Float16 da_r, _Float16 *x, _Float16* y, _Float16* __restrict z)
+{
+  for (int i = 0; i < 32; i += 2)
+    {
+      z[i] =  da_r * x[i] - y[i];
+      z[i+1]  =  da_r * x[i+1] + y[i+1];
+    }
+}
+
+void vec_fmasubadd_fp16(int n, _Float16 da_r, _Float16 *x, _Float16* y, _Float16* __restrict z)
+{
+  for (int i = 0; i < 32; i += 2)
+    {
+      z[i] =  da_r * x[i] + y[i];
+      z[i+1]  =  da_r * x[i+1] - y[i+1];
+    }
+}
author	liuhongt <hongtao.liu@intel.com>
	Mon, 31 Jul 2023 08:03:45 +0000 (16:03 +0800)
committer	liuhongt <hongtao.liu@intel.com>
	Wed, 2 Aug 2023 06:50:03 +0000 (14:50 +0800)
gcc/config/i386/sse.md		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/i386/pr81904.c	[new file with mode: 0644]	patch \| blob