git.ipfire.org Git - thirdparty/gcc.git/commitdiff
amdgcn: add fmin/fmax patterns
author: Andrew Stubbs <ams@codesourcery.com>
Fri, 28 Oct 2022 12:09:20 +0000 (13:09 +0100)
committer: Andrew Stubbs <ams@codesourcery.com>
Mon, 31 Oct 2022 12:20:53 +0000 (12:20 +0000)
Add fmin/fmax for scalar, vector, and reductions.  The smin/smax patterns are
already using the IEEE compliant hardware instructions anyway, so we can just
expand to use those insns.

gcc/ChangeLog:

* config/gcn/gcn-valu.md (fminmaxop): New iterator.
(<fexpander><mode>3): New define_expand.
(<fexpander><mode>3<exec>): Likewise.
(reduc_<fexpander>_scal_<mode>): Likewise.
* config/gcn/gcn.md (fexpander): New attribute.

gcc/config/gcn/gcn-valu.md
gcc/config/gcn/gcn.md

index 6274d2e922802b3ee912e6355a7f703cc96c7a87..3b619512e13fbbb078795c6467ee002bf9f3b4b8 100644 (file)
   [(set_attr "type" "vop2")
    (set_attr "length" "8,8")])
 
+;; Code iterator over the two RTL codes smin and smax; a pattern written
+;; with fminmaxop is instantiated once for each of them.
+(define_code_iterator fminmaxop [smin smax])
+;; Scalar expander over the FP mode iterator and the fminmaxop code
+;; iterator; the pattern name is built from the fexpander code attribute.
+;; The preparation block is empty, so the expansion is just the RTL
+;; template below: the fminmaxop code applied to operands 1 and 2, with
+;; the result set into operand 0.
+(define_expand "<fexpander><mode>3"
+  [(set (match_operand:FP 0 "gcn_valu_dst_operand")
+       (fminmaxop:FP
+         (match_operand:FP 1 "gcn_valu_src0_operand")
+         (match_operand:FP 2 "gcn_valu_src1_operand")))]
+  ""
+  {})
+
+;; Vector expander over the V_FP mode iterator and the fminmaxop code
+;; iterator; the pattern name is built from the fexpander code attribute
+;; plus the <exec> suffix.  The preparation block is empty, so the
+;; expansion is just the RTL template below.
+;; NOTE(review): <exec> is defined outside this excerpt; presumably it
+;; also generates an exec-masked variant of the pattern -- confirm.
+(define_expand "<fexpander><mode>3<exec>"
+  [(set (match_operand:V_FP 0 "gcn_valu_dst_operand")
+       (fminmaxop:V_FP
+         (match_operand:V_FP 1 "gcn_valu_src0_operand")
+         (match_operand:V_FP 2 "gcn_valu_src1_operand")))]
+  ""
+  {})
+
 ;; }}}
 ;; {{{ FP unops
 
     DONE;
   })
 
+;; Reduction expander over the V_FP modes, named via the fexpander code
+;; attribute.  Operand 0 is a register in the vector mode's <SCALAR_MODE>
+;; and operand 1 is the V_FP input register.  The body forwards both
+;; operands unchanged to the reduc_<expander>_scal_<mode> generator and
+;; emits nothing else.
+(define_expand "reduc_<fexpander>_scal_<mode>"
+  [(match_operand:<SCALAR_MODE> 0 "register_operand")
+   (fminmaxop:V_FP
+     (match_operand:V_FP 1 "register_operand"))]
+  ""
+  {
+    /* fmin/fmax are identical to smin/smax.  */
+    emit_insn (gen_reduc_<expander>_scal_<mode> (operands[0], operands[1]));
+    DONE;
+  })
+
 ;; Warning: This "-ffast-math" implementation converts in-order reductions
 ;;          into associative reductions. It's also used where OpenMP or
 ;;          OpenACC parallelization has already broken the in-order semantics.
index 6c1a438f9d1a0b82191f92bf49fd66d1b7f2a4dd..987b76396cc110fe1cbe8a695fdc1f84ef5216c7 100644 (file)
    (sign_extend "extend")
    (zero_extend "zero_extend")])
 
+;; Code attribute giving the name fragment substituted for <fexpander> in
+;; pattern names: "fmin" for the smin code and "fmax" for the smax code.
+(define_code_attr fexpander
+  [(smin "fmin")
+   (smax "fmax")])
+
 ;; }}}
 ;; {{{ Miscellaneous instructions