]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
i386: vcvtph2ps and vcvtps2ph should be used to convert _Float16 to SFmode with ...
authorkonglin1 <lingling.kong@intel.com>
Wed, 10 Nov 2021 01:37:32 +0000 (09:37 +0800)
committerliuhongt <hongtao.liu@intel.com>
Fri, 26 Nov 2021 01:29:10 +0000 (09:29 +0800)
Add define_insn extendhfsf2 and truncsfhf2 for target_f16c.

gcc/ChangeLog:

PR target/102811
* config/i386/i386.c (ix86_can_change_mode_class): Allow 16 bit data in XMM register
for TARGET_SSE2.
* config/i386/i386.md (extendhfsf2): Add extenndhfsf2 for TARGET_F16C.
(extendhfdf2): Restrict extendhfdf for TARGET_AVX512FP16 only.
(*extendhf<mode>2): Rename from extendhf<mode>2.
(truncsfhf2): Likewise.
(truncdfhf2): Likewise.
(*trunc<mode>2): Likewise.

gcc/testsuite/ChangeLog:

PR target/102811
* gcc.target/i386/pr90773-21.c: Allow pextrw instead of movw.
* gcc.target/i386/pr90773-23.c: Ditto.
* gcc.target/i386/avx512vl-vcvtps2ph-pr102811.c: New test.

gcc/config/i386/i386.c
gcc/config/i386/i386.md
gcc/testsuite/gcc.target/i386/avx512vl-vcvtps2ph-pr102811.c [new file with mode: 0644]
gcc/testsuite/gcc.target/i386/pr90773-21.c
gcc/testsuite/gcc.target/i386/pr90773-23.c

index 10bfa0e74595e8e31f7e293e172b191a06c26611..3dedf522c42adc5071ec8a2aab51635b6d8f5cb2 100644 (file)
@@ -19522,9 +19522,8 @@ ix86_can_change_mode_class (machine_mode from, machine_mode to,
         disallow a change to these modes, reload will assume it's ok to
         drop the subreg from (subreg:SI (reg:HI 100) 0).  This affects
         the vec_dupv4hi pattern.
-        NB: AVX512FP16 supports vmovw which can load 16bit data to sse
-        register.  */
-      int mov_size = MAYBE_SSE_CLASS_P (regclass) && TARGET_AVX512FP16 ? 2 : 4;
+        NB: SSE2 can load 16bit data to sse register via pinsrw.  */
+      int mov_size = MAYBE_SSE_CLASS_P (regclass) && TARGET_SSE2 ? 2 : 4;
       if (GET_MODE_SIZE (from) < mov_size)
        return false;
     }
index 03d401efff8d885c8c7dbd3533df50655a8c14c8..68606e57e6092079058048121ba8ad7f136eb15a 100644 (file)
     case TYPE_SSEMOV:
       return ix86_output_ssemov (insn, operands);
 
+    case TYPE_SSELOG:
+      if (SSE_REG_P (operands[0]))
+       return MEM_P (operands[1])
+         ? "pinsrw\t{$0, %1, %0|%0, %1, 0}"
+         : "pinsrw\t{$0, %k1, %0|%0, %k1, 0}";
+      else
+       return MEM_P (operands[1])
+         ? "pextrw\t{$0, %1, %0|%0, %1, 0}"
+         : "pextrw\t{$0, %1, %k0|%k0, %k1, 0}";
+
     case TYPE_MSKLOG:
       if (operands[1] == const0_rtx)
        return "kxorw\t%0, %0, %0";
     }
 }
   [(set (attr "isa")
-       (cond [(eq_attr "alternative" "9,10,11,12,13")
-                 (const_string "avx512fp16")
+       (cond [(eq_attr "alternative" "9,10,11,12")
+                 (const_string "sse2")
+              (eq_attr "alternative" "13")
+                 (const_string "sse4")
               ]
               (const_string "*")))
    (set (attr "type")
      (cond [(eq_attr "alternative" "9,10,11,12,13")
-             (const_string "ssemov")
+             (if_then_else (match_test "TARGET_AVX512FP16")
+               (const_string "ssemov")
+               (const_string "sselog"))
            (eq_attr "alternative" "4,5,6,7")
              (const_string "mskmov")
            (eq_attr "alternative" "8")
   emit_move_insn (operands[0], CONST0_RTX (V2DFmode));
 })
 
-(define_insn "extendhf<mode>2"
-  [(set (match_operand:MODEF 0 "nonimm_ssenomem_operand" "=v")
+(define_expand "extendhfsf2"
+  [(set (match_operand:SF 0 "register_operand")
+       (float_extend:SF
+         (match_operand:HF 1 "nonimmediate_operand")))]
+  "TARGET_AVX512FP16 || TARGET_F16C || TARGET_AVX512VL"
+{
+  if (!TARGET_AVX512FP16)
+    {
+      rtx res = gen_reg_rtx (V4SFmode);
+      rtx tmp = force_reg (V8HFmode, CONST0_RTX (V8HFmode));
+
+      ix86_expand_vector_set (false, tmp, operands[1], 0);
+      emit_insn (gen_vcvtph2ps (res, gen_lowpart (V8HImode, tmp)));
+      emit_move_insn (operands[0], gen_lowpart (SFmode, res));
+      DONE;
+    }
+})
+
+(define_expand "extendhfdf2"
+  [(set (match_operand:DF 0 "register_operand")
+       (float_extend:DF
+         (match_operand:HF 1 "nonimmediate_operand")))]
+  "TARGET_AVX512FP16")
+
+(define_insn "*extendhf<mode>2"
+  [(set (match_operand:MODEF 0 "register_operand" "=v")
         (float_extend:MODEF
          (match_operand:HF 1 "nonimmediate_operand" "vm")))]
   "TARGET_AVX512FP16"
 
 ;; Conversion from {SF,DF}mode to HFmode.
 
-(define_insn "trunc<mode>hf2"
+(define_expand "truncsfhf2"
+  [(set (match_operand:HF 0 "register_operand")
+       (float_truncate:HF
+         (match_operand:SF 1 "nonimmediate_operand")))]
+  "TARGET_AVX512FP16 || TARGET_F16C || TARGET_AVX512VL"
+  {
+    if (!TARGET_AVX512FP16)
+    {
+      rtx res = gen_reg_rtx (V8HFmode);
+      rtx tmp = force_reg (V4SFmode, CONST0_RTX (V4SFmode));
+
+      ix86_expand_vector_set (false, tmp, operands[1], 0);
+      emit_insn (gen_vcvtps2ph (gen_lowpart (V8HImode, res), tmp, GEN_INT (4)));
+      emit_move_insn (operands[0], gen_lowpart (HFmode, res));
+      DONE;
+    }
+  })
+
+(define_expand "truncdfhf2"
+  [(set (match_operand:HF 0 "register_operand")
+       (float_truncate:HF
+         (match_operand:DF 1 "nonimmediate_operand")))]
+  "TARGET_AVX512FP16")
+
+(define_insn "*trunc<mode>hf2"
   [(set (match_operand:HF 0 "register_operand" "=v")
        (float_truncate:HF
          (match_operand:MODEF 1 "nonimmediate_operand" "vm")))]
diff --git a/gcc/testsuite/gcc.target/i386/avx512vl-vcvtps2ph-pr102811.c b/gcc/testsuite/gcc.target/i386/avx512vl-vcvtps2ph-pr102811.c
new file mode 100644 (file)
index 0000000..dfbfb16
--- /dev/null
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -mf16c -mno-avx512fp16" } */
+/* { dg-final { scan-assembler-times "vpxor\[ \\t\]" 2 } } */
+/* { dg-final { scan-assembler-times "vcvtph2ps\[ \\t\]" 2 } } */
+/* { dg-final { scan-assembler-times "vcvtps2ph\[ \\t\]" 1 } } */
+/* { dg-final { scan-assembler-not "__truncsfhf2\[ \\t\]"} } */
+/* { dg-final { scan-assembler-not "__extendhfsf2\[ \\t\]"} } */
+_Float16 test (_Float16 a, _Float16 b)
+{
+  return a + b;
+}
index 5bbb387a3ea692d2a39fde843c3a61180753011f..0d620fff83c3eaa8aac311f351b1218151a050f0 100644 (file)
@@ -10,4 +10,4 @@ foo (int c)
 }
 
 /* { dg-final { scan-assembler-times "vmovdqu\[\\t \]%ymm\[0-9\]+, \\(%\[\^,\]+\\)" 1 } } */
-/* { dg-final { scan-assembler-times "movw\[\\t \]%.*, 32\\(%\[\^,\]+\\)" 1 } } */
+/* { dg-final { scan-assembler-times "(?:movw|pextrw)\[\\t \].*, 32\\(%\[\^,\]+\\)" 1 } } */
index ca4a86f30b854adf69a92294a0f50e645a351e31..b7369e802e10ded1da60ba7c5048aaf95b485fe3 100644 (file)
@@ -10,4 +10,4 @@ foo (void)
 }
 
 /* { dg-final { scan-assembler-times "vmovdqu\[\\t \]%ymm\[0-9\]+, \\(%\[\^,\]+\\)" 1 } } */
-/* { dg-final { scan-assembler-times "movw\[\\t \]+.+, 32\\(%\[\^,\]+\\)" 1 } } */
+/* { dg-final { scan-assembler-times "(?:movw|pextrw)\[\\t \]+.+, 32\\(%\[\^,\]+\\)" 1 } } */