re PR libfortran/78379 (Processor-specific versions for matmul)

[thirdparty/gcc.git] / libgfortran / generated / matmul_r16.c
diff --git a/libgfortran/generated/matmul_r16.c b/libgfortran/generated/matmul_r16.c

index be3e8fd217f88cd8578e3406a0d1d2a1909a2a1b..73e7c9877adf09c4ff13f593aa44e0c478266f49 100644 (file)
--- a/libgfortran/generated/matmul_r16.c
+++ b/libgfortran/generated/matmul_r16.c
@@ -74,13 +74,6 @@ extern void matmul_r16 (gfc_array_r16 * const restrict retarray,
         int blas_limit, blas_call gemm);
  export_proto(matmul_r16);
  
-#if defined(HAVE_AVX) && defined(HAVE_AVX2)
-/* REAL types generate identical code for AVX and AVX2.  Only generate
-   an AVX2 function if we are dealing with integer.  */
-#undef HAVE_AVX2
-#endif
-
-
  /* Put exhaustive list of possible architectures here here, ORed together.  */
  
  #if defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_AVX512F)
@@ -632,7 +625,7 @@ matmul_r16_avx (gfc_array_r16 * const restrict retarray,
  static void
  matmul_r16_avx2 (gfc_array_r16 * const restrict retarray, 
         gfc_array_r16 * const restrict a, gfc_array_r16 * const restrict b, int try_blas,
-       int blas_limit, blas_call gemm) __attribute__((__target__("avx2")));
+       int blas_limit, blas_call gemm) __attribute__((__target__("avx2,fma")));
  static void
  matmul_r16_avx2 (gfc_array_r16 * const restrict retarray, 
         gfc_array_r16 * const restrict a, gfc_array_r16 * const restrict b, int try_blas,
@@ -2281,7 +2274,8 @@ void matmul_r16 (gfc_array_r16 * const restrict retarray,
  #endif  /* HAVE_AVX512F */
  
  #ifdef HAVE_AVX2
-         if (__cpu_model.__cpu_features[0] & (1 << FEATURE_AVX2))
+         if ((__cpu_model.__cpu_features[0] & (1 << FEATURE_AVX2))
+            && (__cpu_model.__cpu_features[0] & (1 << FEATURE_FMA)))
             {
               matmul_p = matmul_r16_avx2;
               goto tailcall;