Implement -fexternal-blas64 option.

author Thomas Koenig <tkoenig@gcc.gnu.org>

Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)

committer Thomas Koenig <tkoenig@gcc.gnu.org>

Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)
author Thomas Koenig <tkoenig@gcc.gnu.org>
Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)
committer Thomas Koenig <tkoenig@gcc.gnu.org>
Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)
diff --git a/gcc/fortran/frontend-passes.cc b/gcc/fortran/frontend-passes.cc

index 4a468b936004732a68479cff9661737bc5f560d7..595c5095eaf960b1b50f9a43000949d254e2386d 100644 (file)
--- a/gcc/fortran/frontend-passes.cc
+++ b/gcc/fortran/frontend-passes.cc
@@ -1481,7 +1481,8 @@ optimize_namespace (gfc_namespace *ns)
        gfc_code_walker (&ns->code, convert_elseif, dummy_expr_callback, NULL);
        gfc_code_walker (&ns->code, cfe_code, cfe_expr_0, NULL);
        gfc_code_walker (&ns->code, optimize_code, optimize_expr, NULL);
-      if (flag_inline_matmul_limit != 0 || flag_external_blas)
+      if (flag_inline_matmul_limit != 0 || flag_external_blas
+         || flag_external_blas64)
         {
           bool found;
           do
@@ -1496,7 +1497,7 @@ optimize_namespace (gfc_namespace *ns)
                            NULL);
         }
  
-      if (flag_external_blas)
+      if (flag_external_blas || flag_external_blas64)
         gfc_code_walker (&ns->code, call_external_blas, dummy_expr_callback,
                          NULL);
  
@@ -4644,6 +4645,7 @@ call_external_blas (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
    enum matrix_case m_case;
    bool realloc_c;
    gfc_code **next_code_point;
+  int arg_kind;
  
    /* Many of the tests for inline matmul also apply here.  */
  
@@ -4929,13 +4931,20 @@ call_external_blas (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
                                        transb, 1);
    actual->next = next;
  
+  if (flag_external_blas)
+    arg_kind = gfc_integer_4_kind;
+  else
+    {
+      gcc_assert (flag_external_blas64);
+      arg_kind = gfc_integer_8_kind;
+    }
+
    c1 = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (a->expr), 1,
-                              gfc_integer_4_kind);
+                              arg_kind);
    c2 = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (b->expr), 2,
-                              gfc_integer_4_kind);
-
+                              arg_kind);
    b1 = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (b->expr), 1,
-                              gfc_integer_4_kind);
+                              arg_kind);
  
    /* Argument M. */
    actual = next;
@@ -4975,7 +4984,7 @@ call_external_blas (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
    actual = next;
    next = gfc_get_actual_arglist ();
    next->expr = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (matrix_a),
-                                      1, gfc_integer_4_kind);
+                                      1, arg_kind);
    actual->next = next;
  
    /* Argument B.  */
@@ -4988,7 +4997,7 @@ call_external_blas (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
    actual = next;
    next = gfc_get_actual_arglist ();
    next->expr = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (matrix_b),
-                                      1, gfc_integer_4_kind);
+                                      1, arg_kind);
    actual->next = next;
  
    /* Argument BETA - set to zero.  */
@@ -5012,7 +5021,7 @@ call_external_blas (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
    actual = next;
    next = gfc_get_actual_arglist ();
    next->expr = get_array_inq_function (GFC_ISYM_SIZE, gfc_copy_expr (expr1),
-                                      1, gfc_integer_4_kind);
+                                      1, arg_kind);
    actual->next = next;
  
    return 0;
diff --git a/gcc/fortran/gfortran.h b/gcc/fortran/gfortran.h

index 2e6b368b4c266049ca1c65baa064bb6767a38362..74fcd1ad9deab1e60176930ab154108ad198eee0 100644 (file)
--- a/gcc/fortran/gfortran.h
+++ b/gcc/fortran/gfortran.h
@@ -3672,6 +3672,8 @@ extern int gfc_character_storage_size;
  #define gfc_integer_4_kind 4
  #define gfc_real_4_kind 4
  
+#define gfc_integer_8_kind 8
+
  /* symbol.cc */
  void gfc_clear_new_implicit (void);
  bool gfc_add_new_implicit_range (int, int);
diff --git a/gcc/fortran/invoke.texi b/gcc/fortran/invoke.texi

index 0b893e876a5d86a47c0f94715a2f02f652f06769..d62ee819997fbcf0ed652c8b58d2a69db0326293 100644 (file)
--- a/gcc/fortran/invoke.texi
+++ b/gcc/fortran/invoke.texi
@@ -189,7 +189,7 @@ and warnings}.
  -fbounds-check -ftail-call-workaround -ftail-call-workaround=@var{n}
  -fcheck-array-temporaries
  -fcheck=<all|array-temps|bits|bounds|do|mem|pointer|recursion>
--fcoarray=<none|single|lib> -fexternal-blas -ff2c
+-fcoarray=<none|single|lib> -fexternal-blas -fexternal-blas64 -ff2c
  -ffrontend-loop-interchange -ffrontend-optimize
  -finit-character=@var{n} -finit-integer=@var{n} -finit-local-zero
  -finit-derived -finit-logical=<true|false>
@@ -2014,13 +2014,26 @@ for some matrix operations like @code{MATMUL}, instead of using our own
  algorithms, if the size of the matrices involved is larger than a given
  limit (see @option{-fblas-matmul-limit}).  This may be profitable if an
  optimized vendor BLAS library is available.  The BLAS library has
-to be specified at link time.
+to be specified at link time.  This option specifies a BLAS library
+with integer arguments of default kind (32 bits). It cannot be used
+together with @option{-fexternal-blas64}.
+
+@opindex fexternal-blas64
+@item -fexternal-blas64
+This option makes @command{gfortran} generate calls to BLAS functions
+for some matrix operations like @code{MATMUL}, instead of using our own
+algorithms, if the size of the matrices involved is larger than a given
+limit (see @option{-fblas-matmul-limit}).  This may be profitable if an
+optimized vendor BLAS library is available.  The BLAS library has
+to be specified at link time.  This option specifies a BLAS library
+with integer arguments of @code{KIND=8} (64 bits). It cannot be used
+together with @option{-fexternal-blas}.
  
  @opindex fblas-matmul-limit
  @item -fblas-matmul-limit=@var{n}
-Only significant when @option{-fexternal-blas} is in effect.
-Matrix multiplication of matrices with size larger than (or equal to) @var{n}
-is performed by calls to BLAS functions, while others are
+Only significant when @option{-fexternal-blas} or @option{-fexternal-blas64}
+is in effect. Matrix multiplication of matrices with size larger than or equal
+to @var{n} is performed by calls to BLAS functions, while others are
  handled by @command{gfortran} internal algorithms. If the matrices
  involved are not square, the size comparison is performed using the
  geometric mean of the dimensions of the argument and result matrices.
diff --git a/gcc/fortran/lang.opt b/gcc/fortran/lang.opt

index 7826a1ab5faea3416fe64b5a3997a4093af56d59..33710d0d920ce9270d97a28b71a01f61aa8de0c5 100644 (file)
--- a/gcc/fortran/lang.opt
+++ b/gcc/fortran/lang.opt
@@ -566,6 +566,10 @@ fexternal-blas
  Fortran Var(flag_external_blas)
  Specify that an external BLAS library should be used for matmul calls on large-size arrays.
  
+fexternal-blas64
+Fortran Var(flag_external_blas64)
+Use an external BLAS library with 64-bit indexing for matmul on large-size arrays.
+
  ff2c
  Fortran Var(flag_f2c)
  Use f2c calling convention.
diff --git a/gcc/fortran/lang.opt.urls b/gcc/fortran/lang.opt.urls

index 4972ff8b7b9b2eb0830aaf333e71609e6cc20284..4a51f5a1be28a20da0011338bbfd6f578fb20d32 100644 (file)
--- a/gcc/fortran/lang.opt.urls
+++ b/gcc/fortran/lang.opt.urls
@@ -295,6 +295,9 @@ LangUrlSuffix_Fortran(gfortran/Developer-Options.html#index-fdump-parse-tree)
  fexternal-blas
  LangUrlSuffix_Fortran(gfortran/Code-Gen-Options.html#index-fexternal-blas)
  
+fexternal-blas64
+LangUrlSuffix_Fortran(gfortran/Code-Gen-Options.html#index-fexternal-blas64)
+
  ff2c
  LangUrlSuffix_Fortran(gfortran/Code-Gen-Options.html#index-ff2c)
  
diff --git a/gcc/fortran/options.cc b/gcc/fortran/options.cc

index 821a8c88bbbb755b8490267065b67fb4f2a8adae..35c1924a9c9b2031497f59069a5870dda9644cec 100644 (file)
--- a/gcc/fortran/options.cc
+++ b/gcc/fortran/options.cc
@@ -504,7 +504,12 @@ gfc_post_options (const char **pfilename)
         flag_inline_matmul_limit = 30;
      }
  
-  /* Optimization implies front end optimization, unless the user
+  /* We can only have a 32-bit or a 64-bit version of BLAS, not both.  */
+
+  if (flag_external_blas && flag_external_blas64)
+    gfc_fatal_error ("32- and 64-bit version of BLAS cannot both be specified");
+
+  /* Optimization implies front end optimization, unless the user
       specified it directly.  */
  
    if (flag_frontend_optimize == -1)
diff --git a/gcc/testsuite/gfortran.dg/matmul_blas_3.f90 b/gcc/testsuite/gfortran.dg/matmul_blas_3.f90

new file mode 100644 (file)

index 0000000..d496596
--- /dev/null
+++ b/gcc/testsuite/gfortran.dg/matmul_blas_3.f90
@@ -0,0 +1,12 @@
+! { dg-do compile }
+! { dg-options "-ffrontend-optimize -fexternal-blas64 -fdump-tree-original" }
+! PR 121161 - option for 64-bit BLAS for MATMUL.
+! Check this by making sure there is no KIND=4 integer.
+subroutine foo(a,b,c,n)
+  implicit none
+  integer(kind=8) :: n
+  real, dimension(n,n) :: a, b, c
+  c = matmul(a,b)
+end subroutine foo
+! { dg-final { scan-tree-dump-not "integer\\(kind=4\\)" "original" } }
+! { dg-final { scan-tree-dump-times "sgemm" 1 "original" } }
author	Thomas Koenig <tkoenig@gcc.gnu.org>
	Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)
committer	Thomas Koenig <tkoenig@gcc.gnu.org>
	Wed, 17 Sep 2025 16:50:22 +0000 (18:50 +0200)
gcc/fortran/frontend-passes.cc		patch \| blob \| blame \| history
gcc/fortran/gfortran.h		patch \| blob \| blame \| history
gcc/fortran/invoke.texi		patch \| blob \| blame \| history
gcc/fortran/lang.opt		patch \| blob \| blame \| history
gcc/fortran/lang.opt.urls		patch \| blob \| blame \| history
gcc/fortran/options.cc		patch \| blob \| blame \| history
gcc/testsuite/gfortran.dg/matmul_blas_3.f90	[new file with mode: 0644]	patch \| blob