Update copyright years.

[thirdparty/gcc.git] / gcc / config / arm / cortex-a7.md
diff --git a/gcc/config/arm/cortex-a7.md b/gcc/config/arm/cortex-a7.md

index a8d4432e508b64f31a1c63e06035087bdd7dfb8a..8f326d7727a650369afa4a1ba97e45b2c1678031 100644 (file)
--- a/gcc/config/arm/cortex-a7.md
+++ b/gcc/config/arm/cortex-a7.md
@@ -1,5 +1,5 @@
  ;; ARM Cortex-A7 pipeline description
-;; Copyright (C) 2012-2013 Free Software Foundation, Inc.
+;; Copyright (C) 2012-2024 Free Software Foundation, Inc.
  ;;
  ;; Contributed by ARM Ltd.
  ;; Based on cortex-a5.md which was originally contributed by CodeSourcery.
@@ -20,6 +20,45 @@
  ;; along with GCC; see the file COPYING3.  If not see
  ;; <http://www.gnu.org/licenses/>.
  
+(define_attr "cortex_a7_neon_type"
+  "neon_mul, neon_mla, neon_other"
+  (cond [
+          (eq_attr "type" "neon_mul_b, neon_mul_b_q,\
+                          neon_mul_h, neon_mul_h_q,\
+                          neon_mul_s, neon_mul_s_q,\
+                          neon_mul_b_long, neon_mul_h_long,\
+                          neon_mul_s_long, neon_mul_h_scalar,\
+                          neon_mul_h_scalar_q, neon_mul_s_scalar,\
+                          neon_mul_s_scalar_q, neon_mul_h_scalar_long,\
+                          neon_mul_s_scalar_long,\
+                          neon_sat_mul_b, neon_sat_mul_b_q,\
+                          neon_sat_mul_h, neon_sat_mul_h_q,\
+                          neon_sat_mul_s, neon_sat_mul_s_q,\
+                          neon_sat_mul_b_long, neon_sat_mul_h_long,\
+                          neon_sat_mul_s_long,\
+                          neon_sat_mul_h_scalar, neon_sat_mul_h_scalar_q,\
+                          neon_sat_mul_s_scalar, neon_sat_mul_s_scalar_q,\
+                          neon_sat_mul_h_scalar_long,\
+                          neon_sat_mul_s_scalar_long,\
+                          neon_fp_mul_s, neon_fp_mul_s_q,\
+                          neon_fp_mul_s_scalar, neon_fp_mul_s_scalar_q")
+             (const_string "neon_mul")
+          (eq_attr "type" "neon_mla_b, neon_mla_b_q, neon_mla_h,\
+                          neon_mla_h_q, neon_mla_s, neon_mla_s_q,\
+                          neon_mla_b_long, neon_mla_h_long,\
+                           neon_mla_s_long,\
+                          neon_mla_h_scalar, neon_mla_h_scalar_q,\
+                          neon_mla_s_scalar, neon_mla_s_scalar_q,\
+                          neon_mla_h_scalar_long, neon_mla_s_scalar_long,\
+                          neon_sat_mla_b_long, neon_sat_mla_h_long,\
+                          neon_sat_mla_s_long,\
+                          neon_sat_mla_h_scalar_long,\
+                           neon_sat_mla_s_scalar_long,\
+                          neon_fp_mla_s, neon_fp_mla_s_q,\
+                          neon_fp_mla_s_scalar, neon_fp_mla_s_scalar_q")
+             (const_string "neon_mla")]
+           (const_string "neon_other")))
+
  (define_automaton "cortex_a7")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -57,15 +96,6 @@
  
  (define_cpu_unit "cortex_a7_fp_div_sqrt" "cortex_a7")
  
-;; Neon pipeline
-(define_cpu_unit "cortex_a7_neon" "cortex_a7")
-
-(define_reservation "cortex_a7_all" "cortex_a7_both+\
-                                     cortex_a7_fpmul_pipe+\
-                                     cortex_a7_fpadd_pipe+\
-                                     cortex_a7_fp_div_sqrt+\
-                                     cortex_a7_neon")
-
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  ;; Branches.
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -76,16 +106,17 @@
  
  (define_insn_reservation "cortex_a7_branch" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "branch")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "branch"))
    "(cortex_a7_ex2|cortex_a7_ex1)+cortex_a7_branch")
  
-;; A call reserves all issue slots. The result is available the next cycle.
+;; A call cannot dual-issue as the older instruction of a pair.  It can
+;; dual-issue as the younger instruction, or single-issue.  A call cannot
+;; dual-issue with another branch instruction.  The result is available
+;; the next cycle.
  (define_insn_reservation "cortex_a7_call" 1
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "call")
-            (eq_attr "neon_type" "none")))
-  "cortex_a7_all")
+       (eq_attr "type" "call"))
+  "(cortex_a7_ex2|cortex_a7_both)+cortex_a7_branch")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  ;; ALU instructions.
@@ -94,36 +125,42 @@
  ;; ALU instruction with an immediate operand can dual-issue.
  (define_insn_reservation "cortex_a7_alu_imm" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (ior (eq_attr "type" "simple_alu_imm")
-                 (ior (eq_attr "type" "simple_alu_shift")
-                      (and (eq_attr "insn" "mov")
-                           (not (eq_attr "length" "8")))))
-            (eq_attr "neon_type" "none")))
+       (ior (eq_attr "type" "adr,alu_imm,alus_imm,logic_imm,logics_imm,\
+                             mov_imm,mvn_imm,extend")
+            (and (eq_attr "type" "mov_reg,mov_shift,mov_shift_reg")
+                 (not (eq_attr "length" "8")))))
    "cortex_a7_ex2|cortex_a7_ex1")
  
  ;; ALU instruction with register operands can dual-issue
  ;; with a younger immediate-based instruction.
-(define_insn_reservation "cortex_a7_alu_reg" 2
+(define_insn_reservation "cortex_a7_alu_sreg" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "alu_reg")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "alu_sreg,alus_sreg,logic_reg,logics_reg,\
+                        adc_imm,adcs_imm,adc_reg,adcs_reg,\
+                        bfm,clz,rbit,rev,alu_dsp_reg,\
+                        shift_imm,shift_reg,mov_reg,mvn_reg"))
    "cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_alu_shift" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "alu_shift,alu_shift_reg")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "alu_shift_imm_lsl_1to4,alu_shift_imm_other,alus_shift_imm,\
+                        logic_shift_imm,logics_shift_imm,\
+                        alu_shift_reg,alus_shift_reg,\
+                        logic_shift_reg,logics_shift_reg,\
+                        mov_shift,mov_shift_reg,\
+                        mvn_shift,mvn_shift_reg,\
+                        mrs,multiple"))
    "cortex_a7_ex1")
  
  ;; Forwarding path for unshifted operands.
-(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_reg,cortex_a7_alu_shift"
-  "cortex_a7_alu_imm,cortex_a7_alu_reg,cortex_a7_mul")
+(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_sreg,cortex_a7_alu_shift"
+  "cortex_a7_alu_imm,cortex_a7_alu_sreg,cortex_a7_mul")
  
-(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_reg,cortex_a7_alu_shift"
+(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_sreg,cortex_a7_alu_shift"
    "cortex_a7_store*"
    "arm_no_early_store_addr_dep")
  
-(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_reg,cortex_a7_alu_shift"
+(define_bypass 1 "cortex_a7_alu_imm,cortex_a7_alu_sreg,cortex_a7_alu_shift"
    "cortex_a7_alu_shift"
    "arm_no_early_alu_shift_dep")
  
@@ -133,8 +170,8 @@
  
  (define_insn_reservation "cortex_a7_mul" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "mult")
-            (eq_attr "neon_type" "none")))
+       (ior (eq_attr "mul32" "yes")
+           (eq_attr "widen_mul64" "yes")))
    "cortex_a7_both")
  
  ;; Forward the result of a multiply operation to the accumulator 
@@ -146,8 +183,8 @@
  ;; The latency depends on the operands, so we use an estimate here.
  (define_insn_reservation "cortex_a7_idiv" 5
    (and (eq_attr "tune" "cortexa7")
-       (eq_attr "insn" "udiv,sdiv"))
-  "cortex_a7_all*5")
+       (eq_attr "type" "udiv,sdiv"))
+  "cortex_a7_both*5")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  ;; Load/store instructions.
@@ -159,50 +196,42 @@
  
  (define_insn_reservation "cortex_a7_load1" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "load_byte,load1")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "load_byte,load_4"))
    "cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_store1" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "store1")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "store_4"))
    "cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_load2" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "load2")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "load_8"))
    "cortex_a7_both")
  
  (define_insn_reservation "cortex_a7_store2" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "store2")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "store_8"))
    "cortex_a7_both")
  
  (define_insn_reservation "cortex_a7_load3" 3
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "load3")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "load_12"))
    "cortex_a7_both, cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_store3" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "store4")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "store_16"))
    "cortex_a7_both, cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_load4" 3
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "load4")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "load_16"))
    "cortex_a7_both, cortex_a7_both")
  
  (define_insn_reservation "cortex_a7_store4" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "store3")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "store_12"))
    "cortex_a7_both, cortex_a7_both")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -214,9 +243,8 @@
  
  (define_insn_reservation "cortex_a7_fpalu" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "ffariths, fadds, ffarithd, faddd, fcpys,\
-                             f_cvt, fcmps, fcmpd")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "ffariths, fadds, ffarithd, faddd, fmov,\
+                        f_cvt, f_cvtf2i, f_cvti2f, fcmps, fcmpd"))
    "cortex_a7_ex1+cortex_a7_fpadd_pipe")
  
  ;; For fconsts and fconstd, 8-bit immediate data is passed directly from
@@ -224,8 +252,7 @@
  
  (define_insn_reservation "cortex_a7_fconst" 3
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fconsts,fconstd")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fconsts,fconstd"))
    "cortex_a7_ex1+cortex_a7_fpadd_pipe")
  
  ;; We should try not to attempt to issue a single-precision multiplication in
@@ -234,40 +261,22 @@
  
  (define_insn_reservation "cortex_a7_fpmuls" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fmuls")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fmuls"))
    "cortex_a7_ex1+cortex_a7_fpmul_pipe")
  
  (define_insn_reservation "cortex_a7_neon_mul" 4
    (and (eq_attr "tune" "cortexa7")
-       (eq_attr "neon_type"
-                "neon_mul_ddd_8_16_qdd_16_8_long_32_16_long,\
-                 neon_mul_qqq_8_16_32_ddd_32,\
-                 neon_mul_qdd_64_32_long_qqd_16_ddd_32_scalar_64_32_long_scalar,\
-                 neon_mul_ddd_16_scalar_32_16_long_scalar,\
-                 neon_mul_qqd_32_scalar,\
-                 neon_fp_vmul_ddd,\
-                 neon_fp_vmul_qqd"))
+       (eq_attr "cortex_a7_neon_type" "neon_mul"))
    "(cortex_a7_both+cortex_a7_fpmul_pipe)*2")
  
  (define_insn_reservation "cortex_a7_fpmacs" 8
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fmacs,ffmas")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fmacs,ffmas"))
    "cortex_a7_ex1+cortex_a7_fpmul_pipe")
  
  (define_insn_reservation "cortex_a7_neon_mla" 8
    (and (eq_attr "tune" "cortexa7")
-       (eq_attr "neon_type"
-                "neon_mla_ddd_8_16_qdd_16_8_long_32_16_long,\
-                 neon_mla_qqq_8_16,\
-                 neon_mla_ddd_32_qqd_16_ddd_32_scalar_qdd_64_32_long_scalar_qdd_64_32_long,\
-                 neon_mla_qqq_32_qqd_32_scalar,\
-                 neon_mla_ddd_16_scalar_qdd_32_16_long_scalar,\
-                 neon_fp_vmla_ddd,\
-                 neon_fp_vmla_qqq,\
-                 neon_fp_vmla_ddd_scalar,\
-                 neon_fp_vmla_qqq_scalar"))
+       (eq_attr "cortex_a7_neon_type" "neon_mla"))
    "cortex_a7_both+cortex_a7_fpmul_pipe")
  
  (define_bypass 4 "cortex_a7_fpmacs,cortex_a7_neon_mla"
@@ -279,20 +288,17 @@
  
  (define_insn_reservation "cortex_a7_fpmuld" 7
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fmuld")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fmuld"))
    "cortex_a7_ex1+cortex_a7_fpmul_pipe, cortex_a7_fpmul_pipe*3")
  
  (define_insn_reservation "cortex_a7_fpmacd" 11
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fmacd")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fmacd"))
    "cortex_a7_ex1+cortex_a7_fpmul_pipe, cortex_a7_fpmul_pipe*3")
  
  (define_insn_reservation "cortex_a7_fpfmad" 8
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "ffmad")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "ffmad"))
    "cortex_a7_ex1+cortex_a7_fpmul_pipe, cortex_a7_fpmul_pipe*4")
  
  (define_bypass 7 "cortex_a7_fpmacd"
@@ -305,14 +311,12 @@
  
  (define_insn_reservation "cortex_a7_fdivs" 16
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fdivs")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fdivs, fsqrts"))
    "cortex_a7_ex1+cortex_a7_fp_div_sqrt, cortex_a7_fp_div_sqrt * 13")
  
  (define_insn_reservation "cortex_a7_fdivd" 31
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "fdivd")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "fdivd, fsqrtd"))
    "cortex_a7_ex1+cortex_a7_fp_div_sqrt, cortex_a7_fp_div_sqrt * 28")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -323,14 +327,12 @@
  
  (define_insn_reservation "cortex_a7_r2f" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "r_2_f")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_mcr,f_mcrr"))
    "cortex_a7_both")
  
  (define_insn_reservation "cortex_a7_f2r" 2
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_2_r")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_mrc,f_mrrc"))
    "cortex_a7_ex1")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -342,8 +344,7 @@
  
  (define_insn_reservation "cortex_a7_f_flags" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_flag")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_flag"))
    "cortex_a7_ex1")
  
  ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -352,26 +353,22 @@
  
  (define_insn_reservation "cortex_a7_f_loads" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_loads")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_loads"))
    "cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_f_loadd" 4
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_loadd")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_loadd"))
    "cortex_a7_both")
  
  (define_insn_reservation "cortex_a7_f_stores" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_stores")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_stores"))
    "cortex_a7_ex1")
  
  (define_insn_reservation "cortex_a7_f_stored" 0
    (and (eq_attr "tune" "cortexa7")
-       (and (eq_attr "type" "f_stored")
-            (eq_attr "neon_type" "none")))
+       (eq_attr "type" "f_stored"))
    "cortex_a7_both")
  
  ;; Load-to-use for floating-point values has a penalty of one cycle,
@@ -392,22 +389,6 @@
  
  (define_insn_reservation "cortex_a7_neon" 4
    (and (eq_attr "tune" "cortexa7")
-       (eq_attr "neon_type"
-                "!none,\
-                  neon_mul_ddd_8_16_qdd_16_8_long_32_16_long,\
-                  neon_mul_qqq_8_16_32_ddd_32,\
-                  neon_mul_qdd_64_32_long_qqd_16_ddd_32_scalar_64_32_long_scalar,\
-                  neon_mla_ddd_8_16_qdd_16_8_long_32_16_long,\
-                  neon_mla_qqq_8_16,\
-                  neon_mla_ddd_32_qqd_16_ddd_32_scalar_qdd_64_32_long_scalar_qdd_64_32_long,\
-                  neon_mla_qqq_32_qqd_32_scalar,\
-                  neon_mul_ddd_16_scalar_32_16_long_scalar,\
-                  neon_mul_qqd_32_scalar,\
-                  neon_mla_ddd_16_scalar_qdd_32_16_long_scalar,\
-                  neon_fp_vmul_ddd,\
-                  neon_fp_vmul_qqd,\
-                  neon_fp_vmla_ddd,\
-                  neon_fp_vmla_qqq,\
-                  neon_fp_vmla_ddd_scalar,\
-                  neon_fp_vmla_qqq_scalar"))
+       (and (eq_attr "is_neon_type" "yes")
+            (eq_attr "cortex_a7_neon_type" "neon_other")))
    "cortex_a7_both*2")