1 /* Perform various loop optimizations, including strength reduction.
2 Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
3 1998, 1999, 2000, 2001, 2002, 2003, 2004 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
21
22 /* This is the loop optimization pass of the compiler.
23 It finds invariant computations within loops and moves them
24 to the beginning of the loop. Then it identifies basic and
25 general induction variables.
26
27 Basic induction variables (BIVs) are pseudo registers that are set within
28 a loop only by incrementing or decrementing their value.  General induction
29 variables (GIVs) are pseudo registers whose value is a linear function
30 of a basic induction variable.  BIVs are recognized by `basic_induction_var';
31 GIVs by `general_induction_var'.
32
33 Once induction variables are identified, strength reduction is applied to the
34 general induction variables, and induction variable elimination is applied to
35 the basic induction variables.
36
37 It also finds cases where
38 a register is set within the loop by zero-extending a narrower value
39 and changes these to zero the entire register once before the loop
40 and merely copy the low part within the loop.
41
42 Most of the complexity is in heuristics to decide when it is
43 worthwhile to do these things.  */
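/* As a purely illustrative sketch (the names used here are hypothetical,
   not taken from this file): in a loop such as

	for (i = 0; i < n; i++)
	  a[i] = 0;

   the counter I is a BIV, since it changes only by a constant increment
   on each iteration, and an address expression such as BASE + 4*I is a
   GIV, since it is a linear function of the BIV.  Strength reduction
   replaces the per-iteration multiply by keeping a pointer that is simply
   advanced by the element size each time around the loop.  Likewise, a
   loop that repeatedly zero-extends a byte into a wider register can be
   rewritten to clear that register once before the loop and load only the
   low byte inside it.  */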
44
45 #include "config.h"
46 #include "system.h"
47 #include "coretypes.h"
48 #include "tm.h"
49 #include "rtl.h"
50 #include "tm_p.h"
51 #include "function.h"
52 #include "expr.h"
53 #include "hard-reg-set.h"
54 #include "basic-block.h"
55 #include "insn-config.h"
56 #include "regs.h"
57 #include "recog.h"
58 #include "flags.h"
59 #include "real.h"
60 #include "loop.h"
61 #include "cselib.h"
62 #include "except.h"
63 #include "toplev.h"
64 #include "predict.h"
65 #include "insn-flags.h"
66 #include "optabs.h"
67 #include "cfgloop.h"
68 #include "ggc.h"
69
70 /* Not really meaningful values, but at least something. */
71 #ifndef SIMULTANEOUS_PREFETCHES
72 #define SIMULTANEOUS_PREFETCHES 3
73 #endif
74 #ifndef PREFETCH_BLOCK
75 #define PREFETCH_BLOCK 32
76 #endif
77 #ifndef HAVE_prefetch
78 #define HAVE_prefetch 0
79 #define CODE_FOR_prefetch 0
80 #define gen_prefetch(a,b,c) (abort(), NULL_RTX)
81 #endif
82
83 /* Give up the prefetch optimizations once we exceed a given threshold.
84 It is unlikely that we would be able to optimize something in a loop
85 with so many detected prefetches. */
86 #define MAX_PREFETCHES 100
87 /* The number of prefetch blocks that are beneficial to fetch at once before
88 a loop with a known (and low) iteration count. */
89 #define PREFETCH_BLOCKS_BEFORE_LOOP_MAX 6
90 /* For very tiny loops it is not worthwhile to prefetch even before the loop,
91 since it is likely that the data are already in the cache. */
92 #define PREFETCH_BLOCKS_BEFORE_LOOP_MIN 2
93
94 /* Parameterize some prefetch heuristics so they can be turned on and off
95 easily for performance testing on new architectures. These can be
96 defined in target-dependent files. */
97
98 /* Prefetch is worthwhile only when loads/stores are dense. */
99 #ifndef PREFETCH_ONLY_DENSE_MEM
100 #define PREFETCH_ONLY_DENSE_MEM 1
101 #endif
102
103 /* Define what we mean by "dense" loads and stores; this value divided by 256
104 is the minimum fraction of memory references that makes prefetching worthwhile.  */
105 #ifndef PREFETCH_DENSE_MEM
106 #define PREFETCH_DENSE_MEM 220
107 #endif
108
109 /* Do not prefetch for a loop whose iteration count is known to be low. */
110 #ifndef PREFETCH_NO_LOW_LOOPCNT
111 #define PREFETCH_NO_LOW_LOOPCNT 1
112 #endif
113
114 /* Define what we mean by a "low" iteration count. */
115 #ifndef PREFETCH_LOW_LOOPCNT
116 #define PREFETCH_LOW_LOOPCNT 32
117 #endif
118
119 /* Do not prefetch for a loop that contains a function call; such a loop is
120 probably not an internal loop. */
121 #ifndef PREFETCH_NO_CALL
122 #define PREFETCH_NO_CALL 1
123 #endif
124
125 /* Do not prefetch accesses with an extreme stride. */
126 #ifndef PREFETCH_NO_EXTREME_STRIDE
127 #define PREFETCH_NO_EXTREME_STRIDE 1
128 #endif
129
130 /* Define what we mean by an "extreme" stride. */
131 #ifndef PREFETCH_EXTREME_STRIDE
132 #define PREFETCH_EXTREME_STRIDE 4096
133 #endif
134
135 /* Define a limit to how far apart indices can be and still be merged
136 into a single prefetch. */
137 #ifndef PREFETCH_EXTREME_DIFFERENCE
138 #define PREFETCH_EXTREME_DIFFERENCE 4096
139 #endif
140
141 /* Issue prefetch instructions before the loop to fetch data to be used
142 in the first few loop iterations. */
143 #ifndef PREFETCH_BEFORE_LOOP
144 #define PREFETCH_BEFORE_LOOP 1
145 #endif
146
147 /* Do not handle reversed order prefetches (negative stride). */
148 #ifndef PREFETCH_NO_REVERSE_ORDER
149 #define PREFETCH_NO_REVERSE_ORDER 1
150 #endif
151
152 /* Prefetch even if the GIV is in conditional code. */
153 #ifndef PREFETCH_CONDITIONAL
154 #define PREFETCH_CONDITIONAL 1
155 #endif
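/* As an illustrative note, a port that wants different prefetch behavior
   can override any of these defaults from its target-dependent headers
   (see the comment above); for example, with hypothetical values:

	#define PREFETCH_BLOCK		64
	#define SIMULTANEOUS_PREFETCHES	8
	#define PREFETCH_LOW_LOOPCNT	16

   Macros a port leaves undefined keep the fallback values given above.  */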
156
157 #define LOOP_REG_LIFETIME(LOOP, REGNO) \
158 ((REGNO_LAST_LUID (REGNO) - REGNO_FIRST_LUID (REGNO)))
159
160 #define LOOP_REG_GLOBAL_P(LOOP, REGNO) \
161 ((REGNO_LAST_LUID (REGNO) > INSN_LUID ((LOOP)->end) \
162 || REGNO_FIRST_LUID (REGNO) < INSN_LUID ((LOOP)->start)))
163
164 #define LOOP_REGNO_NREGS(REGNO, SET_DEST) \
165 ((REGNO) < FIRST_PSEUDO_REGISTER \
166 ? (int) hard_regno_nregs[(REGNO)][GET_MODE (SET_DEST)] : 1)
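/* For instance, with hypothetical luids: if REGNO is first used at luid 10
   and last used at luid 25 while the loop spans luids 12 through 30, then
   LOOP_REG_LIFETIME is 25 - 10 = 15, and LOOP_REG_GLOBAL_P is nonzero
   because the first use falls before the loop start.  */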
167
168
169 /* Vector mapping INSN_UIDs to luids.
170 The luids are like uids but always increase monotonically.
171 We use them to see whether a jump comes from outside a given loop. */
172
173 int *uid_luid;
174
175 /* Indexed by INSN_UID, contains the ordinal giving the (innermost) loop
176 number the insn is contained in. */
177
178 struct loop **uid_loop;
179
180 /* 1 + largest uid of any insn. */
181
182 int max_uid_for_loop;
183
184 /* Number of loops detected in current function. Used as index to the
185 next few tables. */
186
187 static int max_loop_num;
188
189 /* Bound on pseudo register number before loop optimization.
190 A pseudo has valid regscan info if its number is < max_reg_before_loop. */
191 unsigned int max_reg_before_loop;
192
193 /* The value to pass to the next call of reg_scan_update. */
194 static int loop_max_reg;
195 \f
196 /* During the analysis of a loop, a chain of `struct movable's
197 is made to record all the movable insns found.
198 Then the entire chain can be scanned to decide which to move. */
199
200 struct movable
201 {
202 rtx insn; /* A movable insn */
203 rtx set_src; /* The expression this reg is set from. */
204 rtx set_dest; /* The destination of this SET. */
205 rtx dependencies; /* When INSN is a libcall, this is an EXPR_LIST
206 of any registers used within the LIBCALL. */
207 int consec; /* Number of consecutive following insns
208 that must be moved with this one. */
209 unsigned int regno; /* The register it sets */
210 short lifetime; /* lifetime of that register;
211 may be adjusted when matching movables
212 that load the same value are found. */
213 short savings; /* Number of insns we can move for this reg,
214 including other movables that force this
215 or match this one. */
216 ENUM_BITFIELD(machine_mode) savemode : 8; /* Nonzero means it is a mode for
217 a low part that we should avoid changing when
218 clearing the rest of the reg. */
219 unsigned int cond : 1; /* 1 if only conditionally movable */
220 unsigned int force : 1; /* 1 means MUST move this insn */
221 unsigned int global : 1; /* 1 means reg is live outside this loop */
222 /* If PARTIAL is 1, GLOBAL means something different:
223 that the reg is live outside the range from where it is set
224 to the following label. */
225 unsigned int done : 1; /* 1 inhibits further processing of this */
226
227 unsigned int partial : 1; /* 1 means this reg is used for zero-extending.
228 In particular, moving it does not make it
229 invariant. */
230 unsigned int move_insn : 1; /* 1 means that we call emit_move_insn to
231 load SRC, rather than copying INSN. */
232 unsigned int move_insn_first:1;/* Same as above, if this is necessary for the
233 first insn of a consecutive sets group. */
234 unsigned int is_equiv : 1; /* 1 means a REG_EQUIV is present on INSN. */
235 unsigned int insert_temp : 1; /* 1 means we copy to a new pseudo and replace
236 the original insn with a copy from that
237 pseudo, rather than deleting it. */
238 struct movable *match; /* First entry for same value */
239 struct movable *forces; /* An insn that must be moved if this is */
240 struct movable *next;
241 };
242
243
244 FILE *loop_dump_stream;
245
246 /* Forward declarations. */
247
248 static void invalidate_loops_containing_label (rtx);
249 static void find_and_verify_loops (rtx, struct loops *);
250 static void mark_loop_jump (rtx, struct loop *);
251 static void prescan_loop (struct loop *);
252 static int reg_in_basic_block_p (rtx, rtx);
253 static int consec_sets_invariant_p (const struct loop *, rtx, int, rtx);
254 static int labels_in_range_p (rtx, int);
255 static void count_one_set (struct loop_regs *, rtx, rtx, rtx *);
256 static void note_addr_stored (rtx, rtx, void *);
257 static void note_set_pseudo_multiple_uses (rtx, rtx, void *);
258 static int loop_reg_used_before_p (const struct loop *, rtx, rtx);
259 static rtx find_regs_nested (rtx, rtx);
260 static void scan_loop (struct loop*, int);
261 #if 0
262 static void replace_call_address (rtx, rtx, rtx);
263 #endif
264 static rtx skip_consec_insns (rtx, int);
265 static int libcall_benefit (rtx);
266 static rtx libcall_other_reg (rtx, rtx);
267 static void record_excess_regs (rtx, rtx, rtx *);
268 static void ignore_some_movables (struct loop_movables *);
269 static void force_movables (struct loop_movables *);
270 static void combine_movables (struct loop_movables *, struct loop_regs *);
271 static int num_unmoved_movables (const struct loop *);
272 static int regs_match_p (rtx, rtx, struct loop_movables *);
273 static int rtx_equal_for_loop_p (rtx, rtx, struct loop_movables *,
274 struct loop_regs *);
275 static void add_label_notes (rtx, rtx);
276 static void move_movables (struct loop *loop, struct loop_movables *, int,
277 int);
278 static void loop_movables_add (struct loop_movables *, struct movable *);
279 static void loop_movables_free (struct loop_movables *);
280 static int count_nonfixed_reads (const struct loop *, rtx);
281 static void loop_bivs_find (struct loop *);
282 static void loop_bivs_init_find (struct loop *);
283 static void loop_bivs_check (struct loop *);
284 static void loop_givs_find (struct loop *);
285 static void loop_givs_check (struct loop *);
286 static int loop_biv_eliminable_p (struct loop *, struct iv_class *, int, int);
287 static int loop_giv_reduce_benefit (struct loop *, struct iv_class *,
288 struct induction *, rtx);
289 static void loop_givs_dead_check (struct loop *, struct iv_class *);
290 static void loop_givs_reduce (struct loop *, struct iv_class *);
291 static void loop_givs_rescan (struct loop *, struct iv_class *, rtx *);
292 static void loop_ivs_free (struct loop *);
293 static void strength_reduce (struct loop *, int);
294 static void find_single_use_in_loop (struct loop_regs *, rtx, rtx);
295 static int valid_initial_value_p (rtx, rtx, int, rtx);
296 static void find_mem_givs (const struct loop *, rtx, rtx, int, int);
297 static void record_biv (struct loop *, struct induction *, rtx, rtx, rtx,
298 rtx, rtx *, int, int);
299 static void check_final_value (const struct loop *, struct induction *);
300 static void loop_ivs_dump (const struct loop *, FILE *, int);
301 static void loop_iv_class_dump (const struct iv_class *, FILE *, int);
302 static void loop_biv_dump (const struct induction *, FILE *, int);
303 static void loop_giv_dump (const struct induction *, FILE *, int);
304 static void record_giv (const struct loop *, struct induction *, rtx, rtx,
305 rtx, rtx, rtx, rtx, int, enum g_types, int, int,
306 rtx *);
307 static void update_giv_derive (const struct loop *, rtx);
308 static void check_ext_dependent_givs (const struct loop *, struct iv_class *);
309 static int basic_induction_var (const struct loop *, rtx, enum machine_mode,
310 rtx, rtx, rtx *, rtx *, rtx **);
311 static rtx simplify_giv_expr (const struct loop *, rtx, rtx *, int *);
312 static int general_induction_var (const struct loop *loop, rtx, rtx *, rtx *,
313 rtx *, rtx *, int, int *, enum machine_mode);
314 static int consec_sets_giv (const struct loop *, int, rtx, rtx, rtx, rtx *,
315 rtx *, rtx *, rtx *);
316 static int check_dbra_loop (struct loop *, int);
317 static rtx express_from_1 (rtx, rtx, rtx);
318 static rtx combine_givs_p (struct induction *, struct induction *);
319 static int cmp_combine_givs_stats (const void *, const void *);
320 static void combine_givs (struct loop_regs *, struct iv_class *);
321 static int product_cheap_p (rtx, rtx);
322 static int maybe_eliminate_biv (const struct loop *, struct iv_class *, int,
323 int, int);
324 static int maybe_eliminate_biv_1 (const struct loop *, rtx, rtx,
325 struct iv_class *, int, basic_block, rtx);
326 static int last_use_this_basic_block (rtx, rtx);
327 static void record_initial (rtx, rtx, void *);
328 static void update_reg_last_use (rtx, rtx);
329 static rtx next_insn_in_loop (const struct loop *, rtx);
330 static void loop_regs_scan (const struct loop *, int);
331 static int count_insns_in_loop (const struct loop *);
332 static int find_mem_in_note_1 (rtx *, void *);
333 static rtx find_mem_in_note (rtx);
334 static void load_mems (const struct loop *);
335 static int insert_loop_mem (rtx *, void *);
336 static int replace_loop_mem (rtx *, void *);
337 static void replace_loop_mems (rtx, rtx, rtx, int);
338 static int replace_loop_reg (rtx *, void *);
339 static void replace_loop_regs (rtx insn, rtx, rtx);
340 static void note_reg_stored (rtx, rtx, void *);
341 static void try_copy_prop (const struct loop *, rtx, unsigned int);
342 static void try_swap_copy_prop (const struct loop *, rtx, unsigned int);
343 static rtx check_insn_for_givs (struct loop *, rtx, int, int);
344 static rtx check_insn_for_bivs (struct loop *, rtx, int, int);
345 static rtx gen_add_mult (rtx, rtx, rtx, rtx);
346 static void loop_regs_update (const struct loop *, rtx);
347 static int iv_add_mult_cost (rtx, rtx, rtx, rtx);
348
349 static rtx loop_insn_emit_after (const struct loop *, basic_block, rtx, rtx);
350 static rtx loop_call_insn_emit_before (const struct loop *, basic_block,
351 rtx, rtx);
352 static rtx loop_call_insn_hoist (const struct loop *, rtx);
353 static rtx loop_insn_sink_or_swim (const struct loop *, rtx);
354
355 static void loop_dump_aux (const struct loop *, FILE *, int);
356 static void loop_delete_insns (rtx, rtx);
357 static HOST_WIDE_INT remove_constant_addition (rtx *);
358 static rtx gen_load_of_final_value (rtx, rtx);
359 void debug_ivs (const struct loop *);
360 void debug_iv_class (const struct iv_class *);
361 void debug_biv (const struct induction *);
362 void debug_giv (const struct induction *);
363 void debug_loop (const struct loop *);
364 void debug_loops (const struct loops *);
365
366 typedef struct loop_replace_args
367 {
368 rtx match;
369 rtx replacement;
370 rtx insn;
371 } loop_replace_args;
372
373 /* Nonzero iff INSN is between START and END, inclusive. */
374 #define INSN_IN_RANGE_P(INSN, START, END) \
375 (INSN_UID (INSN) < max_uid_for_loop \
376 && INSN_LUID (INSN) >= INSN_LUID (START) \
377 && INSN_LUID (INSN) <= INSN_LUID (END))
378
379 /* Indirect_jump_in_function is computed once per function. */
380 static int indirect_jump_in_function;
381 static int indirect_jump_in_function_p (rtx);
382
383 static int compute_luids (rtx, rtx, int);
384
385 static int biv_elimination_giv_has_0_offset (struct induction *,
386 struct induction *, rtx);
387 \f
388 /* Benefit penalty if a giv is not replaceable, i.e. we must emit an insn to
389 copy the value of the strength-reduced giv to its original register.  */
390 static int copy_cost;
391
392 /* Cost of using a register, to normalize the benefits of a giv. */
393 static int reg_address_cost;
394
395 void
396 init_loop (void)
397 {
398 rtx reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
399
400 reg_address_cost = address_cost (reg, SImode);
401
402 copy_cost = COSTS_N_INSNS (1);
403 }
404 \f
405 /* Compute the mapping from uids to luids.
406 LUIDs are numbers assigned to insns, like uids,
407 except that luids increase monotonically through the code.
408 Start at insn START and stop just before END. Assign LUIDs
409 starting with PREV_LUID + 1. Return the last assigned LUID + 1. */
410 static int
411 compute_luids (rtx start, rtx end, int prev_luid)
412 {
413 int i;
414 rtx insn;
415
416 for (insn = start, i = prev_luid; insn != end; insn = NEXT_INSN (insn))
417 {
418 if (INSN_UID (insn) >= max_uid_for_loop)
419 continue;
420 /* Don't assign luids to line-number NOTEs, so that the distance in
421 luids between two insns is not affected by -g. */
422 if (GET_CODE (insn) != NOTE
423 || NOTE_LINE_NUMBER (insn) <= 0)
424 uid_luid[INSN_UID (insn)] = ++i;
425 else
426 /* Give a line number note the same luid as preceding insn. */
427 uid_luid[INSN_UID (insn)] = i;
428 }
429 return i + 1;
430 }
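/* To illustrate with made-up uids: if the insns between START and END
   appear in the stream with uids 7, 3 and 9, they are assigned luids
   PREV_LUID + 1, PREV_LUID + 2 and PREV_LUID + 3 respectively, so luids
   follow insn-stream order even though uids need not.  A line-number
   note simply repeats the luid of the insn before it.  */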
431 \f
432 /* Entry point of this file. Perform loop optimization
433 on the current function. F is the first insn of the function
434 and DUMPFILE is a stream for output of a trace of actions taken
435 (or 0 if none should be output). */
436
437 void
438 loop_optimize (rtx f, FILE *dumpfile, int flags)
439 {
440 rtx insn;
441 int i;
442 struct loops loops_data;
443 struct loops *loops = &loops_data;
444 struct loop_info *loops_info;
445
446 loop_dump_stream = dumpfile;
447
448 init_recog_no_volatile ();
449
450 max_reg_before_loop = max_reg_num ();
451 loop_max_reg = max_reg_before_loop;
452
453 regs_may_share = 0;
454
455 /* Count the number of loops. */
456
457 max_loop_num = 0;
458 for (insn = f; insn; insn = NEXT_INSN (insn))
459 {
460 if (GET_CODE (insn) == NOTE
461 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
462 max_loop_num++;
463 }
464
465 /* Don't waste time if no loops. */
466 if (max_loop_num == 0)
467 return;
468
469 loops->num = max_loop_num;
470
471 /* Get size to use for tables indexed by uids.
472 Leave some space for labels allocated by find_and_verify_loops. */
473 max_uid_for_loop = get_max_uid () + 1 + max_loop_num * 32;
474
475 uid_luid = xcalloc (max_uid_for_loop, sizeof (int));
476 uid_loop = xcalloc (max_uid_for_loop, sizeof (struct loop *));
477
478 /* Allocate storage for array of loops. */
479 loops->array = xcalloc (loops->num, sizeof (struct loop));
480
481 /* Find and process each loop.
482 First, find them, and record them in order of their beginnings. */
483 find_and_verify_loops (f, loops);
484
485 /* Allocate and initialize auxiliary loop information. */
486 loops_info = xcalloc (loops->num, sizeof (struct loop_info));
487 for (i = 0; i < (int) loops->num; i++)
488 loops->array[i].aux = loops_info + i;
489
490 /* Now find all register lifetimes. This must be done after
491 find_and_verify_loops, because it might reorder the insns in the
492 function. */
493 reg_scan (f, max_reg_before_loop, 1);
494
495 /* This must occur after reg_scan so that registers created by gcse
496 will have entries in the register tables.
497
498 We could have added a call to reg_scan after gcse_main in toplev.c,
499 but moving this call to init_alias_analysis is more efficient. */
500 init_alias_analysis ();
501
502 /* See if we went too far.  Note that get_max_uid already returns
503 one more than the maximum uid of all insns.  */
504 if (get_max_uid () > max_uid_for_loop)
505 abort ();
506 /* Now reset it to the actual size we need. See above. */
507 max_uid_for_loop = get_max_uid ();
508
509 /* find_and_verify_loops has already called compute_luids, but it
510 might have rearranged code afterwards, so we need to recompute
511 the luids now. */
512 compute_luids (f, NULL_RTX, 0);
513
514 /* Don't leave gaps in uid_luid for insns that have been
515 deleted. It is possible that the first or last insn
516 using some register has been deleted by cross-jumping.
517 Make sure that uid_luid for that former insn's uid
518 points to the general area where that insn used to be. */
519 for (i = 0; i < max_uid_for_loop; i++)
520 {
521 uid_luid[0] = uid_luid[i];
522 if (uid_luid[0] != 0)
523 break;
524 }
525 for (i = 0; i < max_uid_for_loop; i++)
526 if (uid_luid[i] == 0)
527 uid_luid[i] = uid_luid[i - 1];
528
529 /* Determine if the function has an indirect jump.  On some systems
530 this prevents low-overhead loop instructions from being used.  */
531 indirect_jump_in_function = indirect_jump_in_function_p (f);
532
533 /* Now scan the loops, last ones first, since this means inner ones are done
534 before outer ones. */
535 for (i = max_loop_num - 1; i >= 0; i--)
536 {
537 struct loop *loop = &loops->array[i];
538
539 if (! loop->invalid && loop->end)
540 {
541 scan_loop (loop, flags);
542 ggc_collect ();
543 }
544 }
545
546 end_alias_analysis ();
547
548 /* Clean up. */
549 for (i = 0; i < (int) loops->num; i++)
550 free (loops_info[i].mems);
551
552 free (uid_luid);
553 free (uid_loop);
554 free (loops_info);
555 free (loops->array);
556 }
557 \f
558 /* Returns the next insn, in execution order, after INSN.  LOOP->START and
559 LOOP->END are the NOTE_INSN_LOOP_BEG and NOTE_INSN_LOOP_END for the loop,
560 respectively. LOOP->TOP, if non-NULL, is the top of the loop in the
561 insn-stream; it is used with loops that are entered near the
562 bottom. */
563
564 static rtx
565 next_insn_in_loop (const struct loop *loop, rtx insn)
566 {
567 insn = NEXT_INSN (insn);
568
569 if (insn == loop->end)
570 {
571 if (loop->top)
572 /* Go to the top of the loop, and continue there. */
573 insn = loop->top;
574 else
575 /* We're done. */
576 insn = NULL_RTX;
577 }
578
579 if (insn == loop->scan_start)
580 /* We're done. */
581 insn = NULL_RTX;
582
583 return insn;
584 }
585
586 /* Find any register references hidden inside X and add them to
587 the dependency list DEPS.  This is used to look inside CLOBBER (MEM ...)
588 patterns when checking whether a PARALLEL can be pulled out of a loop.  */
589
590 static rtx
591 find_regs_nested (rtx deps, rtx x)
592 {
593 enum rtx_code code = GET_CODE (x);
594 if (code == REG)
595 deps = gen_rtx_EXPR_LIST (VOIDmode, x, deps);
596 else
597 {
598 const char *fmt = GET_RTX_FORMAT (code);
599 int i, j;
600 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
601 {
602 if (fmt[i] == 'e')
603 deps = find_regs_nested (deps, XEXP (x, i));
604 else if (fmt[i] == 'E')
605 for (j = 0; j < XVECLEN (x, i); j++)
606 deps = find_regs_nested (deps, XVECEXP (x, i, j));
607 }
608 }
609 return deps;
610 }
611
612 /* Optimize one loop described by LOOP. */
613
614 /* ??? Could also move memory writes out of loops if the destination address
615 is invariant, the source is invariant, the memory write is not volatile,
616 and if we can prove that no read inside the loop can read this address
617 before the write occurs. If there is a read of this address after the
618 write, then we can also mark the memory read as invariant. */
619
620 static void
621 scan_loop (struct loop *loop, int flags)
622 {
623 struct loop_info *loop_info = LOOP_INFO (loop);
624 struct loop_regs *regs = LOOP_REGS (loop);
625 int i;
626 rtx loop_start = loop->start;
627 rtx loop_end = loop->end;
628 rtx p;
629 /* 1 if we are scanning insns that could be executed zero times. */
630 int maybe_never = 0;
631 /* 1 if we are scanning insns that might never be executed
632 due to a subroutine call which might exit before they are reached. */
633 int call_passed = 0;
634 /* Number of insns in the loop. */
635 int insn_count;
636 int tem;
637 rtx temp, update_start, update_end;
638 /* The SET from an insn, if it is the only SET in the insn. */
639 rtx set, set1;
640 /* Chain describing insns movable in current loop. */
641 struct loop_movables *movables = LOOP_MOVABLES (loop);
642 /* Ratio of extra register life span we can justify
643 for saving an instruction. More if loop doesn't call subroutines
644 since in that case saving an insn makes more difference
645 and more registers are available. */
646 int threshold;
647 /* Nonzero if we are scanning instructions in a sub-loop. */
648 int loop_depth = 0;
649 int in_libcall;
650
651 loop->top = 0;
652
653 movables->head = 0;
654 movables->last = 0;
655
656 /* Determine whether this loop starts with a jump down to a test at
657 the end. This will occur for a small number of loops with a test
658 that is too complex to duplicate in front of the loop.
659
660 We search for the first insn or label in the loop, skipping NOTEs.
661 However, we must be careful not to skip past a NOTE_INSN_LOOP_BEG
662 (because we might have a loop executed only once that contains a
663 loop which starts with a jump to its exit test) or a NOTE_INSN_LOOP_END
664 (in case we have a degenerate loop).
665
666 Note that if we mistakenly think that a loop is entered at the top
667 when, in fact, it is entered at the exit test, the only effect will be
668 slightly poorer optimization. Making the opposite error can generate
669 incorrect code. Since very few loops now start with a jump to the
670 exit test, the code here to detect that case is very conservative. */
671
672 for (p = NEXT_INSN (loop_start);
673 p != loop_end
674 && GET_CODE (p) != CODE_LABEL && ! INSN_P (p)
675 && (GET_CODE (p) != NOTE
676 || (NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_BEG
677 && NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_END));
678 p = NEXT_INSN (p))
679 ;
680
681 loop->scan_start = p;
682
683 /* If loop end is the end of the current function, then emit a
684 NOTE_INSN_DELETED after loop_end and set loop->sink to the dummy
685 note insn. This is the position we use when sinking insns out of
686 the loop. */
687 if (NEXT_INSN (loop->end) != 0)
688 loop->sink = NEXT_INSN (loop->end);
689 else
690 loop->sink = emit_note_after (NOTE_INSN_DELETED, loop->end);
691
692 /* Set up variables describing this loop. */
693 prescan_loop (loop);
694 threshold = (loop_info->has_call ? 1 : 2) * (1 + n_non_fixed_regs);
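/* As a worked example with a hypothetical count of 31 non-fixed registers:
   a loop without calls gets a threshold of 2 * (1 + 31) = 64, while a loop
   containing calls gets only 1 * (1 + 31) = 32, i.e. we tolerate only half
   as much extra register lifetime per saved insn when calls are present.  */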
695
696 /* If loop has a jump before the first label,
697 the true entry is the target of that jump.
698 Start scan from there.
699 But record in LOOP->TOP the place where the end-test jumps
700 back to so we can scan that after the end of the loop. */
701 if (GET_CODE (p) == JUMP_INSN
702 /* Loop entry must be unconditional jump (and not a RETURN) */
703 && any_uncondjump_p (p)
704 && JUMP_LABEL (p) != 0
705 /* Check to see whether the jump actually
706 jumps out of the loop (meaning it's no loop).
707 This case can happen for things like
708 do {..} while (0). If this label was generated previously
709 by loop, we can't tell anything about it and have to reject
710 the loop. */
711 && INSN_IN_RANGE_P (JUMP_LABEL (p), loop_start, loop_end))
712 {
713 loop->top = next_label (loop->scan_start);
714 loop->scan_start = JUMP_LABEL (p);
715 }
716
717 /* If LOOP->SCAN_START was an insn created by loop, we don't know its luid
718 as required by loop_reg_used_before_p. So skip such loops. (This
719 test may never be true, but it's best to play it safe.)
720
721 Also, skip loops where we do not start scanning at a label. This
722 test also rejects loops starting with a JUMP_INSN that failed the
723 test above. */
724
725 if (INSN_UID (loop->scan_start) >= max_uid_for_loop
726 || GET_CODE (loop->scan_start) != CODE_LABEL)
727 {
728 if (loop_dump_stream)
729 fprintf (loop_dump_stream, "\nLoop from %d to %d is phony.\n\n",
730 INSN_UID (loop_start), INSN_UID (loop_end));
731 return;
732 }
733
734 /* Allocate extra space for REGs that might be created by load_mems.
735 We allocate a little extra slop as well, in the hopes that we
736 won't have to reallocate the regs array. */
737 loop_regs_scan (loop, loop_info->mems_idx + 16);
738 insn_count = count_insns_in_loop (loop);
739
740 if (loop_dump_stream)
741 {
742 fprintf (loop_dump_stream, "\nLoop from %d to %d: %d real insns.\n",
743 INSN_UID (loop_start), INSN_UID (loop_end), insn_count);
744 if (loop->cont)
745 fprintf (loop_dump_stream, "Continue at insn %d.\n",
746 INSN_UID (loop->cont));
747 }
748
749 /* Scan through the loop finding insns that are safe to move.
750 Set REGS->ARRAY[I].SET_IN_LOOP negative for the reg I being set, so that
751 this reg will be considered invariant for subsequent insns.
752 We consider whether subsequent insns use the reg
753 in deciding whether it is worth actually moving.
754
755 MAYBE_NEVER is nonzero if we have passed a conditional jump insn
756 and therefore it is possible that the insns we are scanning
757 would never be executed. At such times, we must make sure
758 that it is safe to execute the insn once instead of zero times.
759 When MAYBE_NEVER is 0, all insns will be executed at least once
760 so that is not a problem. */
761
762 for (in_libcall = 0, p = next_insn_in_loop (loop, loop->scan_start);
763 p != NULL_RTX;
764 p = next_insn_in_loop (loop, p))
765 {
766 if (in_libcall && INSN_P (p) && find_reg_note (p, REG_RETVAL, NULL_RTX))
767 in_libcall--;
768 if (GET_CODE (p) == INSN)
769 {
770 temp = find_reg_note (p, REG_LIBCALL, NULL_RTX);
771 if (temp)
772 in_libcall++;
773 if (! in_libcall
774 && (set = single_set (p))
775 && GET_CODE (SET_DEST (set)) == REG
776 #ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED
777 && SET_DEST (set) != pic_offset_table_rtx
778 #endif
779 && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
780 {
781 int tem1 = 0;
782 int tem2 = 0;
783 int move_insn = 0;
784 int insert_temp = 0;
785 rtx src = SET_SRC (set);
786 rtx dependencies = 0;
787
788 /* Figure out what to use as a source of this insn. If a
789 REG_EQUIV note is given or if a REG_EQUAL note with a
790 constant operand is specified, use it as the source and
791 mark that we should move this insn by calling
792 emit_move_insn rather than duplicating the insn.
793
794 Otherwise, only use the REG_EQUAL contents if a REG_RETVAL
795 note is present. */
796 temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
797 if (temp)
798 src = XEXP (temp, 0), move_insn = 1;
799 else
800 {
801 temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
802 if (temp && CONSTANT_P (XEXP (temp, 0)))
803 src = XEXP (temp, 0), move_insn = 1;
804 if (temp && find_reg_note (p, REG_RETVAL, NULL_RTX))
805 {
806 src = XEXP (temp, 0);
807 /* A libcall block can use regs that don't appear in
808 the equivalent expression. To move the libcall,
809 we must move those regs too. */
810 dependencies = libcall_other_reg (p, src);
811 }
812 }
813
814 /* For parallels, add any possible uses to the dependencies, as
815 we can't move the insn without resolving them first.
816 MEMs inside CLOBBERs may also reference registers; these
817 count as implicit uses. */
818 if (GET_CODE (PATTERN (p)) == PARALLEL)
819 {
820 for (i = 0; i < XVECLEN (PATTERN (p), 0); i++)
821 {
822 rtx x = XVECEXP (PATTERN (p), 0, i);
823 if (GET_CODE (x) == USE)
824 dependencies
825 = gen_rtx_EXPR_LIST (VOIDmode, XEXP (x, 0),
826 dependencies);
827 else if (GET_CODE (x) == CLOBBER
828 && GET_CODE (XEXP (x, 0)) == MEM)
829 dependencies = find_regs_nested (dependencies,
830 XEXP (XEXP (x, 0), 0));
831 }
832 }
833
834 if (/* The register is used in basic blocks other
835 than the one where it is set (meaning that
836 something after this point in the loop might
837 depend on its value before the set). */
838 ! reg_in_basic_block_p (p, SET_DEST (set))
839 /* And the set is not guaranteed to be executed once
840 the loop starts, or the value before the set is
841 needed before the set occurs...
842
843 ??? Note we have quadratic behavior here, mitigated
844 by the fact that the previous test will often fail for
845 large loops. Rather than re-scanning the entire loop
846 each time for register usage, we should build tables
847 of the register usage and use them here instead. */
848 && (maybe_never
849 || loop_reg_used_before_p (loop, set, p)))
850 /* It is unsafe to move the set. However, it may be OK to
851 move the source into a new pseudo, and substitute a
852 reg-to-reg copy for the original insn.
853
854 This code used to consider it OK to move a set of a variable
855 which was not created by the user and not used in an exit
856 test.
857 That behavior is incorrect and was removed. */
858 insert_temp = 1;
859
860 /* Don't try to optimize a MODE_CC set with a constant
861 source. It probably will be combined with a conditional
862 jump. */
863 if (GET_MODE_CLASS (GET_MODE (SET_DEST (set))) == MODE_CC
864 && CONSTANT_P (src))
865 ;
866 /* Don't try to optimize a register that was made
867 by loop-optimization for an inner loop.
868 We don't know its life-span, so we can't compute
869 the benefit. */
870 else if (REGNO (SET_DEST (set)) >= max_reg_before_loop)
871 ;
872 /* Don't move the source and add a reg-to-reg copy:
873 - with -Os (this certainly increases size),
874 - if the mode doesn't support copy operations (obviously),
875 - if the source is already a reg (the motion will gain nothing),
876 - if the source is a legitimate constant (likewise). */
877 else if (insert_temp
878 && (optimize_size
879 || ! can_copy_p (GET_MODE (SET_SRC (set)))
880 || GET_CODE (SET_SRC (set)) == REG
881 || (CONSTANT_P (SET_SRC (set))
882 && LEGITIMATE_CONSTANT_P (SET_SRC (set)))))
883 ;
884 else if ((tem = loop_invariant_p (loop, src))
885 && (dependencies == 0
886 || (tem2
887 = loop_invariant_p (loop, dependencies)) != 0)
888 && (regs->array[REGNO (SET_DEST (set))].set_in_loop == 1
889 || (tem1
890 = consec_sets_invariant_p
891 (loop, SET_DEST (set),
892 regs->array[REGNO (SET_DEST (set))].set_in_loop,
893 p)))
894 /* If the insn can cause a trap (such as divide by zero),
895 can't move it unless it's guaranteed to be executed
896 once loop is entered. Even a function call might
897 prevent the trap insn from being reached
898 (since it might exit!) */
899 && ! ((maybe_never || call_passed)
900 && may_trap_p (src)))
901 {
902 struct movable *m;
903 int regno = REGNO (SET_DEST (set));
904
905 /* A potential lossage is the case where two insns
906 can be combined as long as they are both in the loop, but
907 we move one of them outside the loop. For large loops,
908 this can lose. The most common case of this is the address
909 of a function being called.
910
911 Therefore, if this register is marked as being used
912 exactly once and we are in a loop with calls
913 (a "large loop"), see if we can replace the usage of
914 this register with the source of this SET. If we can,
915 delete this insn.
916
917 Don't do this if P has a REG_RETVAL note or if we have
918 SMALL_REGISTER_CLASSES and SET_SRC is a hard register. */
919
920 if (loop_info->has_call
921 && regs->array[regno].single_usage != 0
922 && regs->array[regno].single_usage != const0_rtx
923 && REGNO_FIRST_UID (regno) == INSN_UID (p)
924 && (REGNO_LAST_UID (regno)
925 == INSN_UID (regs->array[regno].single_usage))
926 && regs->array[regno].set_in_loop == 1
927 && GET_CODE (SET_SRC (set)) != ASM_OPERANDS
928 && ! side_effects_p (SET_SRC (set))
929 && ! find_reg_note (p, REG_RETVAL, NULL_RTX)
930 && (! SMALL_REGISTER_CLASSES
931 || (! (GET_CODE (SET_SRC (set)) == REG
932 && (REGNO (SET_SRC (set))
933 < FIRST_PSEUDO_REGISTER))))
934 /* This test is not redundant; SET_SRC (set) might be
935 a call-clobbered register and the life of REGNO
936 might span a call. */
937 && ! modified_between_p (SET_SRC (set), p,
938 regs->array[regno].single_usage)
939 && no_labels_between_p (p,
940 regs->array[regno].single_usage)
941 && validate_replace_rtx (SET_DEST (set), SET_SRC (set),
942 regs->array[regno].single_usage))
943 {
944 /* Replace any usage in a REG_EQUAL note. Must copy
945 the new source, so that we don't get rtx sharing
946 between the SET_SOURCE and REG_NOTES of insn p. */
947 REG_NOTES (regs->array[regno].single_usage)
948 = (replace_rtx
949 (REG_NOTES (regs->array[regno].single_usage),
950 SET_DEST (set), copy_rtx (SET_SRC (set))));
951
952 delete_insn (p);
953 for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
954 i++)
955 regs->array[regno+i].set_in_loop = 0;
956 continue;
957 }
958
959 m = xmalloc (sizeof (struct movable));
960 m->next = 0;
961 m->insn = p;
962 m->set_src = src;
963 m->dependencies = dependencies;
964 m->set_dest = SET_DEST (set);
965 m->force = 0;
966 m->consec
967 = regs->array[REGNO (SET_DEST (set))].set_in_loop - 1;
968 m->done = 0;
969 m->forces = 0;
970 m->partial = 0;
971 m->move_insn = move_insn;
972 m->move_insn_first = 0;
973 m->insert_temp = insert_temp;
974 m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
975 m->savemode = VOIDmode;
976 m->regno = regno;
977 /* Set M->cond if either loop_invariant_p
978 or consec_sets_invariant_p returned 2
979 (only conditionally invariant). */
980 m->cond = ((tem | tem1 | tem2) > 1);
981 m->global = LOOP_REG_GLOBAL_P (loop, regno);
982 m->match = 0;
983 m->lifetime = LOOP_REG_LIFETIME (loop, regno);
984 m->savings = regs->array[regno].n_times_set;
985 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
986 m->savings += libcall_benefit (p);
987 for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
988 regs->array[regno+i].set_in_loop = move_insn ? -2 : -1;
989 /* Add M to the end of the chain MOVABLES. */
990 loop_movables_add (movables, m);
991
992 if (m->consec > 0)
993 {
994 /* It is possible for the first instruction to have a
995 REG_EQUAL note but a non-invariant SET_SRC, so we must
996 remember the status of the first instruction in case
997 the last instruction doesn't have a REG_EQUAL note. */
998 m->move_insn_first = m->move_insn;
999
1000 /* Skip this insn, not checking REG_LIBCALL notes. */
1001 p = next_nonnote_insn (p);
1002 /* Skip the consecutive insns, if there are any. */
1003 p = skip_consec_insns (p, m->consec);
1004 /* Back up to the last insn of the consecutive group. */
1005 p = prev_nonnote_insn (p);
1006
1007 /* We must now reset m->move_insn, m->is_equiv, and
1008 possibly m->set_src to correspond to the effects of
1009 all the insns. */
1010 temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
1011 if (temp)
1012 m->set_src = XEXP (temp, 0), m->move_insn = 1;
1013 else
1014 {
1015 temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
1016 if (temp && CONSTANT_P (XEXP (temp, 0)))
1017 m->set_src = XEXP (temp, 0), m->move_insn = 1;
1018 else
1019 m->move_insn = 0;
1020
1021 }
1022 m->is_equiv
1023 = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
1024 }
1025 }
1026 /* If this register is always set within a STRICT_LOW_PART
1027 or set to zero, then its high bytes are constant.
1028 So clear them outside the loop and within the loop
1029 just load the low bytes.
1030 We must check that the machine has an instruction to do so.
1031 Also, if the value loaded into the register
1032 depends on the same register, this cannot be done. */
1033 else if (SET_SRC (set) == const0_rtx
1034 && GET_CODE (NEXT_INSN (p)) == INSN
1035 && (set1 = single_set (NEXT_INSN (p)))
1036 && GET_CODE (set1) == SET
1037 && (GET_CODE (SET_DEST (set1)) == STRICT_LOW_PART)
1038 && (GET_CODE (XEXP (SET_DEST (set1), 0)) == SUBREG)
1039 && (SUBREG_REG (XEXP (SET_DEST (set1), 0))
1040 == SET_DEST (set))
1041 && !reg_mentioned_p (SET_DEST (set), SET_SRC (set1)))
1042 {
1043 int regno = REGNO (SET_DEST (set));
1044 if (regs->array[regno].set_in_loop == 2)
1045 {
1046 struct movable *m;
1047 m = xmalloc (sizeof (struct movable));
1048 m->next = 0;
1049 m->insn = p;
1050 m->set_dest = SET_DEST (set);
1051 m->dependencies = 0;
1052 m->force = 0;
1053 m->consec = 0;
1054 m->done = 0;
1055 m->forces = 0;
1056 m->move_insn = 0;
1057 m->move_insn_first = 0;
1058 m->insert_temp = insert_temp;
1059 m->partial = 1;
1060 /* If the insn may not be executed on some cycles,
1061 we can't clear the whole reg; clear just high part.
1062 Not even if the reg is used only within this loop.
1063 Consider this:
1064 while (1)
1065 while (s != t) {
1066 if (foo ()) x = *s;
1067 use (x);
1068 }
1069 Clearing x before the inner loop could clobber a value
1070 being saved from the last time around the outer loop.
1071 However, if the reg is not used outside this loop
1072 and all uses of the register are in the same
1073 basic block as the store, there is no problem.
1074
1075 If this insn was made by loop, we don't know its
1076 INSN_LUID and hence must make a conservative
1077 assumption. */
1078 m->global = (INSN_UID (p) >= max_uid_for_loop
1079 || LOOP_REG_GLOBAL_P (loop, regno)
1080 || (labels_in_range_p
1081 (p, REGNO_FIRST_LUID (regno))));
1082 if (maybe_never && m->global)
1083 m->savemode = GET_MODE (SET_SRC (set1));
1084 else
1085 m->savemode = VOIDmode;
1086 m->regno = regno;
1087 m->cond = 0;
1088 m->match = 0;
1089 m->lifetime = LOOP_REG_LIFETIME (loop, regno);
1090 m->savings = 1;
1091 for (i = 0;
1092 i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
1093 i++)
1094 regs->array[regno+i].set_in_loop = -1;
1095 /* Add M to the end of the chain MOVABLES. */
1096 loop_movables_add (movables, m);
1097 }
1098 }
1099 }
1100 }
1101 /* Past a call insn, we get to insns which might not be executed
1102 because the call might exit. This matters for insns that trap.
1103 Constant and pure call insns always return, so they don't count. */
1104 else if (GET_CODE (p) == CALL_INSN && ! CONST_OR_PURE_CALL_P (p))
1105 call_passed = 1;
1106 /* Past a label or a jump, we get to insns for which we
1107 can't count on whether or how many times they will be
1108 executed during each iteration. Therefore, we can
1109 only move out sets of trivial variables
1110 (those not used after the loop). */
1111 /* Similar code appears twice in strength_reduce. */
1112 else if ((GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN)
1113 /* If we enter the loop in the middle, and scan around to the
1114 beginning, don't set maybe_never for that. This must be an
1115 unconditional jump, otherwise the code at the top of the
1116 loop might never be executed. Unconditional jumps are
1117 followed by a barrier then the loop_end. */
1118 && ! (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p) == loop->top
1119 && NEXT_INSN (NEXT_INSN (p)) == loop_end
1120 && any_uncondjump_p (p)))
1121 maybe_never = 1;
1122 else if (GET_CODE (p) == NOTE)
1123 {
1124 /* At the virtual top of a converted loop, insns are again known to
1125 be executed: logically, the loop begins here even though the exit
1126 code has been duplicated. */
1127 if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP && loop_depth == 0)
1128 maybe_never = call_passed = 0;
1129 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
1130 loop_depth++;
1131 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
1132 loop_depth--;
1133 }
1134 }
1135
1136 /* If one movable subsumes another, ignore that other. */
1137
1138 ignore_some_movables (movables);
1139
1140 /* For each movable insn, see if the reg that it loads
1141 leads, when it dies, right into another conditionally movable insn.
1142 If so, record that the second insn "forces" the first one,
1143 since the second can be moved only if the first is. */
1144
1145 force_movables (movables);
1146
1147 /* See if there are multiple movable insns that load the same value.
1148 If there are, make all but the first point at the first one
1149 through the `match' field, and add the priorities of them
1150 all together as the priority of the first. */
1151
1152 combine_movables (movables, regs);
1153
1154 /* Now consider each movable insn to decide whether it is worth moving.
1155 Store 0 in regs->array[I].set_in_loop for each reg I that is moved.
1156
1157 For machines with few registers this increases code size, so do not
1158 move movables when optimizing for code size on such machines.
1159 (The 18 below is the value for i386.) */
1160
1161 if (!optimize_size
1162 || (reg_class_size[GENERAL_REGS] > 18 && !loop_info->has_call))
1163 {
1164 move_movables (loop, movables, threshold, insn_count);
1165
1166 /* Recalculate regs->array if move_movables has created new
1167 registers. */
1168 if (max_reg_num () > regs->num)
1169 {
1170 loop_regs_scan (loop, 0);
1171 for (update_start = loop_start;
1172 PREV_INSN (update_start)
1173 && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1174 update_start = PREV_INSN (update_start))
1175 ;
1176 update_end = NEXT_INSN (loop_end);
1177
1178 reg_scan_update (update_start, update_end, loop_max_reg);
1179 loop_max_reg = max_reg_num ();
1180 }
1181 }
1182
1183 /* Candidates whose set_in_loop is still negative are those not moved.
1184 Change regs->array[I].set_in_loop to indicate that those are not actually
1185 invariant. */
1186 for (i = 0; i < regs->num; i++)
1187 if (regs->array[i].set_in_loop < 0)
1188 regs->array[i].set_in_loop = regs->array[i].n_times_set;
1189
1190 /* Now that we've moved some things out of the loop, we might be able to
1191 hoist even more memory references. */
1192 load_mems (loop);
1193
1194 /* Recalculate regs->array if load_mems has created new registers. */
1195 if (max_reg_num () > regs->num)
1196 loop_regs_scan (loop, 0);
1197
1198 for (update_start = loop_start;
1199 PREV_INSN (update_start)
1200 && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1201 update_start = PREV_INSN (update_start))
1202 ;
1203 update_end = NEXT_INSN (loop_end);
1204
1205 reg_scan_update (update_start, update_end, loop_max_reg);
1206 loop_max_reg = max_reg_num ();
1207
1208 if (flag_strength_reduce)
1209 {
1210 if (update_end && GET_CODE (update_end) == CODE_LABEL)
1211 /* Ensure our label doesn't go away. */
1212 LABEL_NUSES (update_end)++;
1213
1214 strength_reduce (loop, flags);
1215
1216 reg_scan_update (update_start, update_end, loop_max_reg);
1217 loop_max_reg = max_reg_num ();
1218
1219 if (update_end && GET_CODE (update_end) == CODE_LABEL
1220 && --LABEL_NUSES (update_end) == 0)
1221 delete_related_insns (update_end);
1222 }
1223
1224
1225 /* The movable information is required for strength reduction. */
1226 loop_movables_free (movables);
1227
1228 free (regs->array);
1229 regs->array = 0;
1230 regs->num = 0;
1231 }
1232 \f
1233 /* Add elements to *OUTPUT to record all the pseudo-regs
1234 mentioned in IN_THIS but not mentioned in NOT_IN_THIS. */
1235
1236 static void
1237 record_excess_regs (rtx in_this, rtx not_in_this, rtx *output)
1238 {
1239 enum rtx_code code;
1240 const char *fmt;
1241 int i;
1242
1243 code = GET_CODE (in_this);
1244
1245 switch (code)
1246 {
1247 case PC:
1248 case CC0:
1249 case CONST_INT:
1250 case CONST_DOUBLE:
1251 case CONST:
1252 case SYMBOL_REF:
1253 case LABEL_REF:
1254 return;
1255
1256 case REG:
1257 if (REGNO (in_this) >= FIRST_PSEUDO_REGISTER
1258 && ! reg_mentioned_p (in_this, not_in_this))
1259 *output = gen_rtx_EXPR_LIST (VOIDmode, in_this, *output);
1260 return;
1261
1262 default:
1263 break;
1264 }
1265
1266 fmt = GET_RTX_FORMAT (code);
1267 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1268 {
1269 int j;
1270
1271 switch (fmt[i])
1272 {
1273 case 'E':
1274 for (j = 0; j < XVECLEN (in_this, i); j++)
1275 record_excess_regs (XVECEXP (in_this, i, j), not_in_this, output);
1276 break;
1277
1278 case 'e':
1279 record_excess_regs (XEXP (in_this, i), not_in_this, output);
1280 break;
1281 }
1282 }
1283 }
1284 \f
1285 /* Check what regs are referred to in the libcall block ending with INSN,
1286 aside from those mentioned in the equivalent value.
1287 If there are none, return 0.
1288 If there are one or more, return an EXPR_LIST containing all of them. */
1289
1290 static rtx
1291 libcall_other_reg (rtx insn, rtx equiv)
1292 {
1293 rtx note = find_reg_note (insn, REG_RETVAL, NULL_RTX);
1294 rtx p = XEXP (note, 0);
1295 rtx output = 0;
1296
1297 /* First, find all the regs used in the libcall block
1298 that are not mentioned as inputs to the result. */
1299
1300 while (p != insn)
1301 {
1302 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
1303 || GET_CODE (p) == CALL_INSN)
1304 record_excess_regs (PATTERN (p), equiv, &output);
1305 p = NEXT_INSN (p);
1306 }
1307
1308 return output;
1309 }
1310 \f
1311 /* Return 1 if all uses of REG
1312 are between INSN and the end of the basic block. */
1313
1314 static int
1315 reg_in_basic_block_p (rtx insn, rtx reg)
1316 {
1317 int regno = REGNO (reg);
1318 rtx p;
1319
1320 if (REGNO_FIRST_UID (regno) != INSN_UID (insn))
1321 return 0;
1322
1323 /* Search this basic block for the already recorded last use of the reg. */
1324 for (p = insn; p; p = NEXT_INSN (p))
1325 {
1326 switch (GET_CODE (p))
1327 {
1328 case NOTE:
1329 break;
1330
1331 case INSN:
1332 case CALL_INSN:
1333 /* Ordinary insn: if this is the last use, we win. */
1334 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1335 return 1;
1336 break;
1337
1338 case JUMP_INSN:
1339 /* Jump insn: if this is the last use, we win. */
1340 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1341 return 1;
1342 /* Otherwise, it's the end of the basic block, so we lose. */
1343 return 0;
1344
1345 case CODE_LABEL:
1346 case BARRIER:
1347 /* It's the end of the basic block, so we lose. */
1348 return 0;
1349
1350 default:
1351 break;
1352 }
1353 }
1354
1355 /* The "last use" that was recorded can't be found after the first
1356 use. This can happen when the last use was deleted while
1357 processing an inner loop, this inner loop was then completely
1358 unrolled, and the outer loop is always exited after the inner loop,
1359 so that everything after the first use becomes a single basic block. */
1360 return 1;
1361 }
1362 \f
1363 /* Compute the benefit of eliminating the insns in the block whose
1364 last insn is LAST. This may be a group of insns used to compute a
1365 value directly or can contain a library call. */
1366
1367 static int
1368 libcall_benefit (rtx last)
1369 {
1370 rtx insn;
1371 int benefit = 0;
1372
1373 for (insn = XEXP (find_reg_note (last, REG_RETVAL, NULL_RTX), 0);
1374 insn != last; insn = NEXT_INSN (insn))
1375 {
1376 if (GET_CODE (insn) == CALL_INSN)
1377 benefit += 10; /* Assume at least this many insns in a library
1378 routine. */
1379 else if (GET_CODE (insn) == INSN
1380 && GET_CODE (PATTERN (insn)) != USE
1381 && GET_CODE (PATTERN (insn)) != CLOBBER)
1382 benefit++;
1383 }
1384
1385 return benefit;
1386 }
1387 \f
1388 /* Skip COUNT insns from INSN, counting library calls as 1 insn. */
1389
1390 static rtx
1391 skip_consec_insns (rtx insn, int count)
1392 {
1393 for (; count > 0; count--)
1394 {
1395 rtx temp;
1396
1397 /* If first insn of libcall sequence, skip to end. */
1398 /* Do this at start of loop, since INSN is guaranteed to
1399 be an insn here. */
1400 if (GET_CODE (insn) != NOTE
1401 && (temp = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
1402 insn = XEXP (temp, 0);
1403
1404 do
1405 insn = NEXT_INSN (insn);
1406 while (GET_CODE (insn) == NOTE);
1407 }
1408
1409 return insn;
1410 }
1411
1412 /* Ignore any movable whose insn falls within a libcall
1413 which is part of another movable.
1414 We make use of the fact that the movable for the libcall value
1415 was made later and so appears later on the chain. */
1416
1417 static void
1418 ignore_some_movables (struct loop_movables *movables)
1419 {
1420 struct movable *m, *m1;
1421
1422 for (m = movables->head; m; m = m->next)
1423 {
1424 /* Is this a movable for the value of a libcall? */
1425 rtx note = find_reg_note (m->insn, REG_RETVAL, NULL_RTX);
1426 if (note)
1427 {
1428 rtx insn;
1429 /* Check for earlier movables inside that range,
1430 and mark them invalid. We cannot use LUIDs here because
1431 insns created by loop.c for prior loops don't have LUIDs.
1432 Rather than reject all such insns from movables, we just
1433 explicitly check each insn in the libcall (since invariant
1434 libcalls aren't that common). */
1435 for (insn = XEXP (note, 0); insn != m->insn; insn = NEXT_INSN (insn))
1436 for (m1 = movables->head; m1 != m; m1 = m1->next)
1437 if (m1->insn == insn)
1438 m1->done = 1;
1439 }
1440 }
1441 }
1442
1443 /* For each movable insn, see if the reg that it loads
1444 leads, when it dies, right into another conditionally movable insn.
1445 If so, record that the second insn "forces" the first one,
1446 since the second can be moved only if the first is. */
1447
1448 static void
1449 force_movables (struct loop_movables *movables)
1450 {
1451 struct movable *m, *m1;
1452
1453 for (m1 = movables->head; m1; m1 = m1->next)
1454 /* Omit this if moving just the (SET (REG) 0) of a zero-extend. */
1455 if (!m1->partial && !m1->done)
1456 {
1457 int regno = m1->regno;
1458 for (m = m1->next; m; m = m->next)
1459 /* ??? Could this be a bug? What if CSE caused the
1460 register of M1 to be used after this insn?
1461 Since CSE does not update regno_last_uid,
1462 this insn M->insn might not be where it dies.
1463 But very likely this doesn't matter; what matters is
1464 that M's reg is computed from M1's reg. */
1465 if (INSN_UID (m->insn) == REGNO_LAST_UID (regno)
1466 && !m->done)
1467 break;
1468 if (m != 0 && m->set_src == m1->set_dest
1469 /* If m->consec, m->set_src isn't valid. */
1470 && m->consec == 0)
1471 m = 0;
1472
1473 /* Increase the priority of moving the first insn
1474 since it permits the second to be moved as well.
1475 Likewise for insns already forced by the first insn. */
1476 if (m != 0)
1477 {
1478 struct movable *m2;
1479
1480 m->forces = m1;
1481 for (m2 = m1; m2; m2 = m2->forces)
1482 {
1483 m2->lifetime += m->lifetime;
1484 m2->savings += m->savings;
1485 }
1486 }
1487 }
1488 }
1489 \f
1490 /* Find invariant expressions that are equal and can be combined into
1491 one register. */
1492
1493 static void
1494 combine_movables (struct loop_movables *movables, struct loop_regs *regs)
1495 {
1496 struct movable *m;
1497 char *matched_regs = xmalloc (regs->num);
1498 enum machine_mode mode;
1499
1500 /* Regs that are set more than once are not allowed to match
1501 or be matched. I'm no longer sure why not. */
1502 /* Only pseudo registers are allowed to match or be matched,
1503 since move_movables does not validate the change. */
1504 /* Perhaps testing m->consec_sets would be more appropriate here? */
1505
1506 for (m = movables->head; m; m = m->next)
1507 if (m->match == 0 && regs->array[m->regno].n_times_set == 1
1508 && m->regno >= FIRST_PSEUDO_REGISTER
1509 && !m->insert_temp
1510 && !m->partial)
1511 {
1512 struct movable *m1;
1513 int regno = m->regno;
1514
1515 memset (matched_regs, 0, regs->num);
1516 matched_regs[regno] = 1;
1517
1518 /* We want later insns to match the first one. Don't make the first
1519 one match any later ones. So start this loop at m->next. */
1520 for (m1 = m->next; m1; m1 = m1->next)
1521 if (m != m1 && m1->match == 0
1522 && !m1->insert_temp
1523 && regs->array[m1->regno].n_times_set == 1
1524 && m1->regno >= FIRST_PSEUDO_REGISTER
1525 /* A reg used outside the loop mustn't be eliminated. */
1526 && !m1->global
1527 /* A reg used for zero-extending mustn't be eliminated. */
1528 && !m1->partial
1529 && (matched_regs[m1->regno]
1530 ||
1531 (
1532 /* Can combine regs with different modes loaded from the
1533 same constant only if the modes are the same or
1534 if both are integer modes with M wider or the same
1535 width as M1. The check for integer is redundant, but
1536 safe, since the only case of differing destination
1537 modes with equal sources is when both sources are
1538 VOIDmode, i.e., CONST_INT. */
1539 (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest)
1540 || (GET_MODE_CLASS (GET_MODE (m->set_dest)) == MODE_INT
1541 && GET_MODE_CLASS (GET_MODE (m1->set_dest)) == MODE_INT
1542 && (GET_MODE_BITSIZE (GET_MODE (m->set_dest))
1543 >= GET_MODE_BITSIZE (GET_MODE (m1->set_dest)))))
1544 /* See if the source of M1 says it matches M. */
1545 && ((GET_CODE (m1->set_src) == REG
1546 && matched_regs[REGNO (m1->set_src)])
1547 || rtx_equal_for_loop_p (m->set_src, m1->set_src,
1548 movables, regs))))
1549 && ((m->dependencies == m1->dependencies)
1550 || rtx_equal_p (m->dependencies, m1->dependencies)))
1551 {
1552 m->lifetime += m1->lifetime;
1553 m->savings += m1->savings;
1554 m1->done = 1;
1555 m1->match = m;
1556 matched_regs[m1->regno] = 1;
1557 }
1558 }
1559
1560 /* Now combine the regs used for zero-extension.
1561 This can be done for those not marked `global'
1562 provided their lives don't overlap. */
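/* The overlap test below is an interval check on luids: a movable M may
   join the group headed by M0 only if the range
   [REGNO_FIRST_LUID (M->regno), REGNO_LAST_LUID (M->regno)] is disjoint
   from the range of M0 and of every register already combined with M0.  */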
1563
1564 for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != VOIDmode;
1565 mode = GET_MODE_WIDER_MODE (mode))
1566 {
1567 struct movable *m0 = 0;
1568
1569 /* Combine all the registers for extension from mode MODE.
1570 Don't combine any that are used outside this loop. */
1571 for (m = movables->head; m; m = m->next)
1572 if (m->partial && ! m->global
1573 && mode == GET_MODE (SET_SRC (PATTERN (NEXT_INSN (m->insn)))))
1574 {
1575 struct movable *m1;
1576
1577 int first = REGNO_FIRST_LUID (m->regno);
1578 int last = REGNO_LAST_LUID (m->regno);
1579
1580 if (m0 == 0)
1581 {
1582 /* First one: don't check for overlap, just record it. */
1583 m0 = m;
1584 continue;
1585 }
1586
1587 /* Make sure they extend to the same mode.
1588 (Almost always true.) */
1589 if (GET_MODE (m->set_dest) != GET_MODE (m0->set_dest))
1590 continue;
1591
1592 /* We already have one: check for overlap with those
1593 already combined together. */
1594 for (m1 = movables->head; m1 != m; m1 = m1->next)
1595 if (m1 == m0 || (m1->partial && m1->match == m0))
1596 if (! (REGNO_FIRST_LUID (m1->regno) > last
1597 || REGNO_LAST_LUID (m1->regno) < first))
1598 goto overlap;
1599
1600 /* No overlap: we can combine this with the others. */
1601 m0->lifetime += m->lifetime;
1602 m0->savings += m->savings;
1603 m->done = 1;
1604 m->match = m0;
1605
1606 overlap:
1607 ;
1608 }
1609 }
1610
1611 /* Clean up. */
1612 free (matched_regs);
1613 }
1614
1615 /* Returns the number of movable instructions in LOOP that were not
1616 moved outside the loop. */
1617
1618 static int
1619 num_unmoved_movables (const struct loop *loop)
1620 {
1621 int num = 0;
1622 struct movable *m;
1623
1624 for (m = LOOP_MOVABLES (loop)->head; m; m = m->next)
1625 if (!m->done)
1626 ++num;
1627
1628 return num;
1629 }
1630
1631 \f
1632 /* Return 1 if regs X and Y will become the same if moved. */
1633
1634 static int
1635 regs_match_p (rtx x, rtx y, struct loop_movables *movables)
1636 {
1637 unsigned int xn = REGNO (x);
1638 unsigned int yn = REGNO (y);
1639 struct movable *mx, *my;
1640
1641 for (mx = movables->head; mx; mx = mx->next)
1642 if (mx->regno == xn)
1643 break;
1644
1645 for (my = movables->head; my; my = my->next)
1646 if (my->regno == yn)
1647 break;
1648
1649 return (mx && my
1650 && ((mx->match == my->match && mx->match != 0)
1651 || mx->match == my
1652 || mx == my->match));
1653 }
1654
1655 /* Return 1 if X and Y are identical-looking rtx's.
1656 This is the Lisp function EQUAL for rtx arguments.
1657
1658 If two registers are matching movables or a movable register and an
1659 equivalent constant, consider them equal. */
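/* For illustration (register numbers hypothetical): if pseudo 101 is a
   movable whose replacement insn loads (const_int 42), then
   (plus:SI (reg:SI 101) (reg:SI 200)) and
   (plus:SI (const_int 42) (reg:SI 200))
   are treated as equal here, although rtx_equal_p would reject them.  */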
1660
1661 static int
1662 rtx_equal_for_loop_p (rtx x, rtx y, struct loop_movables *movables,
1663 struct loop_regs *regs)
1664 {
1665 int i;
1666 int j;
1667 struct movable *m;
1668 enum rtx_code code;
1669 const char *fmt;
1670
1671 if (x == y)
1672 return 1;
1673 if (x == 0 || y == 0)
1674 return 0;
1675
1676 code = GET_CODE (x);
1677
1678 /* If we have a register and a constant, they may sometimes be
1679 equal. */
1680 if (GET_CODE (x) == REG && regs->array[REGNO (x)].set_in_loop == -2
1681 && CONSTANT_P (y))
1682 {
1683 for (m = movables->head; m; m = m->next)
1684 if (m->move_insn && m->regno == REGNO (x)
1685 && rtx_equal_p (m->set_src, y))
1686 return 1;
1687 }
1688 else if (GET_CODE (y) == REG && regs->array[REGNO (y)].set_in_loop == -2
1689 && CONSTANT_P (x))
1690 {
1691 for (m = movables->head; m; m = m->next)
1692 if (m->move_insn && m->regno == REGNO (y)
1693 && rtx_equal_p (m->set_src, x))
1694 return 1;
1695 }
1696
1697 /* Otherwise, rtx's of different codes cannot be equal. */
1698 if (code != GET_CODE (y))
1699 return 0;
1700
1701 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
1702 (REG:SI x) and (REG:HI x) are NOT equivalent. */
1703
1704 if (GET_MODE (x) != GET_MODE (y))
1705 return 0;
1706
1707 /* These three types of rtx's can be compared nonrecursively. */
1708 if (code == REG)
1709 return (REGNO (x) == REGNO (y) || regs_match_p (x, y, movables));
1710
1711 if (code == LABEL_REF)
1712 return XEXP (x, 0) == XEXP (y, 0);
1713 if (code == SYMBOL_REF)
1714 return XSTR (x, 0) == XSTR (y, 0);
1715
1716 /* Compare the elements. If any pair of corresponding elements
1717 fails to match, return 0 for the whole thing. */
1718
1719 fmt = GET_RTX_FORMAT (code);
1720 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1721 {
1722 switch (fmt[i])
1723 {
1724 case 'w':
1725 if (XWINT (x, i) != XWINT (y, i))
1726 return 0;
1727 break;
1728
1729 case 'i':
1730 if (XINT (x, i) != XINT (y, i))
1731 return 0;
1732 break;
1733
1734 case 'E':
1735 /* Two vectors must have the same length. */
1736 if (XVECLEN (x, i) != XVECLEN (y, i))
1737 return 0;
1738
1739 /* And the corresponding elements must match. */
1740 for (j = 0; j < XVECLEN (x, i); j++)
1741 if (rtx_equal_for_loop_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
1742 movables, regs) == 0)
1743 return 0;
1744 break;
1745
1746 case 'e':
1747 if (rtx_equal_for_loop_p (XEXP (x, i), XEXP (y, i), movables, regs)
1748 == 0)
1749 return 0;
1750 break;
1751
1752 case 's':
1753 if (strcmp (XSTR (x, i), XSTR (y, i)))
1754 return 0;
1755 break;
1756
1757 case 'u':
1758 /* These are just backpointers, so they don't matter. */
1759 break;
1760
1761 case '0':
1762 break;
1763
1764 /* It is believed that rtx's at this level will never
1765 contain anything but integers and other rtx's,
1766 except for within LABEL_REFs and SYMBOL_REFs. */
1767 default:
1768 abort ();
1769 }
1770 }
1771 return 1;
1772 }
1773 \f
1774 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to all
1775 insns in INSNS which use the reference. LABEL_NUSES for CODE_LABEL
1776 references is incremented once for each added note. */
1777
1778 static void
1779 add_label_notes (rtx x, rtx insns)
1780 {
1781 enum rtx_code code = GET_CODE (x);
1782 int i, j;
1783 const char *fmt;
1784 rtx insn;
1785
1786 if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
1787 {
1788 /* This code used to ignore labels that referred to dispatch tables to
1789 avoid flow generating (slightly) worse code.
1790
1791 We no longer ignore such label references (see LABEL_REF handling in
1792 mark_jump_label for additional information). */
1793 for (insn = insns; insn; insn = NEXT_INSN (insn))
1794 if (reg_mentioned_p (XEXP (x, 0), insn))
1795 {
1796 REG_NOTES (insn) = gen_rtx_INSN_LIST (REG_LABEL, XEXP (x, 0),
1797 REG_NOTES (insn));
1798 if (LABEL_P (XEXP (x, 0)))
1799 LABEL_NUSES (XEXP (x, 0))++;
1800 }
1801 }
1802
1803 fmt = GET_RTX_FORMAT (code);
1804 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1805 {
1806 if (fmt[i] == 'e')
1807 add_label_notes (XEXP (x, i), insns);
1808 else if (fmt[i] == 'E')
1809 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
1810 add_label_notes (XVECEXP (x, i, j), insns);
1811 }
1812 }
1813 \f
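/* Rough sketch of the effect of move_movables (hypothetical source): the
   invariant product `k * stride' below is computed once before the loop
   rather than on every iteration, roughly as if the source had read
   `tmp = k * stride;' before the loop and used `tmp' inside it.  */
#if 0
static void
move_movables_example (int *dst, const int *src, int n, int k, int stride)
{
  int i;

  for (i = 0; i < n; i++)
    dst[i] = src[i] + k * stride; /* `k * stride' is hoisted */
}
#endif
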
1814 /* Scan MOVABLES, and move the insns that deserve to be moved.
1815 If two matching movables are combined, replace one reg with the
1816 other throughout. */
1817
1818 static void
1819 move_movables (struct loop *loop, struct loop_movables *movables,
1820 int threshold, int insn_count)
1821 {
1822 struct loop_regs *regs = LOOP_REGS (loop);
1823 int nregs = regs->num;
1824 rtx new_start = 0;
1825 struct movable *m;
1826 rtx p;
1827 rtx loop_start = loop->start;
1828 rtx loop_end = loop->end;
1829 /* Map of pseudo-register replacements to handle combining
1830 when we move several insns that load the same value
1831 into different pseudo-registers. */
1832 rtx *reg_map = xcalloc (nregs, sizeof (rtx));
1833 char *already_moved = xcalloc (nregs, sizeof (char));
1834
1835 for (m = movables->head; m; m = m->next)
1836 {
1837 /* Describe this movable insn. */
1838
1839 if (loop_dump_stream)
1840 {
1841 fprintf (loop_dump_stream, "Insn %d: regno %d (life %d), ",
1842 INSN_UID (m->insn), m->regno, m->lifetime);
1843 if (m->consec > 0)
1844 fprintf (loop_dump_stream, "consec %d, ", m->consec);
1845 if (m->cond)
1846 fprintf (loop_dump_stream, "cond ");
1847 if (m->force)
1848 fprintf (loop_dump_stream, "force ");
1849 if (m->global)
1850 fprintf (loop_dump_stream, "global ");
1851 if (m->done)
1852 fprintf (loop_dump_stream, "done ");
1853 if (m->move_insn)
1854 fprintf (loop_dump_stream, "move-insn ");
1855 if (m->match)
1856 fprintf (loop_dump_stream, "matches %d ",
1857 INSN_UID (m->match->insn));
1858 if (m->forces)
1859 fprintf (loop_dump_stream, "forces %d ",
1860 INSN_UID (m->forces->insn));
1861 }
1862
1863 /* Ignore the insn if it's already done (it matched something else).
1864 Otherwise, see if it is now safe to move. */
1865
1866 if (!m->done
1867 && (! m->cond
1868 || (1 == loop_invariant_p (loop, m->set_src)
1869 && (m->dependencies == 0
1870 || 1 == loop_invariant_p (loop, m->dependencies))
1871 && (m->consec == 0
1872 || 1 == consec_sets_invariant_p (loop, m->set_dest,
1873 m->consec + 1,
1874 m->insn))))
1875 && (! m->forces || m->forces->done))
1876 {
1877 int regno;
1878 rtx p;
1879 int savings = m->savings;
1880
1881 /* We have an insn that is safe to move.
1882 Compute its desirability. */
1883
1884 p = m->insn;
1885 regno = m->regno;
1886
1887 if (loop_dump_stream)
1888 fprintf (loop_dump_stream, "savings %d ", savings);
1889
1890 if (regs->array[regno].moved_once && loop_dump_stream)
1891 fprintf (loop_dump_stream, "halved since already moved ");
1892
1893 /* An insn MUST be moved if we already moved something else
1894 which is safe only if this one is moved too: that is,
1895 if already_moved[REGNO] is nonzero. */
1896
1897 /* An insn is desirable to move if the new lifetime of the
1898 register is no more than THRESHOLD times the old lifetime.
1899 If it's not desirable, it means the loop is so big
1900 that moving won't speed things up much,
1901 and it is liable to make register usage worse. */
1902
1903 /* It is also desirable to move if it can be moved at no
1904 extra cost because something else was already moved. */
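/* For example (purely illustrative numbers): with THRESHOLD 4, SAVINGS 2
   and a register lifetime of 10 the product is 80, so the move is taken
   for loops of up to 80 insns; if the register was already moved out of
   another loop (moved_once), the requirement doubles and only loops of
   up to 40 insns qualify.  */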
1905
1906 if (already_moved[regno]
1907 || flag_move_all_movables
1908 || (threshold * savings * m->lifetime) >=
1909 (regs->array[regno].moved_once ? insn_count * 2 : insn_count)
1910 || (m->forces && m->forces->done
1911 && regs->array[m->forces->regno].n_times_set == 1))
1912 {
1913 int count;
1914 struct movable *m1;
1915 rtx first = NULL_RTX;
1916 rtx newreg = NULL_RTX;
1917
1918 if (m->insert_temp)
1919 newreg = gen_reg_rtx (GET_MODE (m->set_dest));
1920
1921 /* Now move the insns that set the reg. */
1922
1923 if (m->partial && m->match)
1924 {
1925 rtx newpat, i1;
1926 rtx r1, r2;
1927 /* Find the end of this chain of matching regs.
1928 Thus, we load each reg in the chain from that one reg.
1929 And that reg is loaded with 0 directly,
1930 since it has ->match == 0. */
1931 for (m1 = m; m1->match; m1 = m1->match);
1932 newpat = gen_move_insn (SET_DEST (PATTERN (m->insn)),
1933 SET_DEST (PATTERN (m1->insn)));
1934 i1 = loop_insn_hoist (loop, newpat);
1935
1936 /* Mark the moved, invariant reg as being allowed to
1937 share a hard reg with the other matching invariant. */
1938 REG_NOTES (i1) = REG_NOTES (m->insn);
1939 r1 = SET_DEST (PATTERN (m->insn));
1940 r2 = SET_DEST (PATTERN (m1->insn));
1941 regs_may_share
1942 = gen_rtx_EXPR_LIST (VOIDmode, r1,
1943 gen_rtx_EXPR_LIST (VOIDmode, r2,
1944 regs_may_share));
1945 delete_insn (m->insn);
1946
1947 if (new_start == 0)
1948 new_start = i1;
1949
1950 if (loop_dump_stream)
1951 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
1952 }
1953 /* If we are to re-generate the item being moved with a
1954 new move insn, first delete what we have and then emit
1955 the move insn before the loop. */
1956 else if (m->move_insn)
1957 {
1958 rtx i1, temp, seq;
1959
1960 for (count = m->consec; count >= 0; count--)
1961 {
1962 /* If this is the first insn of a library call sequence,
1963 something is very wrong. */
1964 if (GET_CODE (p) != NOTE
1965 && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
1966 abort ();
1967
1968 /* If this is the last insn of a libcall sequence, then
1969 delete every insn in the sequence except the last.
1970 The last insn is handled in the normal manner. */
1971 if (GET_CODE (p) != NOTE
1972 && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
1973 {
1974 temp = XEXP (temp, 0);
1975 while (temp != p)
1976 temp = delete_insn (temp);
1977 }
1978
1979 temp = p;
1980 p = delete_insn (p);
1981
1982 /* simplify_giv_expr expects that it can walk the insns
1983 at m->insn forwards and see this old sequence we are
1984 tossing here. delete_insn does preserve the next
1985 pointers, but when we skip over a NOTE we must fix
1986 it up. Otherwise that code walks into the non-deleted
1987 insn stream. */
1988 while (p && GET_CODE (p) == NOTE)
1989 p = NEXT_INSN (temp) = NEXT_INSN (p);
1990
1991 if (m->insert_temp)
1992 {
1993 /* Replace the original insn with a move from
1994 our newly created temp. */
1995 start_sequence ();
1996 emit_move_insn (m->set_dest, newreg);
1997 seq = get_insns ();
1998 end_sequence ();
1999 emit_insn_before (seq, p);
2000 }
2001 }
2002
2003 start_sequence ();
2004 emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2005 m->set_src);
2006 seq = get_insns ();
2007 end_sequence ();
2008
2009 add_label_notes (m->set_src, seq);
2010
2011 i1 = loop_insn_hoist (loop, seq);
2012 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2013 set_unique_reg_note (i1,
2014 m->is_equiv ? REG_EQUIV : REG_EQUAL,
2015 m->set_src);
2016
2017 if (loop_dump_stream)
2018 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
2019
2020 /* The more regs we move, the less we like moving them. */
2021 threshold -= 3;
2022 }
2023 else
2024 {
2025 for (count = m->consec; count >= 0; count--)
2026 {
2027 rtx i1, temp;
2028
2029 /* If first insn of libcall sequence, skip to end. */
2030 /* Do this at start of loop, since p is guaranteed to
2031 be an insn here. */
2032 if (GET_CODE (p) != NOTE
2033 && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
2034 p = XEXP (temp, 0);
2035
2036 /* If last insn of libcall sequence, move all
2037 insns except the last before the loop. The last
2038 insn is handled in the normal manner. */
2039 if (GET_CODE (p) != NOTE
2040 && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
2041 {
2042 rtx fn_address = 0;
2043 rtx fn_reg = 0;
2044 rtx fn_address_insn = 0;
2045
2046 first = 0;
2047 for (temp = XEXP (temp, 0); temp != p;
2048 temp = NEXT_INSN (temp))
2049 {
2050 rtx body;
2051 rtx n;
2052 rtx next;
2053
2054 if (GET_CODE (temp) == NOTE)
2055 continue;
2056
2057 body = PATTERN (temp);
2058
2059 /* Find the next insn after TEMP,
2060 not counting USE or NOTE insns. */
2061 for (next = NEXT_INSN (temp); next != p;
2062 next = NEXT_INSN (next))
2063 if (! (GET_CODE (next) == INSN
2064 && GET_CODE (PATTERN (next)) == USE)
2065 && GET_CODE (next) != NOTE)
2066 break;
2067
2068 /* If that is the call, this may be the insn
2069 that loads the function address.
2070
2071 Extract the function address from the insn
2072 that loads it into a register.
2073 If this insn was cse'd, we get incorrect code.
2074
2075 So emit a new move insn that copies the
2076 function address into the register that the
2077 call insn will use. flow.c will delete any
2078 redundant stores that we have created. */
2079 if (GET_CODE (next) == CALL_INSN
2080 && GET_CODE (body) == SET
2081 && GET_CODE (SET_DEST (body)) == REG
2082 && (n = find_reg_note (temp, REG_EQUAL,
2083 NULL_RTX)))
2084 {
2085 fn_reg = SET_SRC (body);
2086 if (GET_CODE (fn_reg) != REG)
2087 fn_reg = SET_DEST (body);
2088 fn_address = XEXP (n, 0);
2089 fn_address_insn = temp;
2090 }
2091 /* We have the call insn.
2092 If it uses the register we suspect it might,
2093 load it with the correct address directly. */
2094 if (GET_CODE (temp) == CALL_INSN
2095 && fn_address != 0
2096 && reg_referenced_p (fn_reg, body))
2097 loop_insn_emit_after (loop, 0, fn_address_insn,
2098 gen_move_insn
2099 (fn_reg, fn_address));
2100
2101 if (GET_CODE (temp) == CALL_INSN)
2102 {
2103 i1 = loop_call_insn_hoist (loop, body);
2104 /* Because the USAGE information potentially
2105 contains objects other than hard registers
2106 we need to copy it. */
2107 if (CALL_INSN_FUNCTION_USAGE (temp))
2108 CALL_INSN_FUNCTION_USAGE (i1)
2109 = copy_rtx (CALL_INSN_FUNCTION_USAGE (temp));
2110 }
2111 else
2112 i1 = loop_insn_hoist (loop, body);
2113 if (first == 0)
2114 first = i1;
2115 if (temp == fn_address_insn)
2116 fn_address_insn = i1;
2117 REG_NOTES (i1) = REG_NOTES (temp);
2118 REG_NOTES (temp) = NULL;
2119 delete_insn (temp);
2120 }
2121 if (new_start == 0)
2122 new_start = first;
2123 }
2124 if (m->savemode != VOIDmode)
2125 {
2126 /* P sets REG to zero; but we should clear only
2127 the bits that are not covered by the mode
2128 m->savemode. */
2129 rtx reg = m->set_dest;
2130 rtx sequence;
2131 rtx tem;
2132
2133 start_sequence ();
2134 tem = expand_simple_binop
2135 (GET_MODE (reg), AND, reg,
2136 GEN_INT ((((HOST_WIDE_INT) 1
2137 << GET_MODE_BITSIZE (m->savemode)))
2138 - 1),
2139 reg, 1, OPTAB_LIB_WIDEN);
2140 if (tem == 0)
2141 abort ();
2142 if (tem != reg)
2143 emit_move_insn (reg, tem);
2144 sequence = get_insns ();
2145 end_sequence ();
2146 i1 = loop_insn_hoist (loop, sequence);
2147 }
2148 else if (GET_CODE (p) == CALL_INSN)
2149 {
2150 i1 = loop_call_insn_hoist (loop, PATTERN (p));
2151 /* Because the USAGE information potentially
2152 contains objects other than hard registers
2153 we need to copy it. */
2154 if (CALL_INSN_FUNCTION_USAGE (p))
2155 CALL_INSN_FUNCTION_USAGE (i1)
2156 = copy_rtx (CALL_INSN_FUNCTION_USAGE (p));
2157 }
2158 else if (count == m->consec && m->move_insn_first)
2159 {
2160 rtx seq;
2161 /* The SET_SRC might not be invariant, so we must
2162 use the REG_EQUAL note. */
2163 start_sequence ();
2164 emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2165 m->set_src);
2166 seq = get_insns ();
2167 end_sequence ();
2168
2169 add_label_notes (m->set_src, seq);
2170
2171 i1 = loop_insn_hoist (loop, seq);
2172 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2173 set_unique_reg_note (i1, m->is_equiv ? REG_EQUIV
2174 : REG_EQUAL, m->set_src);
2175 }
2176 else if (m->insert_temp)
2177 {
2178 rtx *reg_map2 = xcalloc (REGNO (newreg),
2179 sizeof(rtx));
2180 reg_map2 [m->regno] = newreg;
2181
2182 i1 = loop_insn_hoist (loop, copy_rtx (PATTERN (p)));
2183 replace_regs (i1, reg_map2, REGNO (newreg), 1);
2184 free (reg_map2);
2185 }
2186 else
2187 i1 = loop_insn_hoist (loop, PATTERN (p));
2188
2189 if (REG_NOTES (i1) == 0)
2190 {
2191 REG_NOTES (i1) = REG_NOTES (p);
2192 REG_NOTES (p) = NULL;
2193
2194 /* If there is a REG_EQUAL note present whose value
2195 is not loop invariant, then delete it, since it
2196 may cause problems with later optimization passes.
2197 It is possible for cse to create such notes
2198 like this as a result of record_jump_cond. */
2199
2200 if ((temp = find_reg_note (i1, REG_EQUAL, NULL_RTX))
2201 && ! loop_invariant_p (loop, XEXP (temp, 0)))
2202 remove_note (i1, temp);
2203 }
2204
2205 if (new_start == 0)
2206 new_start = i1;
2207
2208 if (loop_dump_stream)
2209 fprintf (loop_dump_stream, " moved to %d",
2210 INSN_UID (i1));
2211
2212 /* If library call, now fix the REG_NOTES that contain
2213 insn pointers, namely REG_LIBCALL on FIRST
2214 and REG_RETVAL on I1. */
2215 if ((temp = find_reg_note (i1, REG_RETVAL, NULL_RTX)))
2216 {
2217 XEXP (temp, 0) = first;
2218 temp = find_reg_note (first, REG_LIBCALL, NULL_RTX);
2219 XEXP (temp, 0) = i1;
2220 }
2221
2222 temp = p;
2223 delete_insn (p);
2224 p = NEXT_INSN (p);
2225
2226 /* simplify_giv_expr expects that it can walk the insns
2227 at m->insn forwards and see this old sequence we are
2228 tossing here. delete_insn does preserve the next
2229 pointers, but when we skip over a NOTE we must fix
2230 it up. Otherwise that code walks into the non-deleted
2231 insn stream. */
2232 while (p && GET_CODE (p) == NOTE)
2233 p = NEXT_INSN (temp) = NEXT_INSN (p);
2234
2235 if (m->insert_temp)
2236 {
2237 rtx seq;
2238 /* Replace the original insn with a move from
2239 our newly created temp. */
2240 start_sequence ();
2241 emit_move_insn (m->set_dest, newreg);
2242 seq = get_insns ();
2243 end_sequence ();
2244 emit_insn_before (seq, p);
2245 }
2246 }
2247
2248 /* The more regs we move, the less we like moving them. */
2249 threshold -= 3;
2250 }
2251
2252 m->done = 1;
2253
2254 if (!m->insert_temp)
2255 {
2256 /* Any other movable that loads the same register
2257 MUST be moved. */
2258 already_moved[regno] = 1;
2259
2260 /* This reg has been moved out of one loop. */
2261 regs->array[regno].moved_once = 1;
2262
2263 /* The reg set here is now invariant. */
2264 if (! m->partial)
2265 {
2266 int i;
2267 for (i = 0; i < LOOP_REGNO_NREGS (regno, m->set_dest); i++)
2268 regs->array[regno+i].set_in_loop = 0;
2269 }
2270
2271 /* Change the length-of-life info for the register
2272 to say it lives at least the full length of this loop.
2273 This will help guide optimizations in outer loops. */
2274
2275 if (REGNO_FIRST_LUID (regno) > INSN_LUID (loop_start))
2276 /* This is the old insn before all the moved insns.
2277 We can't use the moved insn because it is out of range
2278 in uid_luid. Only the old insns have luids. */
2279 REGNO_FIRST_UID (regno) = INSN_UID (loop_start);
2280 if (REGNO_LAST_LUID (regno) < INSN_LUID (loop_end))
2281 REGNO_LAST_UID (regno) = INSN_UID (loop_end);
2282 }
2283
2284 /* Combine with this moved insn any other matching movables. */
2285
2286 if (! m->partial)
2287 for (m1 = movables->head; m1; m1 = m1->next)
2288 if (m1->match == m)
2289 {
2290 rtx temp;
2291
2292 /* Schedule the reg loaded by M1
2293 for replacement so that it shares the reg of M.
2294 If the modes differ (only possible in restricted
2295 circumstances), make a SUBREG.
2296
2297 Note this assumes that the target dependent files
2298 treat REG and SUBREG equally, including within
2299 GO_IF_LEGITIMATE_ADDRESS and in all the
2300 predicates since we never verify that replacing the
2301 original register with a SUBREG results in a
2302 recognizable insn. */
2303 if (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest))
2304 reg_map[m1->regno] = m->set_dest;
2305 else
2306 reg_map[m1->regno]
2307 = gen_lowpart_common (GET_MODE (m1->set_dest),
2308 m->set_dest);
2309
2310 /* Get rid of the matching insn
2311 and prevent further processing of it. */
2312 m1->done = 1;
2313
2314 /* If library call, delete all insns. */
2315 if ((temp = find_reg_note (m1->insn, REG_RETVAL,
2316 NULL_RTX)))
2317 delete_insn_chain (XEXP (temp, 0), m1->insn);
2318 else
2319 delete_insn (m1->insn);
2320
2321 /* Any other movable that loads the same register
2322 MUST be moved. */
2323 already_moved[m1->regno] = 1;
2324
2325 /* The reg merged here is now invariant,
2326 if the reg it matches is invariant. */
2327 if (! m->partial)
2328 {
2329 int i;
2330 for (i = 0;
2331 i < LOOP_REGNO_NREGS (regno, m1->set_dest);
2332 i++)
2333 regs->array[m1->regno+i].set_in_loop = 0;
2334 }
2335 }
2336 }
2337 else if (loop_dump_stream)
2338 fprintf (loop_dump_stream, "not desirable");
2339 }
2340 else if (loop_dump_stream && !m->match)
2341 fprintf (loop_dump_stream, "not safe");
2342
2343 if (loop_dump_stream)
2344 fprintf (loop_dump_stream, "\n");
2345 }
2346
2347 if (new_start == 0)
2348 new_start = loop_start;
2349
2350 /* Go through all the instructions in the loop, making
2351 all the register substitutions scheduled in REG_MAP. */
2352 for (p = new_start; p != loop_end; p = NEXT_INSN (p))
2353 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
2354 || GET_CODE (p) == CALL_INSN)
2355 {
2356 replace_regs (PATTERN (p), reg_map, nregs, 0);
2357 replace_regs (REG_NOTES (p), reg_map, nregs, 0);
2358 INSN_CODE (p) = -1;
2359 }
2360
2361 /* Clean up. */
2362 free (reg_map);
2363 free (already_moved);
2364 }
2365
2366
2367 static void
2368 loop_movables_add (struct loop_movables *movables, struct movable *m)
2369 {
2370 if (movables->head == 0)
2371 movables->head = m;
2372 else
2373 movables->last->next = m;
2374 movables->last = m;
2375 }
2376
2377
2378 static void
2379 loop_movables_free (struct loop_movables *movables)
2380 {
2381 struct movable *m;
2382 struct movable *m_next;
2383
2384 for (m = movables->head; m; m = m_next)
2385 {
2386 m_next = m->next;
2387 free (m);
2388 }
2389 }
2390 \f
2391 #if 0
2392 /* Scan X and replace the address of any MEM in it with ADDR.
2393 REG is the address that MEM should have before the replacement. */
2394
2395 static void
2396 replace_call_address (rtx x, rtx reg, rtx addr)
2397 {
2398 enum rtx_code code;
2399 int i;
2400 const char *fmt;
2401
2402 if (x == 0)
2403 return;
2404 code = GET_CODE (x);
2405 switch (code)
2406 {
2407 case PC:
2408 case CC0:
2409 case CONST_INT:
2410 case CONST_DOUBLE:
2411 case CONST:
2412 case SYMBOL_REF:
2413 case LABEL_REF:
2414 case REG:
2415 return;
2416
2417 case SET:
2418 /* Short cut for very common case. */
2419 replace_call_address (XEXP (x, 1), reg, addr);
2420 return;
2421
2422 case CALL:
2423 /* Short cut for very common case. */
2424 replace_call_address (XEXP (x, 0), reg, addr);
2425 return;
2426
2427 case MEM:
2428 /* If this MEM uses a reg other than the one we expected,
2429 something is wrong. */
2430 if (XEXP (x, 0) != reg)
2431 abort ();
2432 XEXP (x, 0) = addr;
2433 return;
2434
2435 default:
2436 break;
2437 }
2438
2439 fmt = GET_RTX_FORMAT (code);
2440 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2441 {
2442 if (fmt[i] == 'e')
2443 replace_call_address (XEXP (x, i), reg, addr);
2444 else if (fmt[i] == 'E')
2445 {
2446 int j;
2447 for (j = 0; j < XVECLEN (x, i); j++)
2448 replace_call_address (XVECEXP (x, i, j), reg, addr);
2449 }
2450 }
2451 }
2452 #endif
2453 \f
2454 /* Return the number of memory refs to addresses that vary
2455 in the rtx X. */
2456
2457 static int
2458 count_nonfixed_reads (const struct loop *loop, rtx x)
2459 {
2460 enum rtx_code code;
2461 int i;
2462 const char *fmt;
2463 int value;
2464
2465 if (x == 0)
2466 return 0;
2467
2468 code = GET_CODE (x);
2469 switch (code)
2470 {
2471 case PC:
2472 case CC0:
2473 case CONST_INT:
2474 case CONST_DOUBLE:
2475 case CONST:
2476 case SYMBOL_REF:
2477 case LABEL_REF:
2478 case REG:
2479 return 0;
2480
2481 case MEM:
2482 return ((loop_invariant_p (loop, XEXP (x, 0)) != 1)
2483 + count_nonfixed_reads (loop, XEXP (x, 0)));
2484
2485 default:
2486 break;
2487 }
2488
2489 value = 0;
2490 fmt = GET_RTX_FORMAT (code);
2491 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2492 {
2493 if (fmt[i] == 'e')
2494 value += count_nonfixed_reads (loop, XEXP (x, i));
2495 if (fmt[i] == 'E')
2496 {
2497 int j;
2498 for (j = 0; j < XVECLEN (x, i); j++)
2499 value += count_nonfixed_reads (loop, XVECEXP (x, i, j));
2500 }
2501 }
2502 return value;
2503 }
2504 \f
2505 /* Scan a loop setting the elements `cont', `vtop', `loops_enclosed',
2506 `has_call', `has_nonconst_call', `has_volatile', `has_tablejump',
2507 `unknown_address_altered', `unknown_constant_address_altered', and
2508 `num_mem_sets' in LOOP. Also, fill in the array `mems' and the
2509 list `store_mems' in LOOP. */
2510
2511 static void
2512 prescan_loop (struct loop *loop)
2513 {
2514 int level = 1;
2515 rtx insn;
2516 struct loop_info *loop_info = LOOP_INFO (loop);
2517 rtx start = loop->start;
2518 rtx end = loop->end;
2519 /* The label after END. Jumping here is just like falling off the
2520 end of the loop. We use next_nonnote_insn instead of next_label
2521 as a hedge against the (pathological) case where some actual insn
2522 might end up between the two. */
2523 rtx exit_target = next_nonnote_insn (end);
2524
2525 loop_info->has_indirect_jump = indirect_jump_in_function;
2526 loop_info->pre_header_has_call = 0;
2527 loop_info->has_call = 0;
2528 loop_info->has_nonconst_call = 0;
2529 loop_info->has_prefetch = 0;
2530 loop_info->has_volatile = 0;
2531 loop_info->has_tablejump = 0;
2532 loop_info->has_multiple_exit_targets = 0;
2533 loop->level = 1;
2534
2535 loop_info->unknown_address_altered = 0;
2536 loop_info->unknown_constant_address_altered = 0;
2537 loop_info->store_mems = NULL_RTX;
2538 loop_info->first_loop_store_insn = NULL_RTX;
2539 loop_info->mems_idx = 0;
2540 loop_info->num_mem_sets = 0;
2541 /* If loop opts run twice, this was set on 1st pass for 2nd. */
2542 loop_info->preconditioned = NOTE_PRECONDITIONED (end);
2543
2544 for (insn = start; insn && GET_CODE (insn) != CODE_LABEL;
2545 insn = PREV_INSN (insn))
2546 {
2547 if (GET_CODE (insn) == CALL_INSN)
2548 {
2549 loop_info->pre_header_has_call = 1;
2550 break;
2551 }
2552 }
2553
2554 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2555 insn = NEXT_INSN (insn))
2556 {
2557 switch (GET_CODE (insn))
2558 {
2559 case NOTE:
2560 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
2561 {
2562 ++level;
2563 /* Count number of loops contained in this one. */
2564 loop->level++;
2565 }
2566 else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END)
2567 --level;
2568 break;
2569
2570 case CALL_INSN:
2571 if (! CONST_OR_PURE_CALL_P (insn))
2572 {
2573 loop_info->unknown_address_altered = 1;
2574 loop_info->has_nonconst_call = 1;
2575 }
2576 else if (pure_call_p (insn))
2577 loop_info->has_nonconst_call = 1;
2578 loop_info->has_call = 1;
2579 if (can_throw_internal (insn))
2580 loop_info->has_multiple_exit_targets = 1;
2581
2582 /* Calls initializing constant objects have CLOBBER of MEM /u in the
2583 attached FUNCTION_USAGE expression list, not accounted for by the
2584 code above. We should note these to avoid missing dependencies in
2585 later references. */
2586 {
2587 rtx fusage_entry;
2588
2589 for (fusage_entry = CALL_INSN_FUNCTION_USAGE (insn);
2590 fusage_entry; fusage_entry = XEXP (fusage_entry, 1))
2591 {
2592 rtx fusage = XEXP (fusage_entry, 0);
2593
2594 if (GET_CODE (fusage) == CLOBBER
2595 && GET_CODE (XEXP (fusage, 0)) == MEM
2596 && RTX_UNCHANGING_P (XEXP (fusage, 0)))
2597 {
2598 note_stores (fusage, note_addr_stored, loop_info);
2599 if (! loop_info->first_loop_store_insn
2600 && loop_info->store_mems)
2601 loop_info->first_loop_store_insn = insn;
2602 }
2603 }
2604 }
2605 break;
2606
2607 case JUMP_INSN:
2608 if (! loop_info->has_multiple_exit_targets)
2609 {
2610 rtx set = pc_set (insn);
2611
2612 if (set)
2613 {
2614 rtx src = SET_SRC (set);
2615 rtx label1, label2;
2616
2617 if (GET_CODE (src) == IF_THEN_ELSE)
2618 {
2619 label1 = XEXP (src, 1);
2620 label2 = XEXP (src, 2);
2621 }
2622 else
2623 {
2624 label1 = src;
2625 label2 = NULL_RTX;
2626 }
2627
2628 do
2629 {
2630 if (label1 && label1 != pc_rtx)
2631 {
2632 if (GET_CODE (label1) != LABEL_REF)
2633 {
2634 /* Something tricky. */
2635 loop_info->has_multiple_exit_targets = 1;
2636 break;
2637 }
2638 else if (XEXP (label1, 0) != exit_target
2639 && LABEL_OUTSIDE_LOOP_P (label1))
2640 {
2641 /* A jump outside the current loop. */
2642 loop_info->has_multiple_exit_targets = 1;
2643 break;
2644 }
2645 }
2646
2647 label1 = label2;
2648 label2 = NULL_RTX;
2649 }
2650 while (label1);
2651 }
2652 else
2653 {
2654 /* A return, or something tricky. */
2655 loop_info->has_multiple_exit_targets = 1;
2656 }
2657 }
2658 /* Fall through. */
2659
2660 case INSN:
2661 if (volatile_refs_p (PATTERN (insn)))
2662 loop_info->has_volatile = 1;
2663
2664 if (GET_CODE (insn) == JUMP_INSN
2665 && (GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
2666 || GET_CODE (PATTERN (insn)) == ADDR_VEC))
2667 loop_info->has_tablejump = 1;
2668
2669 note_stores (PATTERN (insn), note_addr_stored, loop_info);
2670 if (! loop_info->first_loop_store_insn && loop_info->store_mems)
2671 loop_info->first_loop_store_insn = insn;
2672
2673 if (flag_non_call_exceptions && can_throw_internal (insn))
2674 loop_info->has_multiple_exit_targets = 1;
2675 break;
2676
2677 default:
2678 break;
2679 }
2680 }
2681
2682 /* Now, rescan the loop, setting up the LOOP_MEMS array. */
2683 if (/* An exception thrown by a called function might land us
2684 anywhere. */
2685 ! loop_info->has_nonconst_call
2686 /* We don't want loads for MEMs moved to a location before the
2687 one at which their stack memory becomes allocated. (Note
2688 that this is not a problem for malloc, etc., since those
2689 require actual function calls.) */
2690 && ! current_function_calls_alloca
2691 /* There are ways to leave the loop other than falling off the
2692 end. */
2693 && ! loop_info->has_multiple_exit_targets)
2694 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2695 insn = NEXT_INSN (insn))
2696 for_each_rtx (&insn, insert_loop_mem, loop_info);
2697
2698 /* BLKmode MEMs are added to LOOP_STORE_MEM as necessary so
2699 that loop_invariant_p and load_mems can use true_dependence
2700 to determine what is really clobbered. */
2701 if (loop_info->unknown_address_altered)
2702 {
2703 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2704
2705 loop_info->store_mems
2706 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2707 }
2708 if (loop_info->unknown_constant_address_altered)
2709 {
2710 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2711
2712 RTX_UNCHANGING_P (mem) = 1;
2713 loop_info->store_mems
2714 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2715 }
2716 }
2717 \f
2718 /* Invalidate all loops containing LABEL. */
2719
2720 static void
2721 invalidate_loops_containing_label (rtx label)
2722 {
2723 struct loop *loop;
2724 for (loop = uid_loop[INSN_UID (label)]; loop; loop = loop->outer)
2725 loop->invalid = 1;
2726 }
2727
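/* Hypothetical example of a loop that gets marked invalid below: the
   `goto' enters the loop body from outside, so the loop has an entry
   point other than its head and cannot safely be optimized.  */
#if 0
static int
multiple_entry_example (int n, int enter_mid)
{
  int i = 0, sum = 0;

  if (enter_mid)
    goto inside;
  for (i = 0; i < n; i++)
    {
    inside:
      sum += i;
    }
  return sum;
}
#endif
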
2728 /* Scan the function looking for loops. Record the start and end of each loop.
2729 Also mark as invalid loops any loops that contain a setjmp or are branched
2730 to from outside the loop. */
2731
2732 static void
2733 find_and_verify_loops (rtx f, struct loops *loops)
2734 {
2735 rtx insn;
2736 rtx label;
2737 int num_loops;
2738 struct loop *current_loop;
2739 struct loop *next_loop;
2740 struct loop *loop;
2741
2742 num_loops = loops->num;
2743
2744 compute_luids (f, NULL_RTX, 0);
2745
2746 /* If there are jumps to undefined labels,
2747 treat them as jumps out of any/all loops.
2748 This also avoids writing past end of tables when there are no loops. */
2749 uid_loop[0] = NULL;
2750
2751 /* Find boundaries of loops, mark which loops are contained within
2752 loops, and invalidate loops that have setjmp. */
2753
2754 num_loops = 0;
2755 current_loop = NULL;
2756 for (insn = f; insn; insn = NEXT_INSN (insn))
2757 {
2758 if (GET_CODE (insn) == NOTE)
2759 switch (NOTE_LINE_NUMBER (insn))
2760 {
2761 case NOTE_INSN_LOOP_BEG:
2762 next_loop = loops->array + num_loops;
2763 next_loop->num = num_loops;
2764 num_loops++;
2765 next_loop->start = insn;
2766 next_loop->outer = current_loop;
2767 current_loop = next_loop;
2768 break;
2769
2770 case NOTE_INSN_LOOP_CONT:
2771 current_loop->cont = insn;
2772 break;
2773
2774 case NOTE_INSN_LOOP_VTOP:
2775 current_loop->vtop = insn;
2776 break;
2777
2778 case NOTE_INSN_LOOP_END:
2779 if (! current_loop)
2780 abort ();
2781
2782 current_loop->end = insn;
2783 current_loop = current_loop->outer;
2784 break;
2785
2786 default:
2787 break;
2788 }
2789
2790 if (GET_CODE (insn) == CALL_INSN
2791 && find_reg_note (insn, REG_SETJMP, NULL))
2792 {
2793 /* In this case, we must invalidate our current loop and any
2794 enclosing loop. */
2795 for (loop = current_loop; loop; loop = loop->outer)
2796 {
2797 loop->invalid = 1;
2798 if (loop_dump_stream)
2799 fprintf (loop_dump_stream,
2800 "\nLoop at %d ignored due to setjmp.\n",
2801 INSN_UID (loop->start));
2802 }
2803 }
2804
2805 /* Note that this will mark the NOTE_INSN_LOOP_END note as being in the
2806 enclosing loop, but this doesn't matter. */
2807 uid_loop[INSN_UID (insn)] = current_loop;
2808 }
2809
2810 /* Any loop containing a label used in an initializer must be invalidated,
2811 because it can be jumped into from anywhere. */
2812 for (label = forced_labels; label; label = XEXP (label, 1))
2813 invalidate_loops_containing_label (XEXP (label, 0));
2814
2815 /* Any loop containing a label used for an exception handler must be
2816 invalidated, because it can be jumped into from anywhere. */
2817 for_each_eh_label (invalidate_loops_containing_label);
2818
2819 /* Now scan all insn's in the function. If any JUMP_INSN branches into a
2820 loop that it is not contained within, that loop is marked invalid.
2821 If any INSN or CALL_INSN uses a label's address, then the loop containing
2822 that label is marked invalid, because it could be jumped into from
2823 anywhere.
2824
2825 Also look for blocks of code ending in an unconditional branch that
2826 exits the loop. If such a block is surrounded by a conditional
2827 branch around the block, move the block elsewhere (see below) and
2828 invert the jump to point to the code block. This may eliminate a
2829 label in our loop and will simplify processing by both us and a
2830 possible second cse pass. */
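/* Sketched with illustrative labels, that transformation turns

        if (cond) goto L_skip;
        <rarely executed block>
        goto L_exit;            -- leaves the loop
     L_skip:
        ...rest of loop body...

   into

        if (! cond) goto L_block;  -- L_block is now outside the loop
        ...rest of loop body...

   with the block (headed by the new label L_block) reordered next to a
   BARRIER at the same loop depth as the jump's destination, still ending
   in its exit jump, which is deleted later if it merely jumps to the
   following insn.  */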
2831
2832 for (insn = f; insn; insn = NEXT_INSN (insn))
2833 if (INSN_P (insn))
2834 {
2835 struct loop *this_loop = uid_loop[INSN_UID (insn)];
2836
2837 if (GET_CODE (insn) == INSN || GET_CODE (insn) == CALL_INSN)
2838 {
2839 rtx note = find_reg_note (insn, REG_LABEL, NULL_RTX);
2840 if (note)
2841 invalidate_loops_containing_label (XEXP (note, 0));
2842 }
2843
2844 if (GET_CODE (insn) != JUMP_INSN)
2845 continue;
2846
2847 mark_loop_jump (PATTERN (insn), this_loop);
2848
2849 /* See if this is an unconditional branch outside the loop. */
2850 if (this_loop
2851 && (GET_CODE (PATTERN (insn)) == RETURN
2852 || (any_uncondjump_p (insn)
2853 && onlyjump_p (insn)
2854 && (uid_loop[INSN_UID (JUMP_LABEL (insn))]
2855 != this_loop)))
2856 && get_max_uid () < max_uid_for_loop)
2857 {
2858 rtx p;
2859 rtx our_next = next_real_insn (insn);
2860 rtx last_insn_to_move = NEXT_INSN (insn);
2861 struct loop *dest_loop;
2862 struct loop *outer_loop = NULL;
2863
2864 /* Go backwards until we reach the start of the loop, a label,
2865 or a JUMP_INSN. */
2866 for (p = PREV_INSN (insn);
2867 GET_CODE (p) != CODE_LABEL
2868 && ! (GET_CODE (p) == NOTE
2869 && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
2870 && GET_CODE (p) != JUMP_INSN;
2871 p = PREV_INSN (p))
2872 ;
2873
2874 /* Check for the case where we have a jump to an inner nested
2875 loop, and do not perform the optimization in that case. */
2876
2877 if (JUMP_LABEL (insn))
2878 {
2879 dest_loop = uid_loop[INSN_UID (JUMP_LABEL (insn))];
2880 if (dest_loop)
2881 {
2882 for (outer_loop = dest_loop; outer_loop;
2883 outer_loop = outer_loop->outer)
2884 if (outer_loop == this_loop)
2885 break;
2886 }
2887 }
2888
2889 /* Make sure that the target of P is within the current loop. */
2890
2891 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
2892 && uid_loop[INSN_UID (JUMP_LABEL (p))] != this_loop)
2893 outer_loop = this_loop;
2894
2895 /* If we stopped on a JUMP_INSN to the next insn after INSN,
2896 we have a block of code to try to move.
2897
2898 We look backward and then forward from the target of INSN
2899 to find a BARRIER at the same loop depth as the target.
2900 If we find such a BARRIER, we make a new label for the start
2901 of the block, invert the jump in P and point it to that label,
2902 and move the block of code to the spot we found. */
2903
2904 if (! outer_loop
2905 && GET_CODE (p) == JUMP_INSN
2906 && JUMP_LABEL (p) != 0
2907 /* Just ignore jumps to labels that were never emitted.
2908 These always indicate compilation errors. */
2909 && INSN_UID (JUMP_LABEL (p)) != 0
2910 && any_condjump_p (p) && onlyjump_p (p)
2911 && next_real_insn (JUMP_LABEL (p)) == our_next
2912 /* If it's not safe to move the sequence, then we
2913 mustn't try. */
2914 && insns_safe_to_move_p (p, NEXT_INSN (insn),
2915 &last_insn_to_move))
2916 {
2917 rtx target
2918 = JUMP_LABEL (insn) ? JUMP_LABEL (insn) : get_last_insn ();
2919 struct loop *target_loop = uid_loop[INSN_UID (target)];
2920 rtx loc, loc2;
2921 rtx tmp;
2922
2923 /* Search for possible garbage past the conditional jumps
2924 and look for the last barrier. */
2925 for (tmp = last_insn_to_move;
2926 tmp && GET_CODE (tmp) != CODE_LABEL; tmp = NEXT_INSN (tmp))
2927 if (GET_CODE (tmp) == BARRIER)
2928 last_insn_to_move = tmp;
2929
2930 for (loc = target; loc; loc = PREV_INSN (loc))
2931 if (GET_CODE (loc) == BARRIER
2932 /* Don't move things inside a tablejump. */
2933 && ((loc2 = next_nonnote_insn (loc)) == 0
2934 || GET_CODE (loc2) != CODE_LABEL
2935 || (loc2 = next_nonnote_insn (loc2)) == 0
2936 || GET_CODE (loc2) != JUMP_INSN
2937 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2938 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2939 && uid_loop[INSN_UID (loc)] == target_loop)
2940 break;
2941
2942 if (loc == 0)
2943 for (loc = target; loc; loc = NEXT_INSN (loc))
2944 if (GET_CODE (loc) == BARRIER
2945 /* Don't move things inside a tablejump. */
2946 && ((loc2 = next_nonnote_insn (loc)) == 0
2947 || GET_CODE (loc2) != CODE_LABEL
2948 || (loc2 = next_nonnote_insn (loc2)) == 0
2949 || GET_CODE (loc2) != JUMP_INSN
2950 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2951 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2952 && uid_loop[INSN_UID (loc)] == target_loop)
2953 break;
2954
2955 if (loc)
2956 {
2957 rtx cond_label = JUMP_LABEL (p);
2958 rtx new_label = get_label_after (p);
2959
2960 /* Ensure our label doesn't go away. */
2961 LABEL_NUSES (cond_label)++;
2962
2963 /* Verify that uid_loop is large enough and that
2964 we can invert P. */
2965 if (invert_jump (p, new_label, 1))
2966 {
2967 rtx q, r;
2968
2969 /* If no suitable BARRIER was found, create a suitable
2970 one before TARGET. Since TARGET is a fall through
2971 path, we'll need to insert a jump around our block
2972 and add a BARRIER before TARGET.
2973
2974 This creates an extra unconditional jump outside
2975 the loop. However, the benefits of removing rarely
2976 executed instructions from inside the loop usually
2977 outweigh the cost of the extra unconditional jump
2978 outside the loop. */
2979 if (loc == 0)
2980 {
2981 rtx temp;
2982
2983 temp = gen_jump (JUMP_LABEL (insn));
2984 temp = emit_jump_insn_before (temp, target);
2985 JUMP_LABEL (temp) = JUMP_LABEL (insn);
2986 LABEL_NUSES (JUMP_LABEL (insn))++;
2987 loc = emit_barrier_before (target);
2988 }
2989
2990 /* Include the BARRIER after INSN and copy the
2991 block after LOC. */
2992 if (squeeze_notes (&new_label, &last_insn_to_move))
2993 abort ();
2994 reorder_insns (new_label, last_insn_to_move, loc);
2995
2996 /* All those insns are now in TARGET_LOOP. */
2997 for (q = new_label;
2998 q != NEXT_INSN (last_insn_to_move);
2999 q = NEXT_INSN (q))
3000 uid_loop[INSN_UID (q)] = target_loop;
3001
3002 /* The label jumped to by INSN is no longer a loop
3003 exit. Unless INSN does not have a label (e.g.,
3004 it is a RETURN insn), search loop->exit_labels
3005 to find its label_ref, and remove it. Also turn
3006 off LABEL_OUTSIDE_LOOP_P bit. */
3007 if (JUMP_LABEL (insn))
3008 {
3009 for (q = 0, r = this_loop->exit_labels;
3010 r;
3011 q = r, r = LABEL_NEXTREF (r))
3012 if (XEXP (r, 0) == JUMP_LABEL (insn))
3013 {
3014 LABEL_OUTSIDE_LOOP_P (r) = 0;
3015 if (q)
3016 LABEL_NEXTREF (q) = LABEL_NEXTREF (r);
3017 else
3018 this_loop->exit_labels = LABEL_NEXTREF (r);
3019 break;
3020 }
3021
3022 for (loop = this_loop; loop && loop != target_loop;
3023 loop = loop->outer)
3024 loop->exit_count--;
3025
3026 /* If we didn't find it, then something is
3027 wrong. */
3028 if (! r)
3029 abort ();
3030 }
3031
3032 /* P is now a jump outside the loop, so it must be put
3033 in loop->exit_labels, and marked as such.
3034 The easiest way to do this is to just call
3035 mark_loop_jump again for P. */
3036 mark_loop_jump (PATTERN (p), this_loop);
3037
3038 /* If INSN now jumps to the insn after it,
3039 delete INSN. */
3040 if (JUMP_LABEL (insn) != 0
3041 && (next_real_insn (JUMP_LABEL (insn))
3042 == next_real_insn (insn)))
3043 delete_related_insns (insn);
3044 }
3045
3046 /* Continue the loop after where the conditional
3047 branch used to jump, since the only branch insn
3048 in the block (if it still remains) is an inter-loop
3049 branch and hence needs no processing. */
3050 insn = NEXT_INSN (cond_label);
3051
3052 if (--LABEL_NUSES (cond_label) == 0)
3053 delete_related_insns (cond_label);
3054
3055 /* This loop will be continued with NEXT_INSN (insn). */
3056 insn = PREV_INSN (insn);
3057 }
3058 }
3059 }
3060 }
3061 }
3062
3063 /* If any label in X jumps to a loop different from LOOP and any of the
3064 loops it is contained in, mark the target loop invalid.
3065
3066 For speed, we assume that X is part of a pattern of a JUMP_INSN. */
3067
3068 static void
3069 mark_loop_jump (rtx x, struct loop *loop)
3070 {
3071 struct loop *dest_loop;
3072 struct loop *outer_loop;
3073 int i;
3074
3075 switch (GET_CODE (x))
3076 {
3077 case PC:
3078 case USE:
3079 case CLOBBER:
3080 case REG:
3081 case MEM:
3082 case CONST_INT:
3083 case CONST_DOUBLE:
3084 case RETURN:
3085 return;
3086
3087 case CONST:
3088 /* There could be a label reference in here. */
3089 mark_loop_jump (XEXP (x, 0), loop);
3090 return;
3091
3092 case PLUS:
3093 case MINUS:
3094 case MULT:
3095 mark_loop_jump (XEXP (x, 0), loop);
3096 mark_loop_jump (XEXP (x, 1), loop);
3097 return;
3098
3099 case LO_SUM:
3100 /* This may refer to a LABEL_REF or SYMBOL_REF. */
3101 mark_loop_jump (XEXP (x, 1), loop);
3102 return;
3103
3104 case SIGN_EXTEND:
3105 case ZERO_EXTEND:
3106 mark_loop_jump (XEXP (x, 0), loop);
3107 return;
3108
3109 case LABEL_REF:
3110 dest_loop = uid_loop[INSN_UID (XEXP (x, 0))];
3111
3112 /* Link together all labels that branch outside the loop. This
3113 is used by final_[bg]iv_value and the loop unrolling code. Also
3114 mark this LABEL_REF so we know that this branch should predict
3115 false. */
3116
3117 /* A check to make sure the label is not in an inner nested loop,
3118 since this does not count as a loop exit. */
3119 if (dest_loop)
3120 {
3121 for (outer_loop = dest_loop; outer_loop;
3122 outer_loop = outer_loop->outer)
3123 if (outer_loop == loop)
3124 break;
3125 }
3126 else
3127 outer_loop = NULL;
3128
3129 if (loop && ! outer_loop)
3130 {
3131 LABEL_OUTSIDE_LOOP_P (x) = 1;
3132 LABEL_NEXTREF (x) = loop->exit_labels;
3133 loop->exit_labels = x;
3134
3135 for (outer_loop = loop;
3136 outer_loop && outer_loop != dest_loop;
3137 outer_loop = outer_loop->outer)
3138 outer_loop->exit_count++;
3139 }
3140
3141 /* If this is inside a loop, but not in the current loop or one enclosed
3142 by it, it invalidates at least one loop. */
3143
3144 if (! dest_loop)
3145 return;
3146
3147 /* We must invalidate every nested loop containing the target of this
3148 label, except those that also contain the jump insn. */
3149
3150 for (; dest_loop; dest_loop = dest_loop->outer)
3151 {
3152 /* Stop when we reach a loop that also contains the jump insn. */
3153 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3154 if (dest_loop == outer_loop)
3155 return;
3156
3157 /* If we get here, we know we need to invalidate a loop. */
3158 if (loop_dump_stream && ! dest_loop->invalid)
3159 fprintf (loop_dump_stream,
3160 "\nLoop at %d ignored due to multiple entry points.\n",
3161 INSN_UID (dest_loop->start));
3162
3163 dest_loop->invalid = 1;
3164 }
3165 return;
3166
3167 case SET:
3168 /* If this is not setting pc, ignore. */
3169 if (SET_DEST (x) == pc_rtx)
3170 mark_loop_jump (SET_SRC (x), loop);
3171 return;
3172
3173 case IF_THEN_ELSE:
3174 mark_loop_jump (XEXP (x, 1), loop);
3175 mark_loop_jump (XEXP (x, 2), loop);
3176 return;
3177
3178 case PARALLEL:
3179 case ADDR_VEC:
3180 for (i = 0; i < XVECLEN (x, 0); i++)
3181 mark_loop_jump (XVECEXP (x, 0, i), loop);
3182 return;
3183
3184 case ADDR_DIFF_VEC:
3185 for (i = 0; i < XVECLEN (x, 1); i++)
3186 mark_loop_jump (XVECEXP (x, 1, i), loop);
3187 return;
3188
3189 default:
3190 /* Strictly speaking this is not a jump into the loop, only a possible
3191 jump out of the loop. However, we have no way to link the destination
3192 of this jump onto the list of exit labels. To be safe we mark this
3193 loop and any containing loops as invalid. */
3194 if (loop)
3195 {
3196 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3197 {
3198 if (loop_dump_stream && ! outer_loop->invalid)
3199 fprintf (loop_dump_stream,
3200 "\nLoop at %d ignored due to unknown exit jump.\n",
3201 INSN_UID (outer_loop->start));
3202 outer_loop->invalid = 1;
3203 }
3204 }
3205 return;
3206 }
3207 }
3208 \f
3209 /* Return nonzero if there is a label in the range from
3210 insn INSN to and including the insn whose luid is END.
3211 INSN must have an assigned luid (i.e., it must not have
3212 been previously created by loop.c). */
3213
3214 static int
3215 labels_in_range_p (rtx insn, int end)
3216 {
3217 while (insn && INSN_LUID (insn) <= end)
3218 {
3219 if (GET_CODE (insn) == CODE_LABEL)
3220 return 1;
3221 insn = NEXT_INSN (insn);
3222 }
3223
3224 return 0;
3225 }
3226
3227 /* Record that a memory reference X is being set. */
3228
3229 static void
3230 note_addr_stored (rtx x, rtx y ATTRIBUTE_UNUSED,
3231 void *data ATTRIBUTE_UNUSED)
3232 {
3233 struct loop_info *loop_info = data;
3234
3235 if (x == 0 || GET_CODE (x) != MEM)
3236 return;
3237
3238 /* Count number of memory writes.
3239 This affects heuristics in strength_reduce. */
3240 loop_info->num_mem_sets++;
3241
3242 /* BLKmode MEM means all memory is clobbered. */
3243 if (GET_MODE (x) == BLKmode)
3244 {
3245 if (RTX_UNCHANGING_P (x))
3246 loop_info->unknown_constant_address_altered = 1;
3247 else
3248 loop_info->unknown_address_altered = 1;
3249
3250 return;
3251 }
3252
3253 loop_info->store_mems = gen_rtx_EXPR_LIST (VOIDmode, x,
3254 loop_info->store_mems);
3255 }
3256
3257 /* X is a value modified by an INSN that references a biv inside a loop
3258 exit test (i.e., X is somehow related to the value of the biv). If X
3259 is a pseudo that is used more than once, then the biv is (effectively)
3260 used more than once. DATA is a pointer to a loop_regs structure. */
3261
3262 static void
3263 note_set_pseudo_multiple_uses (rtx x, rtx y ATTRIBUTE_UNUSED, void *data)
3264 {
3265 struct loop_regs *regs = (struct loop_regs *) data;
3266
3267 if (x == 0)
3268 return;
3269
3270 while (GET_CODE (x) == STRICT_LOW_PART
3271 || GET_CODE (x) == SIGN_EXTRACT
3272 || GET_CODE (x) == ZERO_EXTRACT
3273 || GET_CODE (x) == SUBREG)
3274 x = XEXP (x, 0);
3275
3276 if (GET_CODE (x) != REG || REGNO (x) < FIRST_PSEUDO_REGISTER)
3277 return;
3278
3279 /* If we do not have usage information, or if we know the register
3280 is used more than once, note that fact for check_dbra_loop. */
3281 if (REGNO (x) >= max_reg_before_loop
3282 || ! regs->array[REGNO (x)].single_usage
3283 || regs->array[REGNO (x)].single_usage == const0_rtx)
3284 regs->multiple_uses = 1;
3285 }
3286 \f
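/* Illustrative only (hypothetical source): in the loop below neither `n'
   nor `scale' is written inside the loop, so RTL built from them is
   invariant and loop_invariant_p returns 1 for it, whereas anything
   mentioning `i' or the memory written through `out' is not invariant.  */
#if 0
static void
invariant_example (int *out, int n, int scale)
{
  int i;

  for (i = 0; i < n; i++)
    out[i] = n * scale;         /* `n * scale' is loop-invariant */
}
#endif
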
3287 /* Return nonzero if the rtx X is invariant over the current loop.
3288
3289 The value is 2 if we refer to something only conditionally invariant.
3290
3291 A memory ref is invariant if it is not volatile and does not conflict
3292 with anything stored in `loop_info->store_mems'. */
3293
3294 int
3295 loop_invariant_p (const struct loop *loop, rtx x)
3296 {
3297 struct loop_info *loop_info = LOOP_INFO (loop);
3298 struct loop_regs *regs = LOOP_REGS (loop);
3299 int i;
3300 enum rtx_code code;
3301 const char *fmt;
3302 int conditional = 0;
3303 rtx mem_list_entry;
3304
3305 if (x == 0)
3306 return 1;
3307 code = GET_CODE (x);
3308 switch (code)
3309 {
3310 case CONST_INT:
3311 case CONST_DOUBLE:
3312 case SYMBOL_REF:
3313 case CONST:
3314 return 1;
3315
3316 case LABEL_REF:
3317 /* A LABEL_REF is normally invariant, however, if we are unrolling
3318 loops, and this label is inside the loop, then it isn't invariant.
3319 This is because each unrolled copy of the loop body will have
3320 a copy of this label. If this was invariant, then an insn loading
3321 the address of this label into a register might get moved outside
3322 the loop, and then each loop body would end up using the same label.
3323
3324 We don't know the loop bounds here though, so just fail for all
3325 labels. */
3326 if (flag_old_unroll_loops)
3327 return 0;
3328 else
3329 return 1;
3330
3331 case PC:
3332 case CC0:
3333 case UNSPEC_VOLATILE:
3334 return 0;
3335
3336 case REG:
3337 /* We used to check RTX_UNCHANGING_P (x) here, but that is invalid
3338 since the reg might be set by initialization within the loop. */
3339
3340 if ((x == frame_pointer_rtx || x == hard_frame_pointer_rtx
3341 || x == arg_pointer_rtx || x == pic_offset_table_rtx)
3342 && ! current_function_has_nonlocal_goto)
3343 return 1;
3344
3345 if (LOOP_INFO (loop)->has_call
3346 && REGNO (x) < FIRST_PSEUDO_REGISTER && call_used_regs[REGNO (x)])
3347 return 0;
3348
3349 /* Out-of-range regs can occur when we are called from unrolling.
3350 These registers created by the unroller are set in the loop,
3351 hence are never invariant.
3352 Other out-of-range regs can be generated by load_mems; those that
3353 are written to in the loop are not invariant, while those that are
3354 not written to are invariant. It would be easy for load_mems
3355 to set n_times_set correctly for these registers; however, there
3356 is no easy way to distinguish them from registers created by the
3357 unroller. */
3358
3359 if (REGNO (x) >= (unsigned) regs->num)
3360 return 0;
3361
3362 if (regs->array[REGNO (x)].set_in_loop < 0)
3363 return 2;
3364
3365 return regs->array[REGNO (x)].set_in_loop == 0;
3366
3367 case MEM:
3368 /* Volatile memory references must be rejected. Do this before
3369 checking for read-only items, so that volatile read-only items
3370 will be rejected also. */
3371 if (MEM_VOLATILE_P (x))
3372 return 0;
3373
3374 /* See if there is any dependence between a store and this load. */
3375 mem_list_entry = loop_info->store_mems;
3376 while (mem_list_entry)
3377 {
3378 if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
3379 x, rtx_varies_p))
3380 return 0;
3381
3382 mem_list_entry = XEXP (mem_list_entry, 1);
3383 }
3384
3385 /* It's not invalidated by a store in memory
3386 but we must still verify the address is invariant. */
3387 break;
3388
3389 case ASM_OPERANDS:
3390 /* Don't mess with insns declared volatile. */
3391 if (MEM_VOLATILE_P (x))
3392 return 0;
3393 break;
3394
3395 default:
3396 break;
3397 }
3398
3399 fmt = GET_RTX_FORMAT (code);
3400 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3401 {
3402 if (fmt[i] == 'e')
3403 {
3404 int tem = loop_invariant_p (loop, XEXP (x, i));
3405 if (tem == 0)
3406 return 0;
3407 if (tem == 2)
3408 conditional = 1;
3409 }
3410 else if (fmt[i] == 'E')
3411 {
3412 int j;
3413 for (j = 0; j < XVECLEN (x, i); j++)
3414 {
3415 int tem = loop_invariant_p (loop, XVECEXP (x, i, j));
3416 if (tem == 0)
3417 return 0;
3418 if (tem == 2)
3419 conditional = 1;
3420 }
3421
3422 }
3423 }
3424
3425 return 1 + conditional;
3426 }
3427 \f
3428 /* Return nonzero if all the insns in the loop that set REG
3429 are INSN and the immediately following insns,
3430 and if each of those insns sets REG in an invariant way
3431 (not counting uses of REG in them).
3432
3433 The value is 2 if some of these insns are only conditionally invariant.
3434
3435 We assume that INSN itself is the first set of REG
3436 and that its source is invariant. */
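/* For instance (hypothetical rtl): (set (reg 100) (high:SI (symbol_ref "x")))
   immediately followed by (set (reg 100) (lo_sum:SI (reg 100)
   (symbol_ref "x"))) -- both sets are invariant once uses of reg 100
   itself are discounted, so the pair can be moved as a unit.  */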
3437
3438 static int
3439 consec_sets_invariant_p (const struct loop *loop, rtx reg, int n_sets,
3440 rtx insn)
3441 {
3442 struct loop_regs *regs = LOOP_REGS (loop);
3443 rtx p = insn;
3444 unsigned int regno = REGNO (reg);
3445 rtx temp;
3446 /* Number of sets we have to insist on finding after INSN. */
3447 int count = n_sets - 1;
3448 int old = regs->array[regno].set_in_loop;
3449 int value = 0;
3450 int this;
3451
3452 /* If N_SETS hit the limit, we can't rely on its value. */
3453 if (n_sets == 127)
3454 return 0;
3455
3456 regs->array[regno].set_in_loop = 0;
3457
3458 while (count > 0)
3459 {
3460 enum rtx_code code;
3461 rtx set;
3462
3463 p = NEXT_INSN (p);
3464 code = GET_CODE (p);
3465
3466 /* If library call, skip to end of it. */
3467 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
3468 p = XEXP (temp, 0);
3469
3470 this = 0;
3471 if (code == INSN
3472 && (set = single_set (p))
3473 && GET_CODE (SET_DEST (set)) == REG
3474 && REGNO (SET_DEST (set)) == regno)
3475 {
3476 this = loop_invariant_p (loop, SET_SRC (set));
3477 if (this != 0)
3478 value |= this;
3479 else if ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX)))
3480 {
3481 /* If this is a libcall, then any invariant REG_EQUAL note is OK.
3482 If this is an ordinary insn, then only CONSTANT_P REG_EQUAL
3483 notes are OK. */
3484 this = (CONSTANT_P (XEXP (temp, 0))
3485 || (find_reg_note (p, REG_RETVAL, NULL_RTX)
3486 && loop_invariant_p (loop, XEXP (temp, 0))));
3487 if (this != 0)
3488 value |= this;
3489 }
3490 }
3491 if (this != 0)
3492 count--;
3493 else if (code != NOTE)
3494 {
3495 regs->array[regno].set_in_loop = old;
3496 return 0;
3497 }
3498 }
3499
3500 regs->array[regno].set_in_loop = old;
3501 /* If loop_invariant_p ever returned 2, we return 2. */
3502 return 1 + (value & 2);
3503 }
3504 \f
3505 /* Look at all uses (not sets) of registers in X. For each, if it is
3506 the single use, set USAGE[REGNO] to INSN; if there was a previous use in
3507 a different insn, set USAGE[REGNO] to const0_rtx. */
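/* Editorial illustration (register and insn numbers are made up): if
   reg 105 is used only in insn 42, its single_usage ends up as insn 42;
   a later use in a different insn, say insn 57, collapses it to
   const0_rtx, marking the register as used in more than one insn.  */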
3508
3509 static void
3510 find_single_use_in_loop (struct loop_regs *regs, rtx insn, rtx x)
3511 {
3512 enum rtx_code code = GET_CODE (x);
3513 const char *fmt = GET_RTX_FORMAT (code);
3514 int i, j;
3515
3516 if (code == REG)
3517 regs->array[REGNO (x)].single_usage
3518 = (regs->array[REGNO (x)].single_usage != 0
3519 && regs->array[REGNO (x)].single_usage != insn)
3520 ? const0_rtx : insn;
3521
3522 else if (code == SET)
3523 {
3524 /* Don't count SET_DEST if it is a REG; otherwise count things
3525 in SET_DEST because if a register is partially modified, it won't
3526 show up as a potential movable so we don't care how USAGE is set
3527 for it. */
3528 if (GET_CODE (SET_DEST (x)) != REG)
3529 find_single_use_in_loop (regs, insn, SET_DEST (x));
3530 find_single_use_in_loop (regs, insn, SET_SRC (x));
3531 }
3532 else
3533 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3534 {
3535 if (fmt[i] == 'e' && XEXP (x, i) != 0)
3536 find_single_use_in_loop (regs, insn, XEXP (x, i));
3537 else if (fmt[i] == 'E')
3538 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
3539 find_single_use_in_loop (regs, insn, XVECEXP (x, i, j));
3540 }
3541 }
3542 \f
3543 /* Count and record any set in X which is contained in INSN. Update
3544 REGS->array[I].MAY_NOT_OPTIMIZE and LAST_SET for any register I set
3545 in X. */
3546
3547 static void
3548 count_one_set (struct loop_regs *regs, rtx insn, rtx x, rtx *last_set)
3549 {
3550 if (GET_CODE (x) == CLOBBER && GET_CODE (XEXP (x, 0)) == REG)
3551 /* Don't move a reg that has an explicit clobber.
3552 It's not worth the pain to try to do it correctly. */
3553 regs->array[REGNO (XEXP (x, 0))].may_not_optimize = 1;
3554
3555 if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
3556 {
3557 rtx dest = SET_DEST (x);
3558 while (GET_CODE (dest) == SUBREG
3559 || GET_CODE (dest) == ZERO_EXTRACT
3560 || GET_CODE (dest) == SIGN_EXTRACT
3561 || GET_CODE (dest) == STRICT_LOW_PART)
3562 dest = XEXP (dest, 0);
3563 if (GET_CODE (dest) == REG)
3564 {
3565 int i;
3566 int regno = REGNO (dest);
3567 for (i = 0; i < LOOP_REGNO_NREGS (regno, dest); i++)
3568 {
3569 /* If this is the first setting of this reg
3570 in current basic block, and it was set before,
3571 it must be set in two basic blocks, so it cannot
3572 be moved out of the loop. */
3573 if (regs->array[regno].set_in_loop > 0
3574 && last_set[regno] == 0)
3575 regs->array[regno+i].may_not_optimize = 1;
3576 /* If this is not first setting in current basic block,
3577 see if reg was used in between previous one and this.
3578 If so, neither one can be moved. */
3579 if (last_set[regno] != 0
3580 && reg_used_between_p (dest, last_set[regno], insn))
3581 regs->array[regno+i].may_not_optimize = 1;
3582 if (regs->array[regno+i].set_in_loop < 127)
3583 ++regs->array[regno+i].set_in_loop;
3584 last_set[regno+i] = insn;
3585 }
3586 }
3587 }
3588 }
3589 \f
3590 /* Given a loop that is bounded by LOOP->START and LOOP->END and that
3591 is entered at LOOP->SCAN_START, return 1 if the register set in SET
3592 contained in insn INSN is used by any insn that precedes INSN in
3593 cyclic order starting from the loop entry point.
3594
3595 We don't want to use INSN_LUID here because if we restrict INSN to those
3596 that have a valid INSN_LUID, it means we cannot move an invariant out
3597 from an inner loop past two loops. */
3598
3599 static int
3600 loop_reg_used_before_p (const struct loop *loop, rtx set, rtx insn)
3601 {
3602 rtx reg = SET_DEST (set);
3603 rtx p;
3604
3605 /* Scan forward checking for register usage. If we hit INSN, we
3606 are done. Otherwise, if we hit LOOP->END, wrap around to LOOP->START. */
3607 for (p = loop->scan_start; p != insn; p = NEXT_INSN (p))
3608 {
3609 if (INSN_P (p) && reg_overlap_mentioned_p (reg, PATTERN (p)))
3610 return 1;
3611
3612 if (p == loop->end)
3613 p = loop->start;
3614 }
3615
3616 return 0;
3617 }
3618 \f
3619
3620 /* Information we collect about arrays that we might want to prefetch. */
3621 struct prefetch_info
3622 {
3623 struct iv_class *class; /* Class this prefetch is based on. */
3624 struct induction *giv; /* GIV this prefetch is based on. */
3625 rtx base_address; /* Start prefetching from this address plus
3626 index. */
3627 HOST_WIDE_INT index;
3628 HOST_WIDE_INT stride; /* Prefetch stride in bytes in each
3629 iteration. */
3630 unsigned int bytes_accessed; /* Sum of sizes of all accesses to this
3631 prefetch area in one iteration. */
3632 unsigned int total_bytes; /* Total bytes loop will access in this block.
3633 This is set only for loops with known
3634 iteration counts and is 0xffffffff
3635 otherwise. */
3636 int prefetch_in_loop; /* Number of prefetch insns in loop. */
3637 int prefetch_before_loop; /* Number of prefetch insns before loop. */
3638 unsigned int write : 1; /* 1 for read/write prefetches. */
3639 };
3640
3641 /* Data used by check_store function. */
3642 struct check_store_data
3643 {
3644 rtx mem_address;
3645 int mem_write;
3646 };
3647
3648 static void check_store (rtx, rtx, void *);
3649 static void emit_prefetch_instructions (struct loop *);
3650 static int rtx_equal_for_prefetch_p (rtx, rtx);
3651
3652 /* Set mem_write when mem_address is found. Used as callback to
3653 note_stores. */
3654 static void
3655 check_store (rtx x, rtx pat ATTRIBUTE_UNUSED, void *data)
3656 {
3657 struct check_store_data *d = (struct check_store_data *) data;
3658
3659 if ((GET_CODE (x) == MEM) && rtx_equal_p (d->mem_address, XEXP (x, 0)))
3660 d->mem_write = 1;
3661 }
3662 \f
3663 /* Like rtx_equal_p, but attempts to swap commutative operands. This is
3664 important to get some addresses combined. Later more sophisticated
3665 transformations can be added when necessary.
3666
3667 ??? The same trick of swapping operands is done in several other places.
3668 It would be nice to develop a common way to handle this. */
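/* Illustrative note (editorial sketch, register numbers made up): with
   this relaxed comparison, the addresses (plus (reg 100) (reg 101)) and
   (plus (reg 101) (reg 100)) compare equal, so two givs that differ only
   in operand order can still be merged into one prefetch stream.  */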
3669
3670 static int
3671 rtx_equal_for_prefetch_p (rtx x, rtx y)
3672 {
3673 int i;
3674 int j;
3675 enum rtx_code code = GET_CODE (x);
3676 const char *fmt;
3677
3678 if (x == y)
3679 return 1;
3680 if (code != GET_CODE (y))
3681 return 0;
3682
3683 if (COMMUTATIVE_ARITH_P (x))
3684 {
3685 return ((rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 0))
3686 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 1)))
3687 || (rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 1))
3688 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 0))));
3689 }
3690
3691 /* Compare the elements. If any pair of corresponding elements fails to
3692 match, return 0 for the whole thing. */
3693
3694 fmt = GET_RTX_FORMAT (code);
3695 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3696 {
3697 switch (fmt[i])
3698 {
3699 case 'w':
3700 if (XWINT (x, i) != XWINT (y, i))
3701 return 0;
3702 break;
3703
3704 case 'i':
3705 if (XINT (x, i) != XINT (y, i))
3706 return 0;
3707 break;
3708
3709 case 'E':
3710 /* Two vectors must have the same length. */
3711 if (XVECLEN (x, i) != XVECLEN (y, i))
3712 return 0;
3713
3714 /* And the corresponding elements must match. */
3715 for (j = 0; j < XVECLEN (x, i); j++)
3716 if (rtx_equal_for_prefetch_p (XVECEXP (x, i, j),
3717 XVECEXP (y, i, j)) == 0)
3718 return 0;
3719 break;
3720
3721 case 'e':
3722 if (rtx_equal_for_prefetch_p (XEXP (x, i), XEXP (y, i)) == 0)
3723 return 0;
3724 break;
3725
3726 case 's':
3727 if (strcmp (XSTR (x, i), XSTR (y, i)))
3728 return 0;
3729 break;
3730
3731 case 'u':
3732 /* These are just backpointers, so they don't matter. */
3733 break;
3734
3735 case '0':
3736 break;
3737
3738 /* It is believed that rtx's at this level will never
3739 contain anything but integers and other rtx's,
3740 except for within LABEL_REFs and SYMBOL_REFs. */
3741 default:
3742 abort ();
3743 }
3744 }
3745 return 1;
3746 }
3747 \f
3748 /* Remove constant addition value from the expression X (when present)
3749 and return it. */
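/* For example (editorial illustration, register number made up): given
   *X == (plus (reg 100) (const_int 12)), the value 12 is returned and *X
   is rewritten to (reg 100); given a bare (const_int 8), 8 is returned
   and *X becomes const0_rtx.  */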
3750
3751 static HOST_WIDE_INT
3752 remove_constant_addition (rtx *x)
3753 {
3754 HOST_WIDE_INT addval = 0;
3755 rtx exp = *x;
3756
3757 /* Avoid clobbering a shared CONST expression. */
3758 if (GET_CODE (exp) == CONST)
3759 {
3760 if (GET_CODE (XEXP (exp, 0)) == PLUS
3761 && GET_CODE (XEXP (XEXP (exp, 0), 0)) == SYMBOL_REF
3762 && GET_CODE (XEXP (XEXP (exp, 0), 1)) == CONST_INT)
3763 {
3764 *x = XEXP (XEXP (exp, 0), 0);
3765 return INTVAL (XEXP (XEXP (exp, 0), 1));
3766 }
3767 return 0;
3768 }
3769
3770 if (GET_CODE (exp) == CONST_INT)
3771 {
3772 addval = INTVAL (exp);
3773 *x = const0_rtx;
3774 }
3775
3776 /* For a PLUS expression, recurse on both operands. */
3777 else if (GET_CODE (exp) == PLUS)
3778 {
3779 addval += remove_constant_addition (&XEXP (exp, 0));
3780 addval += remove_constant_addition (&XEXP (exp, 1));
3781
3782 /* If either operand turned out to be constant, remove the resulting
3783 extra zero from the expression. */
3784 if (XEXP (exp, 0) == const0_rtx)
3785 *x = XEXP (exp, 1);
3786 else if (XEXP (exp, 1) == const0_rtx)
3787 *x = XEXP (exp, 0);
3788 }
3789
3790 return addval;
3791 }
3792
3793 /* Attempt to identify accesses to arrays that are most likely to cause cache
3794 misses, and emit prefetch instructions a few prefetch blocks forward.
3795
3796 To detect the arrays we use the GIV information that was collected by the
3797 strength reduction pass.
3798
3799 The prefetch instructions are generated after the GIV information is done
3800 and before the strength reduction process. The new GIVs are injected into
3801 the strength reduction tables, so the prefetch addresses are optimized as
3802 well.
3803
3804 GIVs are split into base address, stride, and constant addition values.
3805 GIVs with the same address, stride and close addition values are combined
3806 into a single prefetch. Also writes to GIVs are detected, so that prefetch
3807 for write instructions can be used for the block we write to, on machines
3808 that support write prefetches.
3809
3810 Several heuristics are used to determine when to prefetch. They are
3811 controlled by defined symbols that can be overridden for each target. */
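/* As a worked illustration (editorial sketch, values made up): in a
   source loop such as

       for (i = 0; i < n; i++)
         sum += p[i].x + p[i].y;

   where each element of p is 16 bytes, the two DEST_ADDR givs share the
   base address `p' and a stride of 16 bytes per iteration, differing
   only in their constant addition values (0 and, say, 8); they are
   therefore merged into a single prefetch stream below.  */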
3812
3813 static void
3814 emit_prefetch_instructions (struct loop *loop)
3815 {
3816 int num_prefetches = 0;
3817 int num_real_prefetches = 0;
3818 int num_real_write_prefetches = 0;
3819 int num_prefetches_before = 0;
3820 int num_write_prefetches_before = 0;
3821 int ahead = 0;
3822 int i;
3823 struct iv_class *bl;
3824 struct induction *iv;
3825 struct prefetch_info info[MAX_PREFETCHES];
3826 struct loop_ivs *ivs = LOOP_IVS (loop);
3827
3828 if (!HAVE_prefetch)
3829 return;
3830
3831 /* Consider only loops without calls. When a call is present, the loop is
3832 probably slow enough that there is time to read the memory anyway. */
3833 if (PREFETCH_NO_CALL && LOOP_INFO (loop)->has_call)
3834 {
3835 if (loop_dump_stream)
3836 fprintf (loop_dump_stream, "Prefetch: ignoring loop: has call.\n");
3837
3838 return;
3839 }
3840
3841 /* Don't prefetch in loops known to have few iterations. */
3842 if (PREFETCH_NO_LOW_LOOPCNT
3843 && LOOP_INFO (loop)->n_iterations
3844 && LOOP_INFO (loop)->n_iterations <= PREFETCH_LOW_LOOPCNT)
3845 {
3846 if (loop_dump_stream)
3847 fprintf (loop_dump_stream,
3848 "Prefetch: ignoring loop: not enough iterations.\n");
3849 return;
3850 }
3851
3852 /* Search all induction variables and pick those interesting for the prefetch
3853 machinery. */
3854 for (bl = ivs->list; bl; bl = bl->next)
3855 {
3856 struct induction *biv = bl->biv, *biv1;
3857 int basestride = 0;
3858
3859 biv1 = biv;
3860
3861 /* Expect all BIVs to be executed in each iteration. This makes our
3862 analysis more conservative. */
3863 while (biv1)
3864 {
3865 /* Discard non-constant additions that we can't handle well yet, and
3866 BIVs that are executed multiple times; such BIVs ought to be
3867 handled in the nested loop. We accept not_every_iteration BIVs,
3868 since these only result in larger strides and make our
3869 heuristics more conservative. */
3870 if (GET_CODE (biv->add_val) != CONST_INT)
3871 {
3872 if (loop_dump_stream)
3873 {
3874 fprintf (loop_dump_stream,
3875 "Prefetch: ignoring biv %d: non-constant addition at insn %d:",
3876 REGNO (biv->src_reg), INSN_UID (biv->insn));
3877 print_rtl (loop_dump_stream, biv->add_val);
3878 fprintf (loop_dump_stream, "\n");
3879 }
3880 break;
3881 }
3882
3883 if (biv->maybe_multiple)
3884 {
3885 if (loop_dump_stream)
3886 {
3887 fprintf (loop_dump_stream,
3888 "Prefetch: ignoring biv %d: maybe_multiple at insn %i:",
3889 REGNO (biv->src_reg), INSN_UID (biv->insn));
3890 print_rtl (loop_dump_stream, biv->add_val);
3891 fprintf (loop_dump_stream, "\n");
3892 }
3893 break;
3894 }
3895
3896 basestride += INTVAL (biv1->add_val);
3897 biv1 = biv1->next_iv;
3898 }
3899
3900 if (biv1 || !basestride)
3901 continue;
3902
3903 for (iv = bl->giv; iv; iv = iv->next_iv)
3904 {
3905 rtx address;
3906 rtx temp;
3907 HOST_WIDE_INT index = 0;
3908 int add = 1;
3909 HOST_WIDE_INT stride = 0;
3910 int stride_sign = 1;
3911 struct check_store_data d;
3912 const char *ignore_reason = NULL;
3913 int size = GET_MODE_SIZE (GET_MODE (iv));
3914
3915 /* See whether an induction variable is interesting to us and if
3916 not, report the reason. */
3917 if (iv->giv_type != DEST_ADDR)
3918 ignore_reason = "giv is not a destination address";
3919
3920 /* We are interested only in constant stride memory references
3921 in order to be able to compute density easily. */
3922 else if (GET_CODE (iv->mult_val) != CONST_INT)
3923 ignore_reason = "stride is not constant";
3924
3925 else
3926 {
3927 stride = INTVAL (iv->mult_val) * basestride;
3928 if (stride < 0)
3929 {
3930 stride = -stride;
3931 stride_sign = -1;
3932 }
3933
3934 /* On some targets, reversed order prefetches are not
3935 worthwhile. */
3936 if (PREFETCH_NO_REVERSE_ORDER && stride_sign < 0)
3937 ignore_reason = "reversed order stride";
3938
3939 /* Prefetch of accesses with an extreme stride might not be
3940 worthwhile, either. */
3941 else if (PREFETCH_NO_EXTREME_STRIDE
3942 && stride > PREFETCH_EXTREME_STRIDE)
3943 ignore_reason = "extreme stride";
3944
3945 /* Ignore GIVs with varying add values; we can't predict the
3946 value for the next iteration. */
3947 else if (!loop_invariant_p (loop, iv->add_val))
3948 ignore_reason = "giv has varying add value";
3949
3950 /* Ignore GIVs in nested loops; they ought to have been
3951 handled already. */
3952 else if (iv->maybe_multiple)
3953 ignore_reason = "giv is in nested loop";
3954 }
3955
3956 if (ignore_reason != NULL)
3957 {
3958 if (loop_dump_stream)
3959 fprintf (loop_dump_stream,
3960 "Prefetch: ignoring giv at %d: %s.\n",
3961 INSN_UID (iv->insn), ignore_reason);
3962 continue;
3963 }
3964
3965 /* Determine the pointer to the basic array we are examining. It is
3966 the sum of the BIV's initial value and the GIV's add_val. */
3967 address = copy_rtx (iv->add_val);
3968 temp = copy_rtx (bl->initial_value);
3969
3970 address = simplify_gen_binary (PLUS, Pmode, temp, address);
3971 index = remove_constant_addition (&address);
3972
3973 d.mem_write = 0;
3974 d.mem_address = *iv->location;
3975
3976 /* When the GIV is not always executed, we might be better off by
3977 not dirtying the cache pages. */
3978 if (PREFETCH_CONDITIONAL || iv->always_executed)
3979 note_stores (PATTERN (iv->insn), check_store, &d);
3980 else
3981 {
3982 if (loop_dump_stream)
3983 fprintf (loop_dump_stream, "Prefetch: Ignoring giv at %d: %s\n",
3984 INSN_UID (iv->insn), "in conditional code.");
3985 continue;
3986 }
3987
3988 /* Attempt to find another prefetch to the same array and see if we
3989 can merge this one. */
3990 for (i = 0; i < num_prefetches; i++)
3991 if (rtx_equal_for_prefetch_p (address, info[i].base_address)
3992 && stride == info[i].stride)
3993 {
3994 /* If both access the same array (the same location, differing
3995 only by a small constant index), merge the prefetches. Just do
3996 the later one, and the earlier one will get prefetched by the
3997 previous iteration.
3998 The artificial threshold should not be too small, but also not
3999 bigger than the small portion of memory usually traversed by a
4000 single loop. */
4001 if (index >= info[i].index
4002 && index - info[i].index < PREFETCH_EXTREME_DIFFERENCE)
4003 {
4004 info[i].write |= d.mem_write;
4005 info[i].bytes_accessed += size;
4006 info[i].index = index;
4007 info[i].giv = iv;
4008 info[i].class = bl;
4009 info[num_prefetches].base_address = address;
4010 add = 0;
4011 break;
4012 }
4013
4014 if (index < info[i].index
4015 && info[i].index - index < PREFETCH_EXTREME_DIFFERENCE)
4016 {
4017 info[i].write |= d.mem_write;
4018 info[i].bytes_accessed += size;
4019 add = 0;
4020 break;
4021 }
4022 }
4023
4024 /* Merging failed. */
4025 if (add)
4026 {
4027 info[num_prefetches].giv = iv;
4028 info[num_prefetches].class = bl;
4029 info[num_prefetches].index = index;
4030 info[num_prefetches].stride = stride;
4031 info[num_prefetches].base_address = address;
4032 info[num_prefetches].write = d.mem_write;
4033 info[num_prefetches].bytes_accessed = size;
4034 num_prefetches++;
4035 if (num_prefetches >= MAX_PREFETCHES)
4036 {
4037 if (loop_dump_stream)
4038 fprintf (loop_dump_stream,
4039 "Maximal number of prefetches exceeded.\n");
4040 return;
4041 }
4042 }
4043 }
4044 }
4045
4046 for (i = 0; i < num_prefetches; i++)
4047 {
4048 int density;
4049
4050 /* Attempt to calculate the total number of bytes fetched by all
4051 iterations of the loop. Avoid overflow. */
4052 if (LOOP_INFO (loop)->n_iterations
4053 && ((unsigned HOST_WIDE_INT) (0xffffffff / info[i].stride)
4054 >= LOOP_INFO (loop)->n_iterations))
4055 info[i].total_bytes = info[i].stride * LOOP_INFO (loop)->n_iterations;
4056 else
4057 info[i].total_bytes = 0xffffffff;
4058
4059 density = info[i].bytes_accessed * 100 / info[i].stride;
4060
4061 /* Prefetch might be worthwhile only when the loads/stores are dense. */
4062 if (PREFETCH_ONLY_DENSE_MEM)
4063 if (density * 256 > PREFETCH_DENSE_MEM * 100
4064 && (info[i].total_bytes / PREFETCH_BLOCK
4065 >= PREFETCH_BLOCKS_BEFORE_LOOP_MIN))
4066 {
4067 info[i].prefetch_before_loop = 1;
4068 info[i].prefetch_in_loop
4069 = (info[i].total_bytes / PREFETCH_BLOCK
4070 > PREFETCH_BLOCKS_BEFORE_LOOP_MAX);
4071 }
4072 else
4073 {
4074 info[i].prefetch_in_loop = 0, info[i].prefetch_before_loop = 0;
4075 if (loop_dump_stream)
4076 fprintf (loop_dump_stream,
4077 "Prefetch: ignoring giv at %d: %d%% density is too low.\n",
4078 INSN_UID (info[i].giv->insn), density);
4079 }
4080 else
4081 info[i].prefetch_in_loop = 1, info[i].prefetch_before_loop = 1;
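/* Worked numbers for the density test above (editorial illustration,
   made-up values): with bytes_accessed == 8 and stride == 64, density is
   8 * 100 / 64 == 12 (percent), so density * 256 == 3072; whether that
   passes depends on the target's PREFETCH_DENSE_MEM * 100 value.  Dense
   accesses, whose stride is close to bytes_accessed, score near 100.  */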
4082
4083 /* Find how many prefetch instructions we'll use within the loop. */
4084 if (info[i].prefetch_in_loop != 0)
4085 {
4086 info[i].prefetch_in_loop = ((info[i].stride + PREFETCH_BLOCK - 1)
4087 / PREFETCH_BLOCK);
4088 num_real_prefetches += info[i].prefetch_in_loop;
4089 if (info[i].write)
4090 num_real_write_prefetches += info[i].prefetch_in_loop;
4091 }
4092 }
4093
4094 /* Determine how many iterations ahead to prefetch within the loop, based
4095 on how many prefetches we currently expect to do within the loop. */
4096 if (num_real_prefetches != 0)
4097 {
4098 if ((ahead = SIMULTANEOUS_PREFETCHES / num_real_prefetches) == 0)
4099 {
4100 if (loop_dump_stream)
4101 fprintf (loop_dump_stream,
4102 "Prefetch: ignoring prefetches within loop: ahead is zero; %d < %d\n",
4103 SIMULTANEOUS_PREFETCHES, num_real_prefetches);
4104 num_real_prefetches = 0, num_real_write_prefetches = 0;
4105 }
4106 }
4107 /* We'll also use AHEAD to determine how many prefetch instructions to
4108 emit before a loop, so don't leave it zero. */
4109 if (ahead == 0)
4110 ahead = PREFETCH_BLOCKS_BEFORE_LOOP_MAX;
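/* For instance (editorial illustration, not target-specific): if the
   target can sustain 4 simultaneous prefetches and we plan 2 prefetch
   insns per iteration, AHEAD becomes 4 / 2 == 2 and each prefetch
   targets data about two prefetch blocks ahead; with 5 planned
   prefetches the division truncates to 0 and in-loop prefetching is
   abandoned above.  */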
4111
4112 for (i = 0; i < num_prefetches; i++)
4113 {
4114 /* Update if we've decided not to prefetch anything within the loop. */
4115 if (num_real_prefetches == 0)
4116 info[i].prefetch_in_loop = 0;
4117
4118 /* Find how many prefetch instructions we'll use before the loop. */
4119 if (info[i].prefetch_before_loop != 0)
4120 {
4121 int n = info[i].total_bytes / PREFETCH_BLOCK;
4122 if (n > ahead)
4123 n = ahead;
4124 info[i].prefetch_before_loop = n;
4125 num_prefetches_before += n;
4126 if (info[i].write)
4127 num_write_prefetches_before += n;
4128 }
4129
4130 if (loop_dump_stream)
4131 {
4132 if (info[i].prefetch_in_loop == 0
4133 && info[i].prefetch_before_loop == 0)
4134 continue;
4135 fprintf (loop_dump_stream, "Prefetch insn: %d",
4136 INSN_UID (info[i].giv->insn));
4137 fprintf (loop_dump_stream,
4138 "; in loop: %d; before: %d; %s\n",
4139 info[i].prefetch_in_loop,
4140 info[i].prefetch_before_loop,
4141 info[i].write ? "read/write" : "read only");
4142 fprintf (loop_dump_stream,
4143 " density: %d%%; bytes_accessed: %u; total_bytes: %u\n",
4144 (int) (info[i].bytes_accessed * 100 / info[i].stride),
4145 info[i].bytes_accessed, info[i].total_bytes);
4146 fprintf (loop_dump_stream, " index: " HOST_WIDE_INT_PRINT_DEC
4147 "; stride: " HOST_WIDE_INT_PRINT_DEC "; address: ",
4148 info[i].index, info[i].stride);
4149 print_rtl (loop_dump_stream, info[i].base_address);
4150 fprintf (loop_dump_stream, "\n");
4151 }
4152 }
4153
4154 if (num_real_prefetches + num_prefetches_before > 0)
4155 {
4156 /* Record that this loop uses prefetch instructions. */
4157 LOOP_INFO (loop)->has_prefetch = 1;
4158
4159 if (loop_dump_stream)
4160 {
4161 fprintf (loop_dump_stream, "Real prefetches needed within loop: %d (write: %d)\n",
4162 num_real_prefetches, num_real_write_prefetches);
4163 fprintf (loop_dump_stream, "Real prefetches needed before loop: %d (write: %d)\n",
4164 num_prefetches_before, num_write_prefetches_before);
4165 }
4166 }
4167
4168 for (i = 0; i < num_prefetches; i++)
4169 {
4170 int y;
4171
4172 for (y = 0; y < info[i].prefetch_in_loop; y++)
4173 {
4174 rtx loc = copy_rtx (*info[i].giv->location);
4175 rtx insn;
4176 int bytes_ahead = PREFETCH_BLOCK * (ahead + y);
4177 rtx before_insn = info[i].giv->insn;
4178 rtx prev_insn = PREV_INSN (info[i].giv->insn);
4179 rtx seq;
4180
4181 /* We can save some effort by offsetting the address on
4182 architectures with offsettable memory references. */
4183 if (offsettable_address_p (0, VOIDmode, loc))
4184 loc = plus_constant (loc, bytes_ahead);
4185 else
4186 {
4187 rtx reg = gen_reg_rtx (Pmode);
4188 loop_iv_add_mult_emit_before (loop, loc, const1_rtx,
4189 GEN_INT (bytes_ahead), reg,
4190 0, before_insn);
4191 loc = reg;
4192 }
4193
4194 start_sequence ();
4195 /* Make sure the address operand is valid for prefetch. */
4196 if (! (*insn_data[(int)CODE_FOR_prefetch].operand[0].predicate)
4197 (loc, insn_data[(int)CODE_FOR_prefetch].operand[0].mode))
4198 loc = force_reg (Pmode, loc);
4199 emit_insn (gen_prefetch (loc, GEN_INT (info[i].write),
4200 GEN_INT (3)));
4201 seq = get_insns ();
4202 end_sequence ();
4203 emit_insn_before (seq, before_insn);
4204
4205 /* Check all insns emitted and record the new GIV
4206 information. */
4207 insn = NEXT_INSN (prev_insn);
4208 while (insn != before_insn)
4209 {
4210 insn = check_insn_for_givs (loop, insn,
4211 info[i].giv->always_executed,
4212 info[i].giv->maybe_multiple);
4213 insn = NEXT_INSN (insn);
4214 }
4215 }
4216
4217 if (PREFETCH_BEFORE_LOOP)
4218 {
4219 /* Emit insns before the loop to fetch the first cache lines or,
4220 if we're not prefetching within the loop, everything we expect
4221 to need. */
4222 for (y = 0; y < info[i].prefetch_before_loop; y++)
4223 {
4224 rtx reg = gen_reg_rtx (Pmode);
4225 rtx loop_start = loop->start;
4226 rtx init_val = info[i].class->initial_value;
4227 rtx add_val = simplify_gen_binary (PLUS, Pmode,
4228 info[i].giv->add_val,
4229 GEN_INT (y * PREFETCH_BLOCK));
4230
4231 /* Functions called by LOOP_IV_ADD_EMIT_BEFORE expect a
4232 non-constant INIT_VAL to have the same mode as REG, which
4233 in this case we know to be Pmode. */
4234 if (GET_MODE (init_val) != Pmode && !CONSTANT_P (init_val))
4235 {
4236 rtx seq;
4237
4238 start_sequence ();
4239 init_val = convert_to_mode (Pmode, init_val, 0);
4240 seq = get_insns ();
4241 end_sequence ();
4242 loop_insn_emit_before (loop, 0, loop_start, seq);
4243 }
4244 loop_iv_add_mult_emit_before (loop, init_val,
4245 info[i].giv->mult_val,
4246 add_val, reg, 0, loop_start);
4247 emit_insn_before (gen_prefetch (reg, GEN_INT (info[i].write),
4248 GEN_INT (3)),
4249 loop_start);
4250 }
4251 }
4252 }
4253
4254 return;
4255 }
4256 \f
4257 /* Communication with routines called via `note_stores'. */
4258
4259 static rtx note_insn;
4260
4261 /* Dummy register to have nonzero DEST_REG for DEST_ADDR type givs. */
4262
4263 static rtx addr_placeholder;
4264
4265 /* ??? Unfinished optimizations, and possible future optimizations,
4266 for the strength reduction code. */
4267
4268 /* ??? The interaction of biv elimination, and recognition of 'constant'
4269 bivs, may cause problems. */
4270
4271 /* ??? Add heuristics so that DEST_ADDR strength reduction does not cause
4272 performance problems.
4273
4274 Perhaps don't eliminate things that can be combined with an addressing
4275 mode. Find all givs that have the same biv, mult_val, and add_val;
4276 then for each giv, check to see if its only use dies in a following
4277 memory address. If so, generate a new memory address and check to see
4278 if it is valid. If it is valid, then store the modified memory address,
4279 otherwise, mark the giv as not done so that it will get its own iv. */
4280
4281 /* ??? Could try to optimize branches when it is known that a biv is always
4282 positive. */
4283
4284 /* ??? When replacing a biv in a compare insn, we should replace it with the
4285 closest giv so that an optimized branch can still be recognized by the
4286 combiner, e.g. the VAX acb insn. */
4287
4288 /* ??? Many of the checks involving uid_luid could be simplified if regscan
4289 was rerun in loop_optimize whenever a register was added or moved.
4290 Also, some of the optimizations could be a little less conservative. */
4291 \f
4292 /* Scan the loop body and call FNCALL for each insn. In addition to the
4293 LOOP and INSN parameters, pass MAYBE_MULTIPLE and NOT_EVERY_ITERATION to the
4294 callback.
4295
4296 NOT_EVERY_ITERATION is 1 if the current insn is not known to be executed at
4297 least once for every loop iteration except for the last one.
4298
4299 MAYBE_MULTIPLE is 1 if the current insn may be executed more than once for
4300 every loop iteration.
4301 */
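/* Rough illustration (editorial, simplified): in a loop body like

       for (i = 0; i < n; i++)
         {
           if (cond)
             a = b;                  (NOT_EVERY_ITERATION is 1 here)
         inner:
           ...
           if (other) goto inner;    (insns after `inner' get MAYBE_MULTIPLE 1)
         }

   the first assignment may be skipped in some iterations, and the insns
   after the label may run several times per iteration.  */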
4302 void
4303 for_each_insn_in_loop (struct loop *loop, loop_insn_callback fncall)
4304 {
4305 int not_every_iteration = 0;
4306 int maybe_multiple = 0;
4307 int past_loop_latch = 0;
4308 int loop_depth = 0;
4309 rtx p;
4310
4311 /* If loop_scan_start points to the loop exit test, we have to be wary of
4312 subversive use of gotos inside expression statements. */
4313 if (prev_nonnote_insn (loop->scan_start) != prev_nonnote_insn (loop->start))
4314 maybe_multiple = back_branch_in_range_p (loop, loop->scan_start);
4315
4316 /* Scan through loop and update NOT_EVERY_ITERATION and MAYBE_MULTIPLE. */
4317 for (p = next_insn_in_loop (loop, loop->scan_start);
4318 p != NULL_RTX;
4319 p = next_insn_in_loop (loop, p))
4320 {
4321 p = fncall (loop, p, not_every_iteration, maybe_multiple);
4322
4323 /* Past CODE_LABEL, we get to insns that may be executed multiple
4324 times. The only way we can be sure that they can't is if every
4325 jump insn between here and the end of the loop either
4326 returns, exits the loop, is a jump to a location that is still
4327 behind the label, or is a jump to the loop start. */
4328
4329 if (GET_CODE (p) == CODE_LABEL)
4330 {
4331 rtx insn = p;
4332
4333 maybe_multiple = 0;
4334
4335 while (1)
4336 {
4337 insn = NEXT_INSN (insn);
4338 if (insn == loop->scan_start)
4339 break;
4340 if (insn == loop->end)
4341 {
4342 if (loop->top != 0)
4343 insn = loop->top;
4344 else
4345 break;
4346 if (insn == loop->scan_start)
4347 break;
4348 }
4349
4350 if (GET_CODE (insn) == JUMP_INSN
4351 && GET_CODE (PATTERN (insn)) != RETURN
4352 && (!any_condjump_p (insn)
4353 || (JUMP_LABEL (insn) != 0
4354 && JUMP_LABEL (insn) != loop->scan_start
4355 && !loop_insn_first_p (p, JUMP_LABEL (insn)))))
4356 {
4357 maybe_multiple = 1;
4358 break;
4359 }
4360 }
4361 }
4362
4363 /* Past a jump, we get to insns for which we can't count
4364 on whether they will be executed during each iteration. */
4365 /* This code appears twice in strength_reduce. There is also similar
4366 code in scan_loop. */
4367 if (GET_CODE (p) == JUMP_INSN
4368 /* If we enter the loop in the middle, and scan around to the
4369 beginning, don't set not_every_iteration for that.
4370 This can be any kind of jump, since we want to know if insns
4371 will be executed if the loop is executed. */
4372 && !(JUMP_LABEL (p) == loop->top
4373 && ((NEXT_INSN (NEXT_INSN (p)) == loop->end
4374 && any_uncondjump_p (p))
4375 || (NEXT_INSN (p) == loop->end && any_condjump_p (p)))))
4376 {
4377 rtx label = 0;
4378
4379 /* If this is a jump outside the loop, then it also doesn't
4380 matter. Check to see if the target of this branch is on the
4381 loop->exit_labels list. */
4382
4383 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
4384 if (XEXP (label, 0) == JUMP_LABEL (p))
4385 break;
4386
4387 if (!label)
4388 not_every_iteration = 1;
4389 }
4390
4391 else if (GET_CODE (p) == NOTE)
4392 {
4393 /* At the virtual top of a converted loop, insns are again known to
4394 be executed each iteration: logically, the loop begins here
4395 even though the exit code has been duplicated.
4396
4397 Insns are also again known to be executed each iteration at
4398 the LOOP_CONT note. */
4399 if ((NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP
4400 || NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_CONT)
4401 && loop_depth == 0)
4402 not_every_iteration = 0;
4403 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
4404 loop_depth++;
4405 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
4406 loop_depth--;
4407 }
4408
4409 /* Note if we pass a loop latch. If we do, then we can not clear
4410 NOT_EVERY_ITERATION below when we pass the last CODE_LABEL in
4411 a loop since a jump before the last CODE_LABEL may have started
4412 a new loop iteration.
4413
4414 Note that LOOP_TOP is only set for rotated loops and we need
4415 this check for all loops, so compare against the CODE_LABEL
4416 which immediately follows LOOP_START. */
4417 if (GET_CODE (p) == JUMP_INSN
4418 && JUMP_LABEL (p) == NEXT_INSN (loop->start))
4419 past_loop_latch = 1;
4420
4421 /* Unlike in the code motion pass where MAYBE_NEVER indicates that
4422 an insn may never be executed, NOT_EVERY_ITERATION indicates whether
4423 or not an insn is known to be executed each iteration of the
4424 loop, whether or not any iterations are known to occur.
4425
4426 Therefore, if we have just passed a label and have no more labels
4427 between here and the test insn of the loop, and we have not passed
4428 a jump to the top of the loop, then we know these insns will be
4429 executed each iteration. */
4430
4431 if (not_every_iteration
4432 && !past_loop_latch
4433 && GET_CODE (p) == CODE_LABEL
4434 && no_labels_between_p (p, loop->end)
4435 && loop_insn_first_p (p, loop->cont))
4436 not_every_iteration = 0;
4437 }
4438 }
4439 \f
4440 static void
4441 loop_bivs_find (struct loop *loop)
4442 {
4443 struct loop_regs *regs = LOOP_REGS (loop);
4444 struct loop_ivs *ivs = LOOP_IVS (loop);
4445 /* Temporary list pointers for traversing ivs->list. */
4446 struct iv_class *bl, **backbl;
4447
4448 ivs->list = 0;
4449
4450 for_each_insn_in_loop (loop, check_insn_for_bivs);
4451
4452 /* Scan ivs->list to remove all regs that proved not to be bivs.
4453 Make a sanity check against regs->n_times_set. */
4454 for (backbl = &ivs->list, bl = *backbl; bl; bl = bl->next)
4455 {
4456 if (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4457 /* The above happens if the register is modified by a subreg, etc. */
4458 /* Make sure it is not recognized as a basic induction var: */
4459 || regs->array[bl->regno].n_times_set != bl->biv_count
4460 /* If never incremented, it is an invariant that we decided not to
4461 move. So leave it alone. */
4462 || ! bl->incremented)
4463 {
4464 if (loop_dump_stream)
4465 fprintf (loop_dump_stream, "Biv %d: discarded, %s\n",
4466 bl->regno,
4467 (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4468 ? "not induction variable"
4469 : (! bl->incremented ? "never incremented"
4470 : "count error")));
4471
4472 REG_IV_TYPE (ivs, bl->regno) = NOT_BASIC_INDUCT;
4473 *backbl = bl->next;
4474 }
4475 else
4476 {
4477 backbl = &bl->next;
4478
4479 if (loop_dump_stream)
4480 fprintf (loop_dump_stream, "Biv %d: verified\n", bl->regno);
4481 }
4482 }
4483 }
4484
4485
4486 /* Determine how BIVs are initialized by looking through the pre-header
4487 extended basic block. */
4488 static void
4489 loop_bivs_init_find (struct loop *loop)
4490 {
4491 struct loop_ivs *ivs = LOOP_IVS (loop);
4492 /* Temporary list pointers for traversing ivs->list. */
4493 struct iv_class *bl;
4494 int call_seen;
4495 rtx p;
4496
4497 /* Find initial value for each biv by searching backwards from loop_start,
4498 halting at first label. Also record any test condition. */
4499
4500 call_seen = 0;
4501 for (p = loop->start; p && GET_CODE (p) != CODE_LABEL; p = PREV_INSN (p))
4502 {
4503 rtx test;
4504
4505 note_insn = p;
4506
4507 if (GET_CODE (p) == CALL_INSN)
4508 call_seen = 1;
4509
4510 if (INSN_P (p))
4511 note_stores (PATTERN (p), record_initial, ivs);
4512
4513 /* Record any test of a biv that branches around the loop if there is no
4514 store between it and the start of the loop. We only care about tests with
4515 constants and registers, and only certain of those. */
4516 if (GET_CODE (p) == JUMP_INSN
4517 && JUMP_LABEL (p) != 0
4518 && next_real_insn (JUMP_LABEL (p)) == next_real_insn (loop->end)
4519 && (test = get_condition_for_loop (loop, p)) != 0
4520 && GET_CODE (XEXP (test, 0)) == REG
4521 && REGNO (XEXP (test, 0)) < max_reg_before_loop
4522 && (bl = REG_IV_CLASS (ivs, REGNO (XEXP (test, 0)))) != 0
4523 && valid_initial_value_p (XEXP (test, 1), p, call_seen, loop->start)
4524 && bl->init_insn == 0)
4525 {
4526 /* If an NE test, we have an initial value! */
4527 if (GET_CODE (test) == NE)
4528 {
4529 bl->init_insn = p;
4530 bl->init_set = gen_rtx_SET (VOIDmode,
4531 XEXP (test, 0), XEXP (test, 1));
4532 }
4533 else
4534 bl->initial_test = test;
4535 }
4536 }
4537 }
4538
4539
4540 /* Look at each biv and see if we can say anything better about its
4541 initial value from any initializing insns set up above. (This is done
4542 in two passes to avoid missing SETs in a PARALLEL.) */
4543 static void
4544 loop_bivs_check (struct loop *loop)
4545 {
4546 struct loop_ivs *ivs = LOOP_IVS (loop);
4547 /* Temporary list pointers for traversing ivs->list. */
4548 struct iv_class *bl;
4549 struct iv_class **backbl;
4550
4551 for (backbl = &ivs->list; (bl = *backbl); backbl = &bl->next)
4552 {
4553 rtx src;
4554 rtx note;
4555
4556 if (! bl->init_insn)
4557 continue;
4558
4559 /* If INIT_INSN has a REG_EQUAL or REG_EQUIV note and the value
4560 is a constant, use that value. */
4561 if (((note = find_reg_note (bl->init_insn, REG_EQUAL, 0)) != NULL
4562 && CONSTANT_P (XEXP (note, 0)))
4563 || ((note = find_reg_note (bl->init_insn, REG_EQUIV, 0)) != NULL
4564 && CONSTANT_P (XEXP (note, 0))))
4565 src = XEXP (note, 0);
4566 else
4567 src = SET_SRC (bl->init_set);
4568
4569 if (loop_dump_stream)
4570 fprintf (loop_dump_stream,
4571 "Biv %d: initialized at insn %d: initial value ",
4572 bl->regno, INSN_UID (bl->init_insn));
4573
4574 if ((GET_MODE (src) == GET_MODE (regno_reg_rtx[bl->regno])
4575 || GET_MODE (src) == VOIDmode)
4576 && valid_initial_value_p (src, bl->init_insn,
4577 LOOP_INFO (loop)->pre_header_has_call,
4578 loop->start))
4579 {
4580 bl->initial_value = src;
4581
4582 if (loop_dump_stream)
4583 {
4584 print_simple_rtl (loop_dump_stream, src);
4585 fputc ('\n', loop_dump_stream);
4586 }
4587 }
4588 /* If we can't make it a giv,
4589 let the biv keep its initial value of "itself". */
4590 else if (loop_dump_stream)
4591 fprintf (loop_dump_stream, "is complex\n");
4592 }
4593 }
4594
4595
4596 /* Search the loop for general induction variables. */
4597
4598 static void
4599 loop_givs_find (struct loop* loop)
4600 {
4601 for_each_insn_in_loop (loop, check_insn_for_givs);
4602 }
4603
4604
4605 /* For each giv for which we still don't know whether or not it is
4606 replaceable, check to see if it is replaceable because its final value
4607 can be calculated. */
4608
4609 static void
4610 loop_givs_check (struct loop *loop)
4611 {
4612 struct loop_ivs *ivs = LOOP_IVS (loop);
4613 struct iv_class *bl;
4614
4615 for (bl = ivs->list; bl; bl = bl->next)
4616 {
4617 struct induction *v;
4618
4619 for (v = bl->giv; v; v = v->next_iv)
4620 if (! v->replaceable && ! v->not_replaceable)
4621 check_final_value (loop, v);
4622 }
4623 }
4624
4625
4626 /* Return nonzero if it is possible to eliminate the biv BL provided
4627 all givs are reduced. This is possible if either the reg is not
4628 used outside the loop, or we can compute what its final value will
4629 be. */
4630
4631 static int
4632 loop_biv_eliminable_p (struct loop *loop, struct iv_class *bl,
4633 int threshold, int insn_count)
4634 {
4635 /* For architectures with a decrement_and_branch_until_zero insn,
4636 don't do this if we put a REG_NONNEG note on the endtest for this
4637 biv. */
4638
4639 #ifdef HAVE_decrement_and_branch_until_zero
4640 if (bl->nonneg)
4641 {
4642 if (loop_dump_stream)
4643 fprintf (loop_dump_stream,
4644 "Cannot eliminate nonneg biv %d.\n", bl->regno);
4645 return 0;
4646 }
4647 #endif
4648
4649 /* Check that the biv is not used outside the loop, or that its final value
4650 can be computed. Compare against bl->init_insn rather than loop->start. We aren't
4651 concerned with any uses of the biv between init_insn and
4652 loop->start since these won't be affected by the value of the biv
4653 elsewhere in the function, so long as init_insn doesn't use the
4654 biv itself. */
4655
4656 if ((REGNO_LAST_LUID (bl->regno) < INSN_LUID (loop->end)
4657 && bl->init_insn
4658 && INSN_UID (bl->init_insn) < max_uid_for_loop
4659 && REGNO_FIRST_LUID (bl->regno) >= INSN_LUID (bl->init_insn)
4660 && ! reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
4661 || (bl->final_value = final_biv_value (loop, bl)))
4662 return maybe_eliminate_biv (loop, bl, 0, threshold, insn_count);
4663
4664 if (loop_dump_stream)
4665 {
4666 fprintf (loop_dump_stream,
4667 "Cannot eliminate biv %d.\n",
4668 bl->regno);
4669 fprintf (loop_dump_stream,
4670 "First use: insn %d, last use: insn %d.\n",
4671 REGNO_FIRST_UID (bl->regno),
4672 REGNO_LAST_UID (bl->regno));
4673 }
4674 return 0;
4675 }
4676
4677
4678 /* Reduce each giv of BL that we have decided to reduce. */
4679
4680 static void
4681 loop_givs_reduce (struct loop *loop, struct iv_class *bl)
4682 {
4683 struct induction *v;
4684
4685 for (v = bl->giv; v; v = v->next_iv)
4686 {
4687 struct induction *tv;
4688 if (! v->ignore && v->same == 0)
4689 {
4690 int auto_inc_opt = 0;
4691
4692 /* If the code for derived givs immediately below has already
4693 allocated a new_reg, we must keep it. */
4694 if (! v->new_reg)
4695 v->new_reg = gen_reg_rtx (v->mode);
4696
4697 #ifdef AUTO_INC_DEC
4698 /* If the target has auto-increment addressing modes, and
4699 this is an address giv, then try to put the increment
4700 immediately after its use, so that flow can create an
4701 auto-increment addressing mode. */
4702 if (v->giv_type == DEST_ADDR && bl->biv_count == 1
4703 && bl->biv->always_executed && ! bl->biv->maybe_multiple
4704 /* We don't handle reversed biv's because bl->biv->insn
4705 does not have a valid INSN_LUID. */
4706 && ! bl->reversed
4707 && v->always_executed && ! v->maybe_multiple
4708 && INSN_UID (v->insn) < max_uid_for_loop)
4709 {
4710 /* If other giv's have been combined with this one, then
4711 this will work only if all uses of the other giv's occur
4712 before this giv's insn. This is difficult to check.
4713
4714 We simplify this by looking for the common case where
4715 there is one DEST_REG giv, and this giv's insn is the
4716 last use of the dest_reg of that DEST_REG giv. If the
4717 increment occurs after the address giv, then we can
4718 perform the optimization. (Otherwise, the increment
4719 would have to go before other_giv, and we would not be
4720 able to combine it with the address giv to get an
4721 auto-inc address.) */
4722 if (v->combined_with)
4723 {
4724 struct induction *other_giv = 0;
4725
4726 for (tv = bl->giv; tv; tv = tv->next_iv)
4727 if (tv->same == v)
4728 {
4729 if (other_giv)
4730 break;
4731 else
4732 other_giv = tv;
4733 }
4734 if (! tv && other_giv
4735 && REGNO (other_giv->dest_reg) < max_reg_before_loop
4736 && (REGNO_LAST_UID (REGNO (other_giv->dest_reg))
4737 == INSN_UID (v->insn))
4738 && INSN_LUID (v->insn) < INSN_LUID (bl->biv->insn))
4739 auto_inc_opt = 1;
4740 }
4741 /* Check for case where increment is before the address
4742 giv. Do this test in "loop order". */
4743 else if ((INSN_LUID (v->insn) > INSN_LUID (bl->biv->insn)
4744 && (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4745 || (INSN_LUID (bl->biv->insn)
4746 > INSN_LUID (loop->scan_start))))
4747 || (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4748 && (INSN_LUID (loop->scan_start)
4749 < INSN_LUID (bl->biv->insn))))
4750 auto_inc_opt = -1;
4751 else
4752 auto_inc_opt = 1;
4753
4754 #ifdef HAVE_cc0
4755 {
4756 rtx prev;
4757
4758 /* We can't put an insn immediately after one setting
4759 cc0, or immediately before one using cc0. */
4760 if ((auto_inc_opt == 1 && sets_cc0_p (PATTERN (v->insn)))
4761 || (auto_inc_opt == -1
4762 && (prev = prev_nonnote_insn (v->insn)) != 0
4763 && INSN_P (prev)
4764 && sets_cc0_p (PATTERN (prev))))
4765 auto_inc_opt = 0;
4766 }
4767 #endif
4768
4769 if (auto_inc_opt)
4770 v->auto_inc_opt = 1;
4771 }
4772 #endif
4773
4774 /* For each place where the biv is incremented, add an insn
4775 to increment the new, reduced reg for the giv. */
4776 for (tv = bl->biv; tv; tv = tv->next_iv)
4777 {
4778 rtx insert_before;
4779
4780 /* Skip if location is the same as a previous one. */
4781 if (tv->same)
4782 continue;
4783 if (! auto_inc_opt)
4784 insert_before = NEXT_INSN (tv->insn);
4785 else if (auto_inc_opt == 1)
4786 insert_before = NEXT_INSN (v->insn);
4787 else
4788 insert_before = v->insn;
4789
4790 if (tv->mult_val == const1_rtx)
4791 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4792 v->new_reg, v->new_reg,
4793 0, insert_before);
4794 else /* tv->mult_val == const0_rtx */
4795 /* A multiply is acceptable here
4796 since this is presumed to be seldom executed. */
4797 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4798 v->add_val, v->new_reg,
4799 0, insert_before);
4800 }
4801
4802 /* Add code at loop start to initialize giv's reduced reg. */
4803
4804 loop_iv_add_mult_hoist (loop,
4805 extend_value_for_giv (v, bl->initial_value),
4806 v->mult_val, v->add_val, v->new_reg);
4807 }
4808 }
4809 }
4810
4811
4812 /* Check for givs whose first use is their definition and whose
4813 last use is the definition of another giv. If so, it is likely
4814 dead and should not be used to derive another giv nor to
4815 eliminate a biv. */
4816
4817 static void
4818 loop_givs_dead_check (struct loop *loop ATTRIBUTE_UNUSED, struct iv_class *bl)
4819 {
4820 struct induction *v;
4821
4822 for (v = bl->giv; v; v = v->next_iv)
4823 {
4824 if (v->ignore
4825 || (v->same && v->same->ignore))
4826 continue;
4827
4828 if (v->giv_type == DEST_REG
4829 && REGNO_FIRST_UID (REGNO (v->dest_reg)) == INSN_UID (v->insn))
4830 {
4831 struct induction *v1;
4832
4833 for (v1 = bl->giv; v1; v1 = v1->next_iv)
4834 if (REGNO_LAST_UID (REGNO (v->dest_reg)) == INSN_UID (v1->insn))
4835 v->maybe_dead = 1;
4836 }
4837 }
4838 }
4839
4840
4841 static void
4842 loop_givs_rescan (struct loop *loop, struct iv_class *bl, rtx *reg_map)
4843 {
4844 struct induction *v;
4845
4846 for (v = bl->giv; v; v = v->next_iv)
4847 {
4848 if (v->same && v->same->ignore)
4849 v->ignore = 1;
4850
4851 if (v->ignore)
4852 continue;
4853
4854 /* Update expression if this was combined, in case other giv was
4855 replaced. */
4856 if (v->same)
4857 v->new_reg = replace_rtx (v->new_reg,
4858 v->same->dest_reg, v->same->new_reg);
4859
4860 /* See if this register is known to be a pointer to something. If
4861 so, see if we can find the alignment. First see if there is a
4862 destination register that is a pointer. If so, this shares the
4863 alignment too. Next see if we can deduce anything from the
4864 computational information. If not, and this is a DEST_ADDR
4865 giv, at least we know that it's a pointer, though we don't know
4866 the alignment. */
4867 if (GET_CODE (v->new_reg) == REG
4868 && v->giv_type == DEST_REG
4869 && REG_POINTER (v->dest_reg))
4870 mark_reg_pointer (v->new_reg,
4871 REGNO_POINTER_ALIGN (REGNO (v->dest_reg)));
4872 else if (GET_CODE (v->new_reg) == REG
4873 && REG_POINTER (v->src_reg))
4874 {
4875 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->src_reg));
4876
4877 if (align == 0
4878 || GET_CODE (v->add_val) != CONST_INT
4879 || INTVAL (v->add_val) % (align / BITS_PER_UNIT) != 0)
4880 align = 0;
4881
4882 mark_reg_pointer (v->new_reg, align);
4883 }
4884 else if (GET_CODE (v->new_reg) == REG
4885 && GET_CODE (v->add_val) == REG
4886 && REG_POINTER (v->add_val))
4887 {
4888 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->add_val));
4889
4890 if (align == 0 || GET_CODE (v->mult_val) != CONST_INT
4891 || INTVAL (v->mult_val) % (align / BITS_PER_UNIT) != 0)
4892 align = 0;
4893
4894 mark_reg_pointer (v->new_reg, align);
4895 }
4896 else if (GET_CODE (v->new_reg) == REG && v->giv_type == DEST_ADDR)
4897 mark_reg_pointer (v->new_reg, 0);
4898
4899 if (v->giv_type == DEST_ADDR)
4900 /* Store reduced reg as the address in the memref where we found
4901 this giv. */
4902 validate_change (v->insn, v->location, v->new_reg, 0);
4903 else if (v->replaceable)
4904 {
4905 reg_map[REGNO (v->dest_reg)] = v->new_reg;
4906 }
4907 else
4908 {
4909 rtx original_insn = v->insn;
4910 rtx note;
4911
4912 /* Not replaceable; emit an insn to set the original giv reg from
4913 the reduced giv, same as above. */
4914 v->insn = loop_insn_emit_after (loop, 0, original_insn,
4915 gen_move_insn (v->dest_reg,
4916 v->new_reg));
4917
4918 /* The original insn may have a REG_EQUAL note. This note is
4919 now incorrect and may result in invalid substitutions later.
4920 The original insn is dead, but may be part of a libcall
4921 sequence, which doesn't seem worth the bother of handling. */
4922 note = find_reg_note (original_insn, REG_EQUAL, NULL_RTX);
4923 if (note)
4924 remove_note (original_insn, note);
4925 }
4926
4927 /* When a loop is reversed, givs which depend on the reversed
4928 biv, and which are live outside the loop, must be set to their
4929 correct final value. This insn is only needed if the giv is
4930 not replaceable. The correct final value is the same as the
4931 value that the giv starts the reversed loop with. */
4932 if (bl->reversed && ! v->replaceable)
4933 loop_iv_add_mult_sink (loop,
4934 extend_value_for_giv (v, bl->initial_value),
4935 v->mult_val, v->add_val, v->dest_reg);
4936 else if (v->final_value)
4937 loop_insn_sink_or_swim (loop,
4938 gen_load_of_final_value (v->dest_reg,
4939 v->final_value));
4940
4941 if (loop_dump_stream)
4942 {
4943 fprintf (loop_dump_stream, "giv at %d reduced to ",
4944 INSN_UID (v->insn));
4945 print_simple_rtl (loop_dump_stream, v->new_reg);
4946 fprintf (loop_dump_stream, "\n");
4947 }
4948 }
4949 }
4950
4951
4952 static int
4953 loop_giv_reduce_benefit (struct loop *loop ATTRIBUTE_UNUSED,
4954 struct iv_class *bl, struct induction *v,
4955 rtx test_reg)
4956 {
4957 int add_cost;
4958 int benefit;
4959
4960 benefit = v->benefit;
4961 PUT_MODE (test_reg, v->mode);
4962 add_cost = iv_add_mult_cost (bl->biv->add_val, v->mult_val,
4963 test_reg, test_reg);
4964
4965 /* Reduce benefit if not replaceable, since we will insert a
4966 move-insn to replace the insn that calculates this giv. Don't do
4967 this unless the giv is a user variable, since it will often be
4968 marked non-replaceable because of the duplication of the exit
4969 code outside the loop. In such a case, the copies we insert are
4970 dead and will be deleted. So they don't have a cost. Similar
4971 situations exist. */
4972 /* ??? The new final_[bg]iv_value code does a much better job of
4973 finding replaceable giv's, and hence this code may no longer be
4974 necessary. */
4975 if (! v->replaceable && ! bl->eliminable
4976 && REG_USERVAR_P (v->dest_reg))
4977 benefit -= copy_cost;
4978
4979 /* Decrease the benefit to count the add-insns that we will insert
4980 to increment the reduced reg for the giv. ??? This can
4981 overestimate the run-time cost of the additional insns, e.g. if
4982 there are multiple basic blocks that increment the biv, but only
4983 one of these blocks is executed during each iteration. There is
4984 no good way to detect cases like this with the current structure
4985 of the loop optimizer. This code is more accurate for
4986 determining code size than run-time benefits. */
4987 benefit -= add_cost * bl->biv_count;
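/* Worked numbers (editorial, made up): a giv with benefit 6, in a loop
   whose biv is incremented in two places and where the add costs 2,
   ends up with benefit 6 - 2 * 2 == 2.  */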
4988
4989 /* Decide whether to strength-reduce this giv or to leave the code
4990 unchanged (recompute it from the biv each time it is used). This
4991 decision can be made independently for each giv. */
4992
4993 #ifdef AUTO_INC_DEC
4994 /* Attempt to guess whether autoincrement will handle some of the
4995 new add insns; if so, increase BENEFIT (undo the subtraction of
4996 add_cost that was done above). */
4997 if (v->giv_type == DEST_ADDR
4998 /* Increasing the benefit is risky, since this is only a guess.
4999 Avoid increasing register pressure in cases where there would
5000 be no other benefit from reducing this giv. */
5001 && benefit > 0
5002 && GET_CODE (v->mult_val) == CONST_INT)
5003 {
5004 int size = GET_MODE_SIZE (GET_MODE (v->mem));
5005
5006 if (HAVE_POST_INCREMENT
5007 && INTVAL (v->mult_val) == size)
5008 benefit += add_cost * bl->biv_count;
5009 else if (HAVE_PRE_INCREMENT
5010 && INTVAL (v->mult_val) == size)
5011 benefit += add_cost * bl->biv_count;
5012 else if (HAVE_POST_DECREMENT
5013 && -INTVAL (v->mult_val) == size)
5014 benefit += add_cost * bl->biv_count;
5015 else if (HAVE_PRE_DECREMENT
5016 && -INTVAL (v->mult_val) == size)
5017 benefit += add_cost * bl->biv_count;
5018 }
5019 #endif
5020
5021 return benefit;
5022 }
5023
5024
5025 /* Free IV structures for LOOP. */
5026
5027 static void
5028 loop_ivs_free (struct loop *loop)
5029 {
5030 struct loop_ivs *ivs = LOOP_IVS (loop);
5031 struct iv_class *iv = ivs->list;
5032
5033 free (ivs->regs);
5034
5035 while (iv)
5036 {
5037 struct iv_class *next = iv->next;
5038 struct induction *induction;
5039 struct induction *next_induction;
5040
5041 for (induction = iv->biv; induction; induction = next_induction)
5042 {
5043 next_induction = induction->next_iv;
5044 free (induction);
5045 }
5046 for (induction = iv->giv; induction; induction = next_induction)
5047 {
5048 next_induction = induction->next_iv;
5049 free (induction);
5050 }
5051
5052 free (iv);
5053 iv = next;
5054 }
5055 }
5056
5057
5058 /* Perform strength reduction and induction variable elimination.
5059
5060 Pseudo registers created during this function will be beyond the
5061 last valid index in several tables including
5062 REGS->ARRAY[I].N_TIMES_SET and REGNO_LAST_UID. This does not cause a
5063 problem here, because the added registers cannot be givs outside of
5064 their loop, and hence will never be reconsidered. But scan_loop
5065 must check regnos to make sure they are in bounds. */
5066
5067 static void
5068 strength_reduce (struct loop *loop, int flags)
5069 {
5070 struct loop_info *loop_info = LOOP_INFO (loop);
5071 struct loop_regs *regs = LOOP_REGS (loop);
5072 struct loop_ivs *ivs = LOOP_IVS (loop);
5073 rtx p;
5074 /* Temporary list pointer for traversing ivs->list. */
5075 struct iv_class *bl;
5076 /* Ratio of extra register life span we can justify
5077 for saving an instruction. More if loop doesn't call subroutines
5078 since in that case saving an insn makes more difference
5079 and more registers are available. */
5080 /* ??? could set this to last value of threshold in move_movables */
5081 int threshold = (loop_info->has_call ? 1 : 2) * (3 + n_non_fixed_regs);
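/* Editorial illustration (made-up register count): with, say, 29
   non-fixed registers and no calls in the loop, threshold is
   2 * (3 + 29) == 64; with a call it halves to 32, reflecting the
   smaller payoff and the scarcer registers.  */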
5082 /* Map of pseudo-register replacements. */
5083 rtx *reg_map = NULL;
5084 int reg_map_size;
5085 int unrolled_insn_copies = 0;
5086 rtx test_reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
5087 int insn_count = count_insns_in_loop (loop);
5088
5089 addr_placeholder = gen_reg_rtx (Pmode);
5090
5091 ivs->n_regs = max_reg_before_loop;
5092 ivs->regs = xcalloc (ivs->n_regs, sizeof (struct iv));
5093
5094 /* Find all BIVs in loop. */
5095 loop_bivs_find (loop);
5096
5097 /* Exit if there are no bivs. */
5098 if (! ivs->list)
5099 {
5100 /* We can still unroll the loop anyway, but indicate that there is no
5101 strength reduction info available. */
5102 if (flags & LOOP_UNROLL)
5103 unroll_loop (loop, insn_count, 0);
5104
5105 loop_ivs_free (loop);
5106 return;
5107 }
5108
5109 /* Determine how BIVs are initialized by looking through the pre-header
5110 extended basic block. */
5111 loop_bivs_init_find (loop);
5112
5113 /* Look at each biv and see if we can say anything better about its
5114 initial value from any initializing insns set up above. */
5115 loop_bivs_check (loop);
5116
5117 /* Search the loop for general induction variables. */
5118 loop_givs_find (loop);
5119
5120 /* Try to calculate and save the number of loop iterations. This is
5121 set to zero if the actual number can not be calculated. This must
5122 be called after all giv's have been identified, since otherwise it may
5123 fail if the iteration variable is a giv. */
5124 loop_iterations (loop);
5125
5126 #ifdef HAVE_prefetch
5127 if (flags & LOOP_PREFETCH)
5128 emit_prefetch_instructions (loop);
5129 #endif
5130
5131 /* Now for each giv for which we still don't know whether or not it is
5132 replaceable, check to see if it is replaceable because its final value
5133 can be calculated. This must be done after loop_iterations is called,
5134 so that final_giv_value will work correctly. */
5135 loop_givs_check (loop);
5136
5137 /* Try to prove that the loop counter variable (if any) is always
5138 nonnegative; if so, record that fact with a REG_NONNEG note
5139 so that "decrement and branch until zero" insn can be used. */
5140 check_dbra_loop (loop, insn_count);
5141
5142 /* Create reg_map to hold substitutions for replaceable giv regs.
5143 Some givs might have been made from biv increments, so look at
5144 ivs->reg_iv_type for a suitable size. */
5145 reg_map_size = ivs->n_regs;
5146 reg_map = xcalloc (reg_map_size, sizeof (rtx));
5147
5148 /* Examine each iv class for feasibility of strength reduction/induction
5149 variable elimination. */
5150
5151 for (bl = ivs->list; bl; bl = bl->next)
5152 {
5153 struct induction *v;
5154 int benefit;
5155
5156 /* Test whether it will be possible to eliminate this biv
5157 provided all givs are reduced. */
5158 bl->eliminable = loop_biv_eliminable_p (loop, bl, threshold, insn_count);
5159
5160 /* This will be true at the end, if all givs which depend on this
5161 biv have been strength reduced.
5162 We can't (currently) eliminate the biv unless this is so. */
5163 bl->all_reduced = 1;
5164
5165 /* Check each extension dependent giv in this class to see if its
5166 root biv is safe from wrapping in the interior mode. */
5167 check_ext_dependent_givs (loop, bl);
5168
5169 /* Combine all giv's for this iv_class. */
5170 combine_givs (regs, bl);
5171
5172 for (v = bl->giv; v; v = v->next_iv)
5173 {
5174 struct induction *tv;
5175
5176 if (v->ignore || v->same)
5177 continue;
5178
5179 benefit = loop_giv_reduce_benefit (loop, bl, v, test_reg);
5180
5181 /* If an insn is not to be strength reduced, then set its ignore
5182 flag, and clear bl->all_reduced. */
5183
5184 /* A giv that depends on a reversed biv must be reduced if it is
5185 used after the loop exit, otherwise, it would have the wrong
5186 value after the loop exit. To make it simple, just reduce all
5187 of such giv's whether or not we know they are used after the loop
5188 exit. */
5189
5190 if (! flag_reduce_all_givs
5191 && v->lifetime * threshold * benefit < insn_count
5192 && ! bl->reversed)
5193 {
5194 if (loop_dump_stream)
5195 fprintf (loop_dump_stream,
5196 "giv of insn %d not worth while, %d vs %d.\n",
5197 INSN_UID (v->insn),
5198 v->lifetime * threshold * benefit, insn_count);
5199 v->ignore = 1;
5200 bl->all_reduced = 0;
5201 }
5202 else
5203 {
5204 /* Check that we can increment the reduced giv without a
5205 multiply insn. If not, reject it. */
5206
5207 for (tv = bl->biv; tv; tv = tv->next_iv)
5208 if (tv->mult_val == const1_rtx
5209 && ! product_cheap_p (tv->add_val, v->mult_val))
5210 {
5211 if (loop_dump_stream)
5212 fprintf (loop_dump_stream,
5213 "giv of insn %d: would need a multiply.\n",
5214 INSN_UID (v->insn));
5215 v->ignore = 1;
5216 bl->all_reduced = 0;
5217 break;
5218 }
5219 }
5220 }
5221
5222 /* Check for givs whose first use is their definition and whose
5223 last use is the definition of another giv. If so, it is likely
5224 dead and should not be used to derive another giv nor to
5225 eliminate a biv. */
5226 loop_givs_dead_check (loop, bl);
5227
5228 /* Reduce each giv that we decided to reduce. */
5229 loop_givs_reduce (loop, bl);
5230
5231 /* Rescan all givs. If a giv is the same as a giv not reduced, mark it
5232 as not reduced.
5233
5234 For each giv register that can be reduced now: if replaceable,
5235 substitute reduced reg wherever the old giv occurs;
5236 else add new move insn "giv_reg = reduced_reg". */
5237 loop_givs_rescan (loop, bl, reg_map);
5238
5239 /* All the givs based on the biv bl have been reduced if they
5240 merit it. */
5241
5242 /* For each giv not marked as maybe dead that has been combined with a
5243 second giv, clear any "maybe dead" mark on that second giv.
5244 v->new_reg will either be or refer to the register of the giv it
5245 combined with.
5246
5247 Doing this clearing avoids problems in biv elimination where
5248 a giv's new_reg is a complex value that can't be put in the
5249 insn but the giv combined with (with a reg as new_reg) is
5250 marked maybe_dead. Since the register will be used in either
5251 case, we'd prefer it be used from the simpler giv. */
5252
5253 for (v = bl->giv; v; v = v->next_iv)
5254 if (! v->maybe_dead && v->same)
5255 v->same->maybe_dead = 0;
5256
5257 /* Try to eliminate the biv, if it is a candidate.
5258 This won't work if ! bl->all_reduced,
5259 since the givs we planned to use might not have been reduced.
5260
5261 We have to be careful that we didn't initially think we could
5262 eliminate this biv because of a giv that we now think may be
5263 dead and shouldn't be used as a biv replacement.
5264
5265 Also, there is the possibility that we may have a giv that looks
5266 like it can be used to eliminate a biv, but the resulting insn
5267 isn't valid. This can happen, for example, on the 88k, where a
5268 JUMP_INSN can compare a register only with zero. Attempts to
5269 replace it with a compare with a constant will fail.
5270
5271 Note that in cases where this call fails, we may have replaced some
5272 of the occurrences of the biv with a giv, but no harm was done in
5273 doing so in the rare cases where it can occur. */
5274
5275 if (bl->all_reduced == 1 && bl->eliminable
5276 && maybe_eliminate_biv (loop, bl, 1, threshold, insn_count))
5277 {
5278 /* ?? If we created a new test to bypass the loop entirely,
5279 or otherwise drop straight in, based on this test, then
5280 we might want to rewrite it also. This way some later
5281 pass has more hope of removing the initialization of this
5282 biv entirely. */
5283
5284 /* If final_value != 0, then the biv may be used after the loop ends
5285 and we must emit an insn to set it just in case.
5286
5287 Reversed bivs already have an insn after the loop setting their
5288 value, so we don't need another one. We can't calculate the
5289 proper final value for such a biv here anyway. */
5290 if (bl->final_value && ! bl->reversed)
5291 loop_insn_sink_or_swim (loop,
5292 gen_load_of_final_value (bl->biv->dest_reg,
5293 bl->final_value));
5294
5295 if (loop_dump_stream)
5296 fprintf (loop_dump_stream, "Reg %d: biv eliminated\n",
5297 bl->regno);
5298 }
5299 /* See above note wrt final_value. But since we couldn't eliminate
5300 the biv, we must set the value after the loop instead of before. */
5301 else if (bl->final_value && ! bl->reversed)
5302 loop_insn_sink (loop, gen_load_of_final_value (bl->biv->dest_reg,
5303 bl->final_value));
5304 }
5305
5306 /* Go through all the instructions in the loop, making all the
5307 register substitutions scheduled in REG_MAP. */
5308
5309 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
5310 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5311 || GET_CODE (p) == CALL_INSN)
5312 {
5313 replace_regs (PATTERN (p), reg_map, reg_map_size, 0);
5314 replace_regs (REG_NOTES (p), reg_map, reg_map_size, 0);
5315 INSN_CODE (p) = -1;
5316 }
5317
5318 if (loop_info->n_iterations > 0)
5319 {
5320 /* When we completely unroll a loop we will likely not need the increment
5321 of the loop BIV and we will not need the conditional branch at the
5322 end of the loop. */
5323 unrolled_insn_copies = insn_count - 2;
5324
5325 #ifdef HAVE_cc0
5326 /* When we completely unroll a loop on a HAVE_cc0 machine we will not
5327 need the comparison before the conditional branch at the end of the
5328 loop. */
5329 unrolled_insn_copies -= 1;
5330 #endif
5331
5332 /* We'll need one copy for each loop iteration. */
5333 unrolled_insn_copies *= loop_info->n_iterations;
5334
5335 /* A little slop to account for the ability to remove initialization
5336 code, better CSE, and other secondary benefits of completely
5337 unrolling some loops. */
5338 unrolled_insn_copies -= 1;
5339
5340 /* Clamp the value. */
5341 if (unrolled_insn_copies < 0)
5342 unrolled_insn_copies = 0;
5343 }
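/* A worked example of the size estimate computed above and compared
   against INSN_COUNT below (illustrative arithmetic only, ignoring the
   HAVE_cc0 adjustment): a 5-insn loop known to iterate twice gives
   (5 - 2) * 2 - 1 = 5 unrolled copies, which is not larger than the
   original 5 insns, so LOOP_AUTO_UNROLL would unroll it; a 10-insn loop
   iterating 4 times gives (10 - 2) * 4 - 1 = 31 copies and is unrolled
   only if LOOP_UNROLL was requested explicitly. */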
5344
5345 /* Unroll loops from within strength reduction so that we can use the
5346 induction variable information that strength_reduce has already
5347 collected. Always unroll loops that would be as small or smaller
5348 unrolled than when rolled. */
5349 if ((flags & LOOP_UNROLL)
5350 || ((flags & LOOP_AUTO_UNROLL)
5351 && loop_info->n_iterations > 0
5352 && unrolled_insn_copies <= insn_count))
5353 unroll_loop (loop, insn_count, 1);
5354
5355 #ifdef HAVE_doloop_end
5356 if (HAVE_doloop_end && (flags & LOOP_BCT) && flag_branch_on_count_reg)
5357 doloop_optimize (loop);
5358 #endif /* HAVE_doloop_end */
5359
5360 /* In case the number of iterations is known, drop a branch prediction note
5361 on the branch. Do that only in the second loop pass, as loop unrolling
5362 may change the number of iterations performed. */
5363 if (flags & LOOP_BCT)
5364 {
5365 unsigned HOST_WIDE_INT n
5366 = loop_info->n_iterations / loop_info->unroll_number;
5367 if (n > 1)
5368 predict_insn (prev_nonnote_insn (loop->end), PRED_LOOP_ITERATIONS,
5369 REG_BR_PROB_BASE - REG_BR_PROB_BASE / n);
5370 }
5371
5372 if (loop_dump_stream)
5373 fprintf (loop_dump_stream, "\n");
5374
5375 loop_ivs_free (loop);
5376 if (reg_map)
5377 free (reg_map);
5378 }
5379 \f
5380 /* Record all basic induction variables calculated in the insn. */
5381 static rtx
5382 check_insn_for_bivs (struct loop *loop, rtx p, int not_every_iteration,
5383 int maybe_multiple)
5384 {
5385 struct loop_ivs *ivs = LOOP_IVS (loop);
5386 rtx set;
5387 rtx dest_reg;
5388 rtx inc_val;
5389 rtx mult_val;
5390 rtx *location;
5391
5392 if (GET_CODE (p) == INSN
5393 && (set = single_set (p))
5394 && GET_CODE (SET_DEST (set)) == REG)
5395 {
5396 dest_reg = SET_DEST (set);
5397 if (REGNO (dest_reg) < max_reg_before_loop
5398 && REGNO (dest_reg) >= FIRST_PSEUDO_REGISTER
5399 && REG_IV_TYPE (ivs, REGNO (dest_reg)) != NOT_BASIC_INDUCT)
5400 {
5401 if (basic_induction_var (loop, SET_SRC (set),
5402 GET_MODE (SET_SRC (set)),
5403 dest_reg, p, &inc_val, &mult_val,
5404 &location))
5405 {
5406 /* It is a possible basic induction variable.
5407 Create and initialize an induction structure for it. */
5408
5409 struct induction *v = xmalloc (sizeof (struct induction));
5410
5411 record_biv (loop, v, p, dest_reg, inc_val, mult_val, location,
5412 not_every_iteration, maybe_multiple);
5413 REG_IV_TYPE (ivs, REGNO (dest_reg)) = BASIC_INDUCT;
5414 }
5415 else if (REGNO (dest_reg) < ivs->n_regs)
5416 REG_IV_TYPE (ivs, REGNO (dest_reg)) = NOT_BASIC_INDUCT;
5417 }
5418 }
5419 return p;
5420 }
5421 \f
5422 /* Record all givs calculated in the insn.
5423 A register is a giv if: it is only set once, it is a function of a
5424 biv and a constant (or invariant), and it is not a biv. */
5425 static rtx
5426 check_insn_for_givs (struct loop *loop, rtx p, int not_every_iteration,
5427 int maybe_multiple)
5428 {
5429 struct loop_regs *regs = LOOP_REGS (loop);
5430
5431 rtx set;
5432 /* Look for a general induction variable in a register. */
5433 if (GET_CODE (p) == INSN
5434 && (set = single_set (p))
5435 && GET_CODE (SET_DEST (set)) == REG
5436 && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
5437 {
5438 rtx src_reg;
5439 rtx dest_reg;
5440 rtx add_val;
5441 rtx mult_val;
5442 rtx ext_val;
5443 int benefit;
5444 rtx regnote = 0;
5445 rtx last_consec_insn;
5446
5447 dest_reg = SET_DEST (set);
5448 if (REGNO (dest_reg) < FIRST_PSEUDO_REGISTER)
5449 return p;
5450
5451 if (/* SET_SRC is a giv. */
5452 (general_induction_var (loop, SET_SRC (set), &src_reg, &add_val,
5453 &mult_val, &ext_val, 0, &benefit, VOIDmode)
5454 /* Equivalent expression is a giv. */
5455 || ((regnote = find_reg_note (p, REG_EQUAL, NULL_RTX))
5456 && general_induction_var (loop, XEXP (regnote, 0), &src_reg,
5457 &add_val, &mult_val, &ext_val, 0,
5458 &benefit, VOIDmode)))
5459 /* Don't try to handle any regs made by loop optimization.
5460 We have nothing on them in regno_first_uid, etc. */
5461 && REGNO (dest_reg) < max_reg_before_loop
5462 /* Don't recognize a BASIC_INDUCT_VAR here. */
5463 && dest_reg != src_reg
5464 /* This must be the only place where the register is set. */
5465 && (regs->array[REGNO (dest_reg)].n_times_set == 1
5466 /* or all sets must be consecutive and make a giv. */
5467 || (benefit = consec_sets_giv (loop, benefit, p,
5468 src_reg, dest_reg,
5469 &add_val, &mult_val, &ext_val,
5470 &last_consec_insn))))
5471 {
5472 struct induction *v = xmalloc (sizeof (struct induction));
5473
5474 /* If this is a library call, increase benefit. */
5475 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
5476 benefit += libcall_benefit (p);
5477
5478 /* Skip the consecutive insns, if there are any. */
5479 if (regs->array[REGNO (dest_reg)].n_times_set != 1)
5480 p = last_consec_insn;
5481
5482 record_giv (loop, v, p, src_reg, dest_reg, mult_val, add_val,
5483 ext_val, benefit, DEST_REG, not_every_iteration,
5484 maybe_multiple, (rtx*) 0);
5485
5486 }
5487 }
5488
5489 /* Look for givs which are memory addresses. */
5490 if (GET_CODE (p) == INSN)
5491 find_mem_givs (loop, PATTERN (p), p, not_every_iteration,
5492 maybe_multiple);
5493
5494 /* Update the status of whether a giv can derive other givs. This can
5495 change when we pass a label or an insn that updates a biv. */
5496 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5497 || GET_CODE (p) == CODE_LABEL)
5498 update_giv_derive (loop, p);
5499 return p;
5500 }
5501 \f
5502 /* Return 1 if X is a valid source for an initial value (or as a value being
5503 compared against in an initial test).
5504
5505 X must be either a register or constant and must not be clobbered between
5506 the current insn and the start of the loop.
5507
5508 INSN is the insn containing X. */
5509
5510 static int
5511 valid_initial_value_p (rtx x, rtx insn, int call_seen, rtx loop_start)
5512 {
5513 if (CONSTANT_P (x))
5514 return 1;
5515
5516 /* Only consider pseudos we know about initialized in insns whose luids
5517 we know. */
5518 if (GET_CODE (x) != REG
5519 || REGNO (x) >= max_reg_before_loop)
5520 return 0;
5521
5522 /* Don't use a call-clobbered register across a call which clobbers it. On
5523 some machines, don't use any hard registers at all. */
5524 if (REGNO (x) < FIRST_PSEUDO_REGISTER
5525 && (SMALL_REGISTER_CLASSES
5526 || (call_used_regs[REGNO (x)] && call_seen)))
5527 return 0;
5528
5529 /* Don't use registers that have been clobbered before the start of the
5530 loop. */
5531 if (reg_set_between_p (x, insn, loop_start))
5532 return 0;
5533
5534 return 1;
5535 }
5536 \f
5537 /* Scan X for memory refs and check each memory address
5538 as a possible giv. INSN is the insn whose pattern X comes from.
5539 NOT_EVERY_ITERATION is 1 if the insn might not be executed during
5540 every loop iteration. MAYBE_MULTIPLE is 1 if the insn might be executed
5541 more than once in each loop iteration. */
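/* For instance (an assumed RTL shape, not quoted from a particular
   target), scanning the pattern of a load such as

	(set (reg:SI r)
	     (mem:SI (plus:SI (mult:SI (reg:SI i) (const_int 4))
			      (reg:SI base))))

   reaches the MEM, and if `i' is a biv and `base' is loop invariant the
   address is recorded as a DEST_ADDR giv whose location points at the
   MEM's address operand. */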
5542
5543 static void
5544 find_mem_givs (const struct loop *loop, rtx x, rtx insn,
5545 int not_every_iteration, int maybe_multiple)
5546 {
5547 int i, j;
5548 enum rtx_code code;
5549 const char *fmt;
5550
5551 if (x == 0)
5552 return;
5553
5554 code = GET_CODE (x);
5555 switch (code)
5556 {
5557 case REG:
5558 case CONST_INT:
5559 case CONST:
5560 case CONST_DOUBLE:
5561 case SYMBOL_REF:
5562 case LABEL_REF:
5563 case PC:
5564 case CC0:
5565 case ADDR_VEC:
5566 case ADDR_DIFF_VEC:
5567 case USE:
5568 case CLOBBER:
5569 return;
5570
5571 case MEM:
5572 {
5573 rtx src_reg;
5574 rtx add_val;
5575 rtx mult_val;
5576 rtx ext_val;
5577 int benefit;
5578
5579 /* This code used to disable creating GIVs with mult_val == 1 and
5580 add_val == 0. However, this leads to lost optimizations when
5581 it comes time to combine a set of related DEST_ADDR GIVs, since
5582 this one would not be seen. */
5583
5584 if (general_induction_var (loop, XEXP (x, 0), &src_reg, &add_val,
5585 &mult_val, &ext_val, 1, &benefit,
5586 GET_MODE (x)))
5587 {
5588 /* Found one; record it. */
5589 struct induction *v = xmalloc (sizeof (struct induction));
5590
5591 record_giv (loop, v, insn, src_reg, addr_placeholder, mult_val,
5592 add_val, ext_val, benefit, DEST_ADDR,
5593 not_every_iteration, maybe_multiple, &XEXP (x, 0));
5594
5595 v->mem = x;
5596 }
5597 }
5598 return;
5599
5600 default:
5601 break;
5602 }
5603
5604 /* Recursively scan the subexpressions for other mem refs. */
5605
5606 fmt = GET_RTX_FORMAT (code);
5607 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
5608 if (fmt[i] == 'e')
5609 find_mem_givs (loop, XEXP (x, i), insn, not_every_iteration,
5610 maybe_multiple);
5611 else if (fmt[i] == 'E')
5612 for (j = 0; j < XVECLEN (x, i); j++)
5613 find_mem_givs (loop, XVECEXP (x, i, j), insn, not_every_iteration,
5614 maybe_multiple);
5615 }
5616 \f
5617 /* Fill in the data about one biv update.
5618 V is the `struct induction' in which we record the biv. (It is
5619 allocated by the caller, with xmalloc.)
5620 INSN is the insn that sets it.
5621 DEST_REG is the biv's reg.
5622
5623 MULT_VAL is const1_rtx if the biv is being incremented here, in which case
5624 INC_VAL is the increment. Otherwise, MULT_VAL is const0_rtx and the biv is
5625 being set to INC_VAL.
5626
5627 NOT_EVERY_ITERATION is nonzero if this biv update is not known to be
5628 executed every iteration; MAYBE_MULTIPLE is nonzero if this biv update
5629 can be executed more than once per iteration. If MAYBE_MULTIPLE
5630 and NOT_EVERY_ITERATION are both zero, we know that the biv update is
5631 executed exactly once per iteration. */
5632
5633 static void
5634 record_biv (struct loop *loop, struct induction *v, rtx insn, rtx dest_reg,
5635 rtx inc_val, rtx mult_val, rtx *location,
5636 int not_every_iteration, int maybe_multiple)
5637 {
5638 struct loop_ivs *ivs = LOOP_IVS (loop);
5639 struct iv_class *bl;
5640
5641 v->insn = insn;
5642 v->src_reg = dest_reg;
5643 v->dest_reg = dest_reg;
5644 v->mult_val = mult_val;
5645 v->add_val = inc_val;
5646 v->ext_dependent = NULL_RTX;
5647 v->location = location;
5648 v->mode = GET_MODE (dest_reg);
5649 v->always_computable = ! not_every_iteration;
5650 v->always_executed = ! not_every_iteration;
5651 v->maybe_multiple = maybe_multiple;
5652 v->same = 0;
5653
5654 /* Add this to the reg's iv_class, creating a class
5655 if this is the first incrementation of the reg. */
5656
5657 bl = REG_IV_CLASS (ivs, REGNO (dest_reg));
5658 if (bl == 0)
5659 {
5660 /* Create and initialize new iv_class. */
5661
5662 bl = xmalloc (sizeof (struct iv_class));
5663
5664 bl->regno = REGNO (dest_reg);
5665 bl->biv = 0;
5666 bl->giv = 0;
5667 bl->biv_count = 0;
5668 bl->giv_count = 0;
5669
5670 /* Set initial value to the reg itself. */
5671 bl->initial_value = dest_reg;
5672 bl->final_value = 0;
5673 /* We haven't seen the initializing insn yet. */
5674 bl->init_insn = 0;
5675 bl->init_set = 0;
5676 bl->initial_test = 0;
5677 bl->incremented = 0;
5678 bl->eliminable = 0;
5679 bl->nonneg = 0;
5680 bl->reversed = 0;
5681 bl->total_benefit = 0;
5682
5683 /* Add this class to ivs->list. */
5684 bl->next = ivs->list;
5685 ivs->list = bl;
5686
5687 /* Put it in the array of biv register classes. */
5688 REG_IV_CLASS (ivs, REGNO (dest_reg)) = bl;
5689 }
5690 else
5691 {
5692 /* Check if location is the same as a previous one. */
5693 struct induction *induction;
5694 for (induction = bl->biv; induction; induction = induction->next_iv)
5695 if (location == induction->location)
5696 {
5697 v->same = induction;
5698 break;
5699 }
5700 }
5701
5702 /* Update IV_CLASS entry for this biv. */
5703 v->next_iv = bl->biv;
5704 bl->biv = v;
5705 bl->biv_count++;
5706 if (mult_val == const1_rtx)
5707 bl->incremented = 1;
5708
5709 if (loop_dump_stream)
5710 loop_biv_dump (v, loop_dump_stream, 0);
5711 }
5712 \f
5713 /* Fill in the data about one giv.
5714 V is the `struct induction' in which we record the giv. (It is
5715 allocated by the caller, with xmalloc.)
5716 INSN is the insn that sets it.
5717 BENEFIT estimates the savings from deleting this insn.
5718 TYPE is DEST_REG or DEST_ADDR; it says whether the giv is computed
5719 into a register or is used as a memory address.
5720
5721 SRC_REG is the biv reg which the giv is computed from.
5722 DEST_REG is the giv's reg (if the giv is stored in a reg).
5723 MULT_VAL and ADD_VAL are the coefficients used to compute the giv.
5724 LOCATION points to the place where this giv's value appears in INSN. */
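/* Illustrative notes, not from the original commentary: for a DEST_REG
   giv set by an insn computing `r = i * 4 + 16' from a biv `i', MULT_VAL
   is (const_int 4), ADD_VAL is (const_int 16) and LOCATION is 0 (see
   check_insn_for_givs); for a DEST_ADDR giv found by find_mem_givs, the
   giv is the address inside a MEM and LOCATION points at that address
   within INSN's pattern. */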
5725
5726 static void
5727 record_giv (const struct loop *loop, struct induction *v, rtx insn,
5728 rtx src_reg, rtx dest_reg, rtx mult_val, rtx add_val,
5729 rtx ext_val, int benefit, enum g_types type,
5730 int not_every_iteration, int maybe_multiple, rtx *location)
5731 {
5732 struct loop_ivs *ivs = LOOP_IVS (loop);
5733 struct induction *b;
5734 struct iv_class *bl;
5735 rtx set = single_set (insn);
5736 rtx temp;
5737
5738 /* Attempt to prove constantness of the values. Don't let simplify_rtx
5739 undo the MULT canonicalization that we performed earlier. */
5740 temp = simplify_rtx (add_val);
5741 if (temp
5742 && ! (GET_CODE (add_val) == MULT
5743 && GET_CODE (temp) == ASHIFT))
5744 add_val = temp;
5745
5746 v->insn = insn;
5747 v->src_reg = src_reg;
5748 v->giv_type = type;
5749 v->dest_reg = dest_reg;
5750 v->mult_val = mult_val;
5751 v->add_val = add_val;
5752 v->ext_dependent = ext_val;
5753 v->benefit = benefit;
5754 v->location = location;
5755 v->cant_derive = 0;
5756 v->combined_with = 0;
5757 v->maybe_multiple = maybe_multiple;
5758 v->maybe_dead = 0;
5759 v->derive_adjustment = 0;
5760 v->same = 0;
5761 v->ignore = 0;
5762 v->new_reg = 0;
5763 v->final_value = 0;
5764 v->same_insn = 0;
5765 v->auto_inc_opt = 0;
5766 v->unrolled = 0;
5767 v->shared = 0;
5768
5769 /* The v->always_computable field is used in update_giv_derive, to
5770 determine whether a giv can be used to derive another giv. For a
5771 DEST_REG giv, INSN computes a new value for the giv, so its value
5772 isn't computable if INSN isn't executed every iteration.
5773 However, for a DEST_ADDR giv, INSN merely uses the value of the giv;
5774 it does not compute a new value. Hence the value is always computable
5775 regardless of whether INSN is executed each iteration. */
5776
5777 if (type == DEST_ADDR)
5778 v->always_computable = 1;
5779 else
5780 v->always_computable = ! not_every_iteration;
5781
5782 v->always_executed = ! not_every_iteration;
5783
5784 if (type == DEST_ADDR)
5785 {
5786 v->mode = GET_MODE (*location);
5787 v->lifetime = 1;
5788 }
5789 else /* type == DEST_REG */
5790 {
5791 v->mode = GET_MODE (SET_DEST (set));
5792
5793 v->lifetime = LOOP_REG_LIFETIME (loop, REGNO (dest_reg));
5794
5795 /* If the lifetime is zero, it means that this register is
5796 really a dead store. So mark this as a giv that can be
5797 ignored. This will not prevent the biv from being eliminated. */
5798 if (v->lifetime == 0)
5799 v->ignore = 1;
5800
5801 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
5802 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
5803 }
5804
5805 /* Add the giv to the class of givs computed from one biv. */
5806
5807 bl = REG_IV_CLASS (ivs, REGNO (src_reg));
5808 if (bl)
5809 {
5810 v->next_iv = bl->giv;
5811 bl->giv = v;
5812 /* Don't count DEST_ADDR. This is supposed to count the number of
5813 insns that calculate givs. */
5814 if (type == DEST_REG)
5815 bl->giv_count++;
5816 bl->total_benefit += benefit;
5817 }
5818 else
5819 /* Fatal error, biv missing for this giv? */
5820 abort ();
5821
5822 if (type == DEST_ADDR)
5823 {
5824 v->replaceable = 1;
5825 v->not_replaceable = 0;
5826 }
5827 else
5828 {
5829 /* The giv can be replaced outright by the reduced register only if all
5830 of the following conditions are true:
5831 - the insn that sets the giv is always executed on any iteration
5832 on which the giv is used at all
5833 (there are two ways to deduce this:
5834 either the insn is executed on every iteration,
5835 or all uses follow that insn in the same basic block),
5836 - the giv is not used outside the loop
5837 - no assignments to the biv occur during the giv's lifetime. */
5838
5839 if (REGNO_FIRST_UID (REGNO (dest_reg)) == INSN_UID (insn)
5840 /* Previous line always fails if INSN was moved by loop opt. */
5841 && REGNO_LAST_LUID (REGNO (dest_reg))
5842 < INSN_LUID (loop->end)
5843 && (! not_every_iteration
5844 || last_use_this_basic_block (dest_reg, insn)))
5845 {
5846 /* Now check that there are no assignments to the biv within the
5847 giv's lifetime. This requires two separate checks. */
5848
5849 /* Check each biv update, and fail if any are between the first
5850 and last use of the giv.
5851
5852 If this loop contains an inner loop that was unrolled, then
5853 the insn modifying the biv may have been emitted by the loop
5854 unrolling code, and hence does not have a valid luid. Just
5855 mark the giv as not replaceable in this case. The register is not
5856 very useful as a biv, because it is used in two different loops.
5857 It is very unlikely that we would be able to optimize the giv
5858 using this biv anyway. */
5859
5860 v->replaceable = 1;
5861 v->not_replaceable = 0;
5862 for (b = bl->biv; b; b = b->next_iv)
5863 {
5864 if (INSN_UID (b->insn) >= max_uid_for_loop
5865 || ((INSN_LUID (b->insn)
5866 >= REGNO_FIRST_LUID (REGNO (dest_reg)))
5867 && (INSN_LUID (b->insn)
5868 <= REGNO_LAST_LUID (REGNO (dest_reg)))))
5869 {
5870 v->replaceable = 0;
5871 v->not_replaceable = 1;
5872 break;
5873 }
5874 }
5875
5876 /* If there are any backwards branches that go from after the
5877 biv update to before it, then this giv is not replaceable. */
5878 if (v->replaceable)
5879 for (b = bl->biv; b; b = b->next_iv)
5880 if (back_branch_in_range_p (loop, b->insn))
5881 {
5882 v->replaceable = 0;
5883 v->not_replaceable = 1;
5884 break;
5885 }
5886 }
5887 else
5888 {
5889 /* May still be replaceable; we don't have enough info here to
5890 decide. */
5891 v->replaceable = 0;
5892 v->not_replaceable = 0;
5893 }
5894 }
5895
5896 /* Record whether the add_val contains a const_int, for later use by
5897 combine_givs. */
5898 {
5899 rtx tem = add_val;
5900
5901 v->no_const_addval = 1;
5902 if (tem == const0_rtx)
5903 ;
5904 else if (CONSTANT_P (add_val))
5905 v->no_const_addval = 0;
5906 if (GET_CODE (tem) == PLUS)
5907 {
5908 while (1)
5909 {
5910 if (GET_CODE (XEXP (tem, 0)) == PLUS)
5911 tem = XEXP (tem, 0);
5912 else if (GET_CODE (XEXP (tem, 1)) == PLUS)
5913 tem = XEXP (tem, 1);
5914 else
5915 break;
5916 }
5917 if (CONSTANT_P (XEXP (tem, 1)))
5918 v->no_const_addval = 0;
5919 }
5920 }
5921
5922 if (loop_dump_stream)
5923 loop_giv_dump (v, loop_dump_stream, 0);
5924 }
5925
5926 /* All this does is determine whether a giv can be made replaceable because
5927 its final value can be calculated. This code cannot be part of record_giv
5928 above, because final_giv_value requires that the number of loop iterations
5929 be known, and that cannot be accurately calculated until after all givs
5930 have been identified. */
5931
5932 static void
5933 check_final_value (const struct loop *loop, struct induction *v)
5934 {
5935 rtx final_value = 0;
5936
5937 /* DEST_ADDR givs will never reach here, because they are always marked
5938 replaceable above in record_giv. */
5939
5940 /* The giv can be replaced outright by the reduced register only if all
5941 of the following conditions are true:
5942 - the insn that sets the giv is always executed on any iteration
5943 on which the giv is used at all
5944 (there are two ways to deduce this:
5945 either the insn is executed on every iteration,
5946 or all uses follow that insn in the same basic block),
5947 - its final value can be calculated (this condition is different
5948 from the one above in record_giv)
5949 - it is not used before it is set
5950 - no assignments to the biv occur during the giv's lifetime. */
5951
5952 #if 0
5953 /* This is only called now when replaceable is known to be false. */
5954 /* Clear replaceable, so that it won't confuse final_giv_value. */
5955 v->replaceable = 0;
5956 #endif
5957
5958 if ((final_value = final_giv_value (loop, v))
5959 && (v->always_executed
5960 || last_use_this_basic_block (v->dest_reg, v->insn)))
5961 {
5962 int biv_increment_seen = 0, before_giv_insn = 0;
5963 rtx p = v->insn;
5964 rtx last_giv_use;
5965
5966 v->replaceable = 1;
5967 v->not_replaceable = 0;
5968
5969 /* When trying to determine whether or not a biv increment occurs
5970 during the lifetime of the giv, we can ignore uses of the variable
5971 outside the loop because final_value is nonzero. Hence we cannot
5972 use regno_last_uid and regno_first_uid as above in record_giv. */
5973
5974 /* Search the loop to determine whether any assignments to the
5975 biv occur during the giv's lifetime. Start with the insn
5976 that sets the giv, and search around the loop until we come
5977 back to that insn again.
5978
5979 Also fail if there is a jump within the giv's lifetime that jumps
5980 to somewhere outside the lifetime but still within the loop. This
5981 catches spaghetti code where the execution order is not linear, and
5982 hence the above test fails. Here we assume that the giv lifetime
5983 does not extend from one iteration of the loop to the next, so as
5984 to make the test easier. Since the lifetime isn't known yet,
5985 this requires two loops. See also record_giv above. */
5986
5987 last_giv_use = v->insn;
5988
5989 while (1)
5990 {
5991 p = NEXT_INSN (p);
5992 if (p == loop->end)
5993 {
5994 before_giv_insn = 1;
5995 p = NEXT_INSN (loop->start);
5996 }
5997 if (p == v->insn)
5998 break;
5999
6000 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
6001 || GET_CODE (p) == CALL_INSN)
6002 {
6003 /* It is possible for the BIV increment to use the GIV if we
6004 have a cycle. Thus we must be sure to check each insn for
6005 both BIV and GIV uses, and we must check for BIV uses
6006 first. */
6007
6008 if (! biv_increment_seen
6009 && reg_set_p (v->src_reg, PATTERN (p)))
6010 biv_increment_seen = 1;
6011
6012 if (reg_mentioned_p (v->dest_reg, PATTERN (p)))
6013 {
6014 if (biv_increment_seen || before_giv_insn)
6015 {
6016 v->replaceable = 0;
6017 v->not_replaceable = 1;
6018 break;
6019 }
6020 last_giv_use = p;
6021 }
6022 }
6023 }
6024
6025 /* Now that the lifetime of the giv is known, check for branches
6026 from within the lifetime to outside the lifetime if it is still
6027 replaceable. */
6028
6029 if (v->replaceable)
6030 {
6031 p = v->insn;
6032 while (1)
6033 {
6034 p = NEXT_INSN (p);
6035 if (p == loop->end)
6036 p = NEXT_INSN (loop->start);
6037 if (p == last_giv_use)
6038 break;
6039
6040 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
6041 && LABEL_NAME (JUMP_LABEL (p))
6042 && ((loop_insn_first_p (JUMP_LABEL (p), v->insn)
6043 && loop_insn_first_p (loop->start, JUMP_LABEL (p)))
6044 || (loop_insn_first_p (last_giv_use, JUMP_LABEL (p))
6045 && loop_insn_first_p (JUMP_LABEL (p), loop->end))))
6046 {
6047 v->replaceable = 0;
6048 v->not_replaceable = 1;
6049
6050 if (loop_dump_stream)
6051 fprintf (loop_dump_stream,
6052 "Found branch outside giv lifetime.\n");
6053
6054 break;
6055 }
6056 }
6057 }
6058
6059 /* If it is replaceable, then save the final value. */
6060 if (v->replaceable)
6061 v->final_value = final_value;
6062 }
6063
6064 if (loop_dump_stream && v->replaceable)
6065 fprintf (loop_dump_stream, "Insn %d: giv reg %d final_value replaceable\n",
6066 INSN_UID (v->insn), REGNO (v->dest_reg));
6067 }
6068 \f
6069 /* Update the status of whether a giv can derive other givs.
6070
6071 We need to do something special if there is or may be an update to the biv
6072 between the time the giv is defined and the time it is used to derive
6073 another giv.
6074
6075 In addition, a giv that is only conditionally set is not allowed to
6076 derive another giv once a label has been passed.
6077
6078 The cases we look at are when a label or an update to a biv is passed. */
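/* A sketch of the compensation case handled below (not from the original
   commentary): if a giv G was recorded as `G = 4 * B' and the biv B is
   then incremented by 1 before G is used to derive another giv, the
   product biv->add_val * giv->mult_val -- here (const_int 4) -- is
   accumulated in derive_adjustment so that any giv later derived from G
   can be corrected for the intervening biv increment. */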
6079
6080 static void
6081 update_giv_derive (const struct loop *loop, rtx p)
6082 {
6083 struct loop_ivs *ivs = LOOP_IVS (loop);
6084 struct iv_class *bl;
6085 struct induction *biv, *giv;
6086 rtx tem;
6087 int dummy;
6088
6089 /* Search all IV classes, then all bivs, and finally all givs.
6090
6091 There are three cases we are concerned with. First we have the situation
6092 of a giv that is only updated conditionally. In that case, it may not
6093 derive any givs after a label is passed.
6094
6095 The second case is when a biv update occurs, or may occur, after the
6096 definition of a giv. For certain biv updates (see below) that are
6097 known to occur between the giv definition and use, we can adjust the
6098 giv definition. For others, or when the biv update is conditional,
6099 we must prevent the giv from deriving any other givs. There are two
6100 sub-cases within this case.
6101
6102 If this is a label, we are concerned with any biv update that is done
6103 conditionally, since it may be done after the giv is defined followed by
6104 a branch here (actually, we need to pass both a jump and a label, but
6105 this extra tracking doesn't seem worth it).
6106
6107 If this is a jump, we are concerned about any biv update that may be
6108 executed multiple times. We are actually only concerned about
6109 backward jumps, but it is probably not worth performing the test
6110 on the jump again here.
6111
6112 If this is a biv update, we must adjust the giv status to show that a
6113 subsequent biv update was performed. If this adjustment cannot be done,
6114 the giv cannot derive further givs. */
6115
6116 for (bl = ivs->list; bl; bl = bl->next)
6117 for (biv = bl->biv; biv; biv = biv->next_iv)
6118 if (GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN
6119 || biv->insn == p)
6120 {
6121 /* Skip if location is the same as a previous one. */
6122 if (biv->same)
6123 continue;
6124
6125 for (giv = bl->giv; giv; giv = giv->next_iv)
6126 {
6127 /* If cant_derive is already true, there is no point in
6128 checking all of these conditions again. */
6129 if (giv->cant_derive)
6130 continue;
6131
6132 /* If this giv is conditionally set and we have passed a label,
6133 it cannot derive anything. */
6134 if (GET_CODE (p) == CODE_LABEL && ! giv->always_computable)
6135 giv->cant_derive = 1;
6136
6137 /* Skip givs that have mult_val == 0, since
6138 they are really invariants. Also skip those that are
6139 replaceable, since we know their lifetime doesn't contain
6140 any biv update. */
6141 else if (giv->mult_val == const0_rtx || giv->replaceable)
6142 continue;
6143
6144 /* The only way we can allow this giv to derive another
6145 is if this is a biv increment and we can form the product
6146 of biv->add_val and giv->mult_val. In this case, we will
6147 be able to compute a compensation. */
6148 else if (biv->insn == p)
6149 {
6150 rtx ext_val_dummy;
6151
6152 tem = 0;
6153 if (biv->mult_val == const1_rtx)
6154 tem = simplify_giv_expr (loop,
6155 gen_rtx_MULT (giv->mode,
6156 biv->add_val,
6157 giv->mult_val),
6158 &ext_val_dummy, &dummy);
6159
6160 if (tem && giv->derive_adjustment)
6161 tem = simplify_giv_expr
6162 (loop,
6163 gen_rtx_PLUS (giv->mode, tem, giv->derive_adjustment),
6164 &ext_val_dummy, &dummy);
6165
6166 if (tem)
6167 giv->derive_adjustment = tem;
6168 else
6169 giv->cant_derive = 1;
6170 }
6171 else if ((GET_CODE (p) == CODE_LABEL && ! biv->always_computable)
6172 || (GET_CODE (p) == JUMP_INSN && biv->maybe_multiple))
6173 giv->cant_derive = 1;
6174 }
6175 }
6176 }
6177 \f
6178 /* Check whether an insn is an increment legitimate for a basic induction var.
6179 X is the source of insn P, or a part of it.
6180 MODE is the mode in which X should be interpreted.
6181
6182 DEST_REG is the putative biv, also the destination of the insn.
6183 We accept patterns of these forms:
6184 REG = REG + INVARIANT (includes REG = REG - CONSTANT)
6185 REG = INVARIANT + REG
6186
6187 If X is suitable, we return 1, set *MULT_VAL to CONST1_RTX,
6188 store the additive term into *INC_VAL, and store the place where
6189 we found the additive term into *LOCATION.
6190
6191 If X is an assignment of an invariant into DEST_REG, we set
6192 *MULT_VAL to CONST0_RTX, and store the invariant into *INC_VAL.
6193
6194 We also want to detect a BIV when it corresponds to a variable
6195 whose mode was promoted. In that case, an increment
6196 of the variable may be a PLUS that adds a SUBREG of that variable to
6197 an invariant and then sign- or zero-extends the result of the PLUS
6198 into the variable.
6199
6200 Most GIVs in such cases will be in the promoted mode, since that is
6201 probably the natural computation mode (and almost certainly the mode
6202 used for addresses) on the machine. So we view the pseudo-reg containing
6203 the variable as the BIV, as if it were simply incremented.
6204
6205 Note that treating the entire pseudo as a BIV will result in making
6206 simple increments to any GIVs based on it. However, if the variable
6207 overflows in its declared mode but not its promoted mode, the result will
6208 be incorrect. This is acceptable if the variable is signed, since
6209 overflows in such cases are undefined, but not if it is unsigned, since
6210 those overflows are defined. So we only check for SIGN_EXTEND and
6211 not ZERO_EXTEND.
6212
6213 If we cannot find a biv, we return 0. */
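/* Illustrative RTL shapes (assumed for this example, not quoted from a
   particular target): a plain biv increment such as

	(set (reg:SI i) (plus:SI (reg:SI i) (const_int 4)))

   yields *MULT_VAL == const1_rtx, *INC_VAL == (const_int 4) and
   *LOCATION pointing at the (const_int 4) operand, while an assignment
   of a loop invariant, e.g. (set (reg:SI i) (reg:SI n)) in the innermost
   loop, yields *MULT_VAL == const0_rtx and *INC_VAL == (reg:SI n). */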
6214
6215 static int
6216 basic_induction_var (const struct loop *loop, rtx x, enum machine_mode mode,
6217 rtx dest_reg, rtx p, rtx *inc_val, rtx *mult_val,
6218 rtx **location)
6219 {
6220 enum rtx_code code;
6221 rtx *argp, arg;
6222 rtx insn, set = 0, last, inc;
6223
6224 code = GET_CODE (x);
6225 *location = NULL;
6226 switch (code)
6227 {
6228 case PLUS:
6229 if (rtx_equal_p (XEXP (x, 0), dest_reg)
6230 || (GET_CODE (XEXP (x, 0)) == SUBREG
6231 && SUBREG_PROMOTED_VAR_P (XEXP (x, 0))
6232 && SUBREG_REG (XEXP (x, 0)) == dest_reg))
6233 {
6234 argp = &XEXP (x, 1);
6235 }
6236 else if (rtx_equal_p (XEXP (x, 1), dest_reg)
6237 || (GET_CODE (XEXP (x, 1)) == SUBREG
6238 && SUBREG_PROMOTED_VAR_P (XEXP (x, 1))
6239 && SUBREG_REG (XEXP (x, 1)) == dest_reg))
6240 {
6241 argp = &XEXP (x, 0);
6242 }
6243 else
6244 return 0;
6245
6246 arg = *argp;
6247 if (loop_invariant_p (loop, arg) != 1)
6248 return 0;
6249
6250 /* convert_modes can emit new instructions, e.g. when arg is a loop
6251 invariant MEM and dest_reg has a different mode.
6252 These instructions would be emitted after the end of the function
6253 and then *inc_val would be an uninitialized pseudo.
6254 Detect this and bail in this case.
6255 Other ways to solve this would be to introduce a convert_modes
6256 variant which is allowed to fail but not allowed to emit new
6257 instructions, to emit these instructions before the loop start and
6258 let them be garbage collected if *inc_val is never used, or to save
6259 the *inc_val initialization sequence generated here and emit it at
6260 some suitable place once *inc_val is actually used. */
6261 last = get_last_insn ();
6262 inc = convert_modes (GET_MODE (dest_reg), GET_MODE (x), arg, 0);
6263 if (get_last_insn () != last)
6264 {
6265 delete_insns_since (last);
6266 return 0;
6267 }
6268
6269 *inc_val = inc;
6270 *mult_val = const1_rtx;
6271 *location = argp;
6272 return 1;
6273
6274 case SUBREG:
6275 /* If what's inside the SUBREG is a BIV, then so is the SUBREG. This will
6276 handle addition of promoted variables.
6277 ??? The comment at the start of this function is wrong: promoted
6278 variable increments don't look like it says they do. */
6279 return basic_induction_var (loop, SUBREG_REG (x),
6280 GET_MODE (SUBREG_REG (x)),
6281 dest_reg, p, inc_val, mult_val, location);
6282
6283 case REG:
6284 /* If this register is assigned in a previous insn, look at its
6285 source, but don't go outside the loop or past a label. */
6286
6287 /* If this sets a register to itself, we would repeat any previous
6288 biv increment if we applied this strategy blindly. */
6289 if (rtx_equal_p (dest_reg, x))
6290 return 0;
6291
6292 insn = p;
6293 while (1)
6294 {
6295 rtx dest;
6296 do
6297 {
6298 insn = PREV_INSN (insn);
6299 }
6300 while (insn && GET_CODE (insn) == NOTE
6301 && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6302
6303 if (!insn)
6304 break;
6305 set = single_set (insn);
6306 if (set == 0)
6307 break;
6308 dest = SET_DEST (set);
6309 if (dest == x
6310 || (GET_CODE (dest) == SUBREG
6311 && (GET_MODE_SIZE (GET_MODE (dest)) <= UNITS_PER_WORD)
6312 && (GET_MODE_CLASS (GET_MODE (dest)) == MODE_INT)
6313 && SUBREG_REG (dest) == x))
6314 return basic_induction_var (loop, SET_SRC (set),
6315 (GET_MODE (SET_SRC (set)) == VOIDmode
6316 ? GET_MODE (x)
6317 : GET_MODE (SET_SRC (set))),
6318 dest_reg, insn,
6319 inc_val, mult_val, location);
6320
6321 while (GET_CODE (dest) == SIGN_EXTRACT
6322 || GET_CODE (dest) == ZERO_EXTRACT
6323 || GET_CODE (dest) == SUBREG
6324 || GET_CODE (dest) == STRICT_LOW_PART)
6325 dest = XEXP (dest, 0);
6326 if (dest == x)
6327 break;
6328 }
6329 /* Fall through. */
6330
6331 /* We can accept a constant setting of a biv only when inside the innermost loop.
6332 Otherwise, a biv of an inner loop may be incorrectly recognized
6333 as a biv of the outer loop,
6334 causing code to be moved INTO the inner loop. */
6335 case MEM:
6336 if (loop_invariant_p (loop, x) != 1)
6337 return 0;
6338 case CONST_INT:
6339 case SYMBOL_REF:
6340 case CONST:
6341 /* convert_modes aborts if we try to convert to or from CCmode, so just
6342 exclude that case. It is very unlikely that a condition code value
6343 would be a useful iterator anyway. convert_modes aborts if we try to
6344 convert a float mode to non-float or vice versa too. */
6345 if (loop->level == 1
6346 && GET_MODE_CLASS (mode) == GET_MODE_CLASS (GET_MODE (dest_reg))
6347 && GET_MODE_CLASS (mode) != MODE_CC)
6348 {
6349 /* Possible bug here? Perhaps we don't know the mode of X. */
6350 last = get_last_insn ();
6351 inc = convert_modes (GET_MODE (dest_reg), mode, x, 0);
6352 if (get_last_insn () != last)
6353 {
6354 delete_insns_since (last);
6355 return 0;
6356 }
6357
6358 *inc_val = inc;
6359 *mult_val = const0_rtx;
6360 return 1;
6361 }
6362 else
6363 return 0;
6364
6365 case SIGN_EXTEND:
6366 /* Ignore this BIV if signed arithmetic overflow is defined. */
6367 if (flag_wrapv)
6368 return 0;
6369 return basic_induction_var (loop, XEXP (x, 0), GET_MODE (XEXP (x, 0)),
6370 dest_reg, p, inc_val, mult_val, location);
6371
6372 case ASHIFTRT:
6373 /* Similar, since this can be a sign extension. */
6374 for (insn = PREV_INSN (p);
6375 (insn && GET_CODE (insn) == NOTE
6376 && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6377 insn = PREV_INSN (insn))
6378 ;
6379
6380 if (insn)
6381 set = single_set (insn);
6382
6383 if (! rtx_equal_p (dest_reg, XEXP (x, 0))
6384 && set && SET_DEST (set) == XEXP (x, 0)
6385 && GET_CODE (XEXP (x, 1)) == CONST_INT
6386 && INTVAL (XEXP (x, 1)) >= 0
6387 && GET_CODE (SET_SRC (set)) == ASHIFT
6388 && XEXP (x, 1) == XEXP (SET_SRC (set), 1))
6389 return basic_induction_var (loop, XEXP (SET_SRC (set), 0),
6390 GET_MODE (XEXP (x, 0)),
6391 dest_reg, insn, inc_val, mult_val,
6392 location);
6393 return 0;
6394
6395 default:
6396 return 0;
6397 }
6398 }
6399 \f
6400 /* A general induction variable (giv) is any quantity that is a linear
6401 function of a basic induction variable,
6402 i.e. giv = biv * mult_val + add_val.
6403 The coefficients can be any loop invariant quantity.
6404 A giv need not be computed directly from the biv;
6405 it can be computed by way of other givs. */
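/* For example (a source-level illustration, not from the original
   commentary), in

	for (i = 0; i < n; i++)
	  sum += a[i];

   the counter `i' is a biv, and the address computed for the reference
   `a[i]' -- roughly `a + i * sizeof (*a)' -- is a giv whose mult_val is
   sizeof (*a) and whose add_val is the invariant address `a'. */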
6406
6407 /* Determine whether X computes a giv.
6408 If it does, return a nonzero value
6409 which is the benefit from eliminating the computation of X;
6410 set *SRC_REG to the register of the biv that it is computed from;
6411 set *ADD_VAL and *MULT_VAL to the coefficients,
6412 such that the value of X is biv * mult + add; */
6413
6414 static int
6415 general_induction_var (const struct loop *loop, rtx x, rtx *src_reg,
6416 rtx *add_val, rtx *mult_val, rtx *ext_val,
6417 int is_addr, int *pbenefit,
6418 enum machine_mode addr_mode)
6419 {
6420 struct loop_ivs *ivs = LOOP_IVS (loop);
6421 rtx orig_x = x;
6422
6423 /* If this is an invariant, forget it, it isn't a giv. */
6424 if (loop_invariant_p (loop, x) == 1)
6425 return 0;
6426
6427 *pbenefit = 0;
6428 *ext_val = NULL_RTX;
6429 x = simplify_giv_expr (loop, x, ext_val, pbenefit);
6430 if (x == 0)
6431 return 0;
6432
6433 switch (GET_CODE (x))
6434 {
6435 case USE:
6436 case CONST_INT:
6437 /* Since this is now an invariant and wasn't before, it must be a giv
6438 with MULT_VAL == 0. It doesn't matter which BIV we associate this
6439 with. */
6440 *src_reg = ivs->list->biv->dest_reg;
6441 *mult_val = const0_rtx;
6442 *add_val = x;
6443 break;
6444
6445 case REG:
6446 /* This is equivalent to a BIV. */
6447 *src_reg = x;
6448 *mult_val = const1_rtx;
6449 *add_val = const0_rtx;
6450 break;
6451
6452 case PLUS:
6453 /* Either (plus (biv) (invar)) or
6454 (plus (mult (biv) (invar_1)) (invar_2)). */
6455 if (GET_CODE (XEXP (x, 0)) == MULT)
6456 {
6457 *src_reg = XEXP (XEXP (x, 0), 0);
6458 *mult_val = XEXP (XEXP (x, 0), 1);
6459 }
6460 else
6461 {
6462 *src_reg = XEXP (x, 0);
6463 *mult_val = const1_rtx;
6464 }
6465 *add_val = XEXP (x, 1);
6466 break;
6467
6468 case MULT:
6469 /* ADD_VAL is zero. */
6470 *src_reg = XEXP (x, 0);
6471 *mult_val = XEXP (x, 1);
6472 *add_val = const0_rtx;
6473 break;
6474
6475 default:
6476 abort ();
6477 }
6478
6479 /* Remove any enclosing USE from ADD_VAL and MULT_VAL (there will be
6480 one unless they are CONST_INT). */
6481 if (GET_CODE (*add_val) == USE)
6482 *add_val = XEXP (*add_val, 0);
6483 if (GET_CODE (*mult_val) == USE)
6484 *mult_val = XEXP (*mult_val, 0);
6485
6486 if (is_addr)
6487 *pbenefit += address_cost (orig_x, addr_mode) - reg_address_cost;
6488 else
6489 *pbenefit += rtx_cost (orig_x, SET);
6490
6491 /* Always return true if this is a giv so it will be detected as such,
6492 even if the benefit is zero or negative. This allows elimination
6493 of bivs that might otherwise not be eliminated. */
6494 return 1;
6495 }
6496 \f
6497 /* Given an expression, X, try to form it as a linear function of a biv.
6498 We will canonicalize it to be of the form
6499 (plus (mult (BIV) (invar_1))
6500 (invar_2))
6501 with possible degeneracies.
6502
6503 The invariant expressions must each be of a form that can be used as a
6504 machine operand. We surround them with a USE rtx (a hack, but localized
6505 and certainly unambiguous!) if not a CONST_INT for simplicity in this
6506 routine; it is the caller's responsibility to strip them.
6507
6508 If no such canonicalization is possible (i.e., two bivs are used or an
6509 expression that is neither invariant nor a biv nor a giv), this routine
6510 returns 0.
6511
6512 For a nonzero return, the result will have a code of CONST_INT, USE,
6513 REG (for a BIV), PLUS, or MULT. No other codes will occur.
6514
6515 *BENEFIT will be incremented by the benefit of any sub-giv encountered. */
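/* A small worked example (illustrative only): if B is a biv, the
   expression `B * 4 - 1', i.e.
   (minus (mult (reg B) (const_int 4)) (const_int 1)), is rewritten by
   the MINUS case below as B*4 + 1*(-1) and then canonicalized to

	(plus (mult (reg B) (const_int 4)) (const_int -1))

   which matches the form documented above. */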
6516
6517 static rtx sge_plus (enum machine_mode, rtx, rtx);
6518 static rtx sge_plus_constant (rtx, rtx);
6519
6520 static rtx
6521 simplify_giv_expr (const struct loop *loop, rtx x, rtx *ext_val, int *benefit)
6522 {
6523 struct loop_ivs *ivs = LOOP_IVS (loop);
6524 struct loop_regs *regs = LOOP_REGS (loop);
6525 enum machine_mode mode = GET_MODE (x);
6526 rtx arg0, arg1;
6527 rtx tem;
6528
6529 /* If this is not an integer mode, or if we cannot do arithmetic in this
6530 mode, this can't be a giv. */
6531 if (mode != VOIDmode
6532 && (GET_MODE_CLASS (mode) != MODE_INT
6533 || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT))
6534 return NULL_RTX;
6535
6536 switch (GET_CODE (x))
6537 {
6538 case PLUS:
6539 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6540 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6541 if (arg0 == 0 || arg1 == 0)
6542 return NULL_RTX;
6543
6544 /* Put constant last, CONST_INT last if both constant. */
6545 if ((GET_CODE (arg0) == USE
6546 || GET_CODE (arg0) == CONST_INT)
6547 && ! ((GET_CODE (arg0) == USE
6548 && GET_CODE (arg1) == USE)
6549 || GET_CODE (arg1) == CONST_INT))
6550 tem = arg0, arg0 = arg1, arg1 = tem;
6551
6552 /* Handle addition of zero, then addition of an invariant. */
6553 if (arg1 == const0_rtx)
6554 return arg0;
6555 else if (GET_CODE (arg1) == CONST_INT || GET_CODE (arg1) == USE)
6556 switch (GET_CODE (arg0))
6557 {
6558 case CONST_INT:
6559 case USE:
6560 /* Adding two invariants must result in an invariant, so enclose
6561 addition operation inside a USE and return it. */
6562 if (GET_CODE (arg0) == USE)
6563 arg0 = XEXP (arg0, 0);
6564 if (GET_CODE (arg1) == USE)
6565 arg1 = XEXP (arg1, 0);
6566
6567 if (GET_CODE (arg0) == CONST_INT)
6568 tem = arg0, arg0 = arg1, arg1 = tem;
6569 if (GET_CODE (arg1) == CONST_INT)
6570 tem = sge_plus_constant (arg0, arg1);
6571 else
6572 tem = sge_plus (mode, arg0, arg1);
6573
6574 if (GET_CODE (tem) != CONST_INT)
6575 tem = gen_rtx_USE (mode, tem);
6576 return tem;
6577
6578 case REG:
6579 case MULT:
6580 /* biv + invar or mult + invar. Return sum. */
6581 return gen_rtx_PLUS (mode, arg0, arg1);
6582
6583 case PLUS:
6584 /* (a + invar_1) + invar_2. Associate. */
6585 return
6586 simplify_giv_expr (loop,
6587 gen_rtx_PLUS (mode,
6588 XEXP (arg0, 0),
6589 gen_rtx_PLUS (mode,
6590 XEXP (arg0, 1),
6591 arg1)),
6592 ext_val, benefit);
6593
6594 default:
6595 abort ();
6596 }
6597
6598 /* Each argument must be either REG, PLUS, or MULT. Convert REG to
6599 MULT to reduce cases. */
6600 if (GET_CODE (arg0) == REG)
6601 arg0 = gen_rtx_MULT (mode, arg0, const1_rtx);
6602 if (GET_CODE (arg1) == REG)
6603 arg1 = gen_rtx_MULT (mode, arg1, const1_rtx);
6604
6605 /* Now have PLUS + PLUS, PLUS + MULT, MULT + PLUS, or MULT + MULT.
6606 Put a MULT first, leaving PLUS + PLUS, MULT + PLUS, or MULT + MULT.
6607 Recurse to associate the second PLUS. */
6608 if (GET_CODE (arg1) == MULT)
6609 tem = arg0, arg0 = arg1, arg1 = tem;
6610
6611 if (GET_CODE (arg1) == PLUS)
6612 return
6613 simplify_giv_expr (loop,
6614 gen_rtx_PLUS (mode,
6615 gen_rtx_PLUS (mode, arg0,
6616 XEXP (arg1, 0)),
6617 XEXP (arg1, 1)),
6618 ext_val, benefit);
6619
6620 /* Now must have MULT + MULT. Distribute if same biv, else not giv. */
6621 if (GET_CODE (arg0) != MULT || GET_CODE (arg1) != MULT)
6622 return NULL_RTX;
6623
6624 if (!rtx_equal_p (arg0, arg1))
6625 return NULL_RTX;
6626
6627 return simplify_giv_expr (loop,
6628 gen_rtx_MULT (mode,
6629 XEXP (arg0, 0),
6630 gen_rtx_PLUS (mode,
6631 XEXP (arg0, 1),
6632 XEXP (arg1, 1))),
6633 ext_val, benefit);
6634
6635 case MINUS:
6636 /* Handle "a - b" as "a + b * (-1)". */
6637 return simplify_giv_expr (loop,
6638 gen_rtx_PLUS (mode,
6639 XEXP (x, 0),
6640 gen_rtx_MULT (mode,
6641 XEXP (x, 1),
6642 constm1_rtx)),
6643 ext_val, benefit);
6644
6645 case MULT:
6646 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6647 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6648 if (arg0 == 0 || arg1 == 0)
6649 return NULL_RTX;
6650
6651 /* Put constant last, CONST_INT last if both constant. */
6652 if ((GET_CODE (arg0) == USE || GET_CODE (arg0) == CONST_INT)
6653 && GET_CODE (arg1) != CONST_INT)
6654 tem = arg0, arg0 = arg1, arg1 = tem;
6655
6656 /* If second argument is not now constant, not giv. */
6657 if (GET_CODE (arg1) != USE && GET_CODE (arg1) != CONST_INT)
6658 return NULL_RTX;
6659
6660 /* Handle multiply by 0 or 1. */
6661 if (arg1 == const0_rtx)
6662 return const0_rtx;
6663
6664 else if (arg1 == const1_rtx)
6665 return arg0;
6666
6667 switch (GET_CODE (arg0))
6668 {
6669 case REG:
6670 /* biv * invar. Done. */
6671 return gen_rtx_MULT (mode, arg0, arg1);
6672
6673 case CONST_INT:
6674 /* Product of two constants. */
6675 return GEN_INT (INTVAL (arg0) * INTVAL (arg1));
6676
6677 case USE:
6678 /* invar * invar is a giv, but attempt to simplify it somehow. */
6679 if (GET_CODE (arg1) != CONST_INT)
6680 return NULL_RTX;
6681
6682 arg0 = XEXP (arg0, 0);
6683 if (GET_CODE (arg0) == MULT)
6684 {
6685 /* (invar_0 * invar_1) * invar_2. Associate. */
6686 return simplify_giv_expr (loop,
6687 gen_rtx_MULT (mode,
6688 XEXP (arg0, 0),
6689 gen_rtx_MULT (mode,
6690 XEXP (arg0,
6691 1),
6692 arg1)),
6693 ext_val, benefit);
6694 }
6695 /* Propagate the MULT expressions to the innermost nodes. */
6696 else if (GET_CODE (arg0) == PLUS)
6697 {
6698 /* (invar_0 + invar_1) * invar_2. Distribute. */
6699 return simplify_giv_expr (loop,
6700 gen_rtx_PLUS (mode,
6701 gen_rtx_MULT (mode,
6702 XEXP (arg0,
6703 0),
6704 arg1),
6705 gen_rtx_MULT (mode,
6706 XEXP (arg0,
6707 1),
6708 arg1)),
6709 ext_val, benefit);
6710 }
6711 return gen_rtx_USE (mode, gen_rtx_MULT (mode, arg0, arg1));
6712
6713 case MULT:
6714 /* (a * invar_1) * invar_2. Associate. */
6715 return simplify_giv_expr (loop,
6716 gen_rtx_MULT (mode,
6717 XEXP (arg0, 0),
6718 gen_rtx_MULT (mode,
6719 XEXP (arg0, 1),
6720 arg1)),
6721 ext_val, benefit);
6722
6723 case PLUS:
6724 /* (a + invar_1) * invar_2. Distribute. */
6725 return simplify_giv_expr (loop,
6726 gen_rtx_PLUS (mode,
6727 gen_rtx_MULT (mode,
6728 XEXP (arg0, 0),
6729 arg1),
6730 gen_rtx_MULT (mode,
6731 XEXP (arg0, 1),
6732 arg1)),
6733 ext_val, benefit);
6734
6735 default:
6736 abort ();
6737 }
6738
6739 case ASHIFT:
6740 /* Shift by constant is multiply by power of two. */
6741 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
6742 return 0;
6743
6744 return
6745 simplify_giv_expr (loop,
6746 gen_rtx_MULT (mode,
6747 XEXP (x, 0),
6748 GEN_INT ((HOST_WIDE_INT) 1
6749 << INTVAL (XEXP (x, 1)))),
6750 ext_val, benefit);
6751
6752 case NEG:
6753 /* "-a" is "a * (-1)" */
6754 return simplify_giv_expr (loop,
6755 gen_rtx_MULT (mode, XEXP (x, 0), constm1_rtx),
6756 ext_val, benefit);
6757
6758 case NOT:
6759 /* "~a" is "-a - 1". Silly, but easy. */
6760 return simplify_giv_expr (loop,
6761 gen_rtx_MINUS (mode,
6762 gen_rtx_NEG (mode, XEXP (x, 0)),
6763 const1_rtx),
6764 ext_val, benefit);
6765
6766 case USE:
6767 /* Already in proper form for invariant. */
6768 return x;
6769
6770 case SIGN_EXTEND:
6771 case ZERO_EXTEND:
6772 case TRUNCATE:
6773 /* Conditionally recognize extensions of simple IVs. After we've
6774 computed loop traversal counts and verified the range of the
6775 source IV, we'll reevaluate this as a GIV. */
6776 if (*ext_val == NULL_RTX)
6777 {
6778 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6779 if (arg0 && *ext_val == NULL_RTX && GET_CODE (arg0) == REG)
6780 {
6781 *ext_val = gen_rtx_fmt_e (GET_CODE (x), mode, arg0);
6782 return arg0;
6783 }
6784 }
6785 goto do_default;
6786
6787 case REG:
6788 /* If this is a new register, we can't deal with it. */
6789 if (REGNO (x) >= max_reg_before_loop)
6790 return 0;
6791
6792 /* Check for biv or giv. */
6793 switch (REG_IV_TYPE (ivs, REGNO (x)))
6794 {
6795 case BASIC_INDUCT:
6796 return x;
6797 case GENERAL_INDUCT:
6798 {
6799 struct induction *v = REG_IV_INFO (ivs, REGNO (x));
6800
6801 /* Form expression from giv and add benefit. Ensure this giv
6802 can derive another and subtract any needed adjustment if so. */
6803
6804 /* Increasing the benefit here is risky. The only case in which it
6805 is arguably correct is if this is the only use of V. In other
6806 cases, this will artificially inflate the benefit of the current
6807 giv, and lead to suboptimal code. Thus, it is disabled, since
6808 potentially not reducing an only marginally beneficial giv is
6809 less harmful than reducing many givs that are not really
6810 beneficial. */
6811 {
6812 rtx single_use = regs->array[REGNO (x)].single_usage;
6813 if (single_use && single_use != const0_rtx)
6814 *benefit += v->benefit;
6815 }
6816
6817 if (v->cant_derive)
6818 return 0;
6819
6820 tem = gen_rtx_PLUS (mode, gen_rtx_MULT (mode,
6821 v->src_reg, v->mult_val),
6822 v->add_val);
6823
6824 if (v->derive_adjustment)
6825 tem = gen_rtx_MINUS (mode, tem, v->derive_adjustment);
6826 arg0 = simplify_giv_expr (loop, tem, ext_val, benefit);
6827 if (*ext_val)
6828 {
6829 if (!v->ext_dependent)
6830 return arg0;
6831 }
6832 else
6833 {
6834 *ext_val = v->ext_dependent;
6835 return arg0;
6836 }
6837 return 0;
6838 }
6839
6840 default:
6841 do_default:
6842 /* If it isn't an induction variable, and it is invariant, we
6843 may be able to simplify things further by looking through
6844 the bits we just moved outside the loop. */
6845 if (loop_invariant_p (loop, x) == 1)
6846 {
6847 struct movable *m;
6848 struct loop_movables *movables = LOOP_MOVABLES (loop);
6849
6850 for (m = movables->head; m; m = m->next)
6851 if (rtx_equal_p (x, m->set_dest))
6852 {
6853 /* Ok, we found a match. Substitute and simplify. */
6854
6855 /* If we match another movable, we must use that, as
6856 this one is going away. */
6857 if (m->match)
6858 return simplify_giv_expr (loop, m->match->set_dest,
6859 ext_val, benefit);
6860
6861 /* If consec is nonzero, this is a member of a group of
6862 instructions that were moved together. We handle this
6863 case only to the point of seeking to the last insn and
6864 looking for a REG_EQUAL. Fail if we don't find one. */
6865 if (m->consec != 0)
6866 {
6867 int i = m->consec;
6868 tem = m->insn;
6869 do
6870 {
6871 tem = NEXT_INSN (tem);
6872 }
6873 while (--i > 0);
6874
6875 tem = find_reg_note (tem, REG_EQUAL, NULL_RTX);
6876 if (tem)
6877 tem = XEXP (tem, 0);
6878 }
6879 else
6880 {
6881 tem = single_set (m->insn);
6882 if (tem)
6883 tem = SET_SRC (tem);
6884 }
6885
6886 if (tem)
6887 {
6888 /* What we are most interested in is pointer
6889 arithmetic on invariants -- only take
6890 patterns we may be able to do something with. */
6891 if (GET_CODE (tem) == PLUS
6892 || GET_CODE (tem) == MULT
6893 || GET_CODE (tem) == ASHIFT
6894 || GET_CODE (tem) == CONST_INT
6895 || GET_CODE (tem) == SYMBOL_REF)
6896 {
6897 tem = simplify_giv_expr (loop, tem, ext_val,
6898 benefit);
6899 if (tem)
6900 return tem;
6901 }
6902 else if (GET_CODE (tem) == CONST
6903 && GET_CODE (XEXP (tem, 0)) == PLUS
6904 && GET_CODE (XEXP (XEXP (tem, 0), 0)) == SYMBOL_REF
6905 && GET_CODE (XEXP (XEXP (tem, 0), 1)) == CONST_INT)
6906 {
6907 tem = simplify_giv_expr (loop, XEXP (tem, 0),
6908 ext_val, benefit);
6909 if (tem)
6910 return tem;
6911 }
6912 }
6913 break;
6914 }
6915 }
6916 break;
6917 }
6918
6919 /* Fall through to general case. */
6920 default:
6921 /* If invariant, return as USE (unless CONST_INT).
6922 Otherwise, not giv. */
6923 if (GET_CODE (x) == USE)
6924 x = XEXP (x, 0);
6925
6926 if (loop_invariant_p (loop, x) == 1)
6927 {
6928 if (GET_CODE (x) == CONST_INT)
6929 return x;
6930 if (GET_CODE (x) == CONST
6931 && GET_CODE (XEXP (x, 0)) == PLUS
6932 && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
6933 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
6934 x = XEXP (x, 0);
6935 return gen_rtx_USE (mode, x);
6936 }
6937 else
6938 return 0;
6939 }
6940 }
6941
6942 /* This routine folds invariants such that there is only ever one
6943 CONST_INT in the summation. It is only used by simplify_giv_expr. */
6944
6945 static rtx
6946 sge_plus_constant (rtx x, rtx c)
6947 {
6948 if (GET_CODE (x) == CONST_INT)
6949 return GEN_INT (INTVAL (x) + INTVAL (c));
6950 else if (GET_CODE (x) != PLUS)
6951 return gen_rtx_PLUS (GET_MODE (x), x, c);
6952 else if (GET_CODE (XEXP (x, 1)) == CONST_INT)
6953 {
6954 return gen_rtx_PLUS (GET_MODE (x), XEXP (x, 0),
6955 GEN_INT (INTVAL (XEXP (x, 1)) + INTVAL (c)));
6956 }
6957 else if (GET_CODE (XEXP (x, 0)) == PLUS
6958 || GET_CODE (XEXP (x, 1)) != PLUS)
6959 {
6960 return gen_rtx_PLUS (GET_MODE (x),
6961 sge_plus_constant (XEXP (x, 0), c), XEXP (x, 1));
6962 }
6963 else
6964 {
6965 return gen_rtx_PLUS (GET_MODE (x),
6966 sge_plus_constant (XEXP (x, 1), c), XEXP (x, 0));
6967 }
6968 }
6969
6970 static rtx
6971 sge_plus (enum machine_mode mode, rtx x, rtx y)
6972 {
6973 while (GET_CODE (y) == PLUS)
6974 {
6975 rtx a = XEXP (y, 0);
6976 if (GET_CODE (a) == CONST_INT)
6977 x = sge_plus_constant (x, a);
6978 else
6979 x = gen_rtx_PLUS (mode, x, a);
6980 y = XEXP (y, 1);
6981 }
6982 if (GET_CODE (y) == CONST_INT)
6983 x = sge_plus_constant (x, y);
6984 else
6985 x = gen_rtx_PLUS (mode, x, y);
6986 return x;
6987 }
6988 \f
6989 /* Help detect a giv that is calculated by several consecutive insns;
6990 for example,
6991 giv = biv * M
6992 giv = giv + A
6993 The caller has already identified the first insn P as having a giv as dest;
6994 we check that all other insns that set the same register follow
6995 immediately after P, that they alter nothing else,
6996 and that the result of the last is still a giv.
6997
6998 The value is 0 if the reg set in P is not really a giv.
6999 Otherwise, the value is the amount gained by eliminating
7000 all the consecutive insns that compute the value.
7001
7002 FIRST_BENEFIT is the amount gained by eliminating the first insn, P.
7003 SRC_REG is the reg of the biv; DEST_REG is the reg of the giv.
7004
7005 The coefficients of the ultimate giv value are stored in
7006 *MULT_VAL and *ADD_VAL. */
7007
7008 static int
7009 consec_sets_giv (const struct loop *loop, int first_benefit, rtx p,
7010 rtx src_reg, rtx dest_reg, rtx *add_val, rtx *mult_val,
7011 rtx *ext_val, rtx *last_consec_insn)
7012 {
7013 struct loop_ivs *ivs = LOOP_IVS (loop);
7014 struct loop_regs *regs = LOOP_REGS (loop);
7015 int count;
7016 enum rtx_code code;
7017 int benefit;
7018 rtx temp;
7019 rtx set;
7020
7021 /* Indicate that this is a giv so that we can update the value produced in
7022 each insn of the multi-insn sequence.
7023
7024 This induction structure will be used only by the call to
7025 general_induction_var below, so we can allocate it on our stack.
7026 If this is a giv, our caller will replace the induct var entry with
7027 a new induction structure. */
7028 struct induction *v;
7029
7030 if (REG_IV_TYPE (ivs, REGNO (dest_reg)) != UNKNOWN_INDUCT)
7031 return 0;
7032
7033 v = alloca (sizeof (struct induction));
7034 v->src_reg = src_reg;
7035 v->mult_val = *mult_val;
7036 v->add_val = *add_val;
7037 v->benefit = first_benefit;
7038 v->cant_derive = 0;
7039 v->derive_adjustment = 0;
7040 v->ext_dependent = NULL_RTX;
7041
7042 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
7043 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
7044
7045 count = regs->array[REGNO (dest_reg)].n_times_set - 1;
7046
7047 while (count > 0)
7048 {
7049 p = NEXT_INSN (p);
7050 code = GET_CODE (p);
7051
7052 /* If libcall, skip to end of call sequence. */
7053 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
7054 p = XEXP (temp, 0);
7055
7056 if (code == INSN
7057 && (set = single_set (p))
7058 && GET_CODE (SET_DEST (set)) == REG
7059 && SET_DEST (set) == dest_reg
7060 && (general_induction_var (loop, SET_SRC (set), &src_reg,
7061 add_val, mult_val, ext_val, 0,
7062 &benefit, VOIDmode)
7063 /* Giv created by equivalent expression. */
7064 || ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX))
7065 && general_induction_var (loop, XEXP (temp, 0), &src_reg,
7066 add_val, mult_val, ext_val, 0,
7067 &benefit, VOIDmode)))
7068 && src_reg == v->src_reg)
7069 {
7070 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
7071 benefit += libcall_benefit (p);
7072
7073 count--;
7074 v->mult_val = *mult_val;
7075 v->add_val = *add_val;
7076 v->benefit += benefit;
7077 }
7078 else if (code != NOTE)
7079 {
7080 /* Allow insns that set something other than this giv to a
7081 constant. Such insns are needed on machines which cannot
7082 embed long constants in an instruction and should not disqualify a giv. */
7083 if (code == INSN
7084 && (set = single_set (p))
7085 && SET_DEST (set) != dest_reg
7086 && CONSTANT_P (SET_SRC (set)))
7087 continue;
7088
7089 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
7090 return 0;
7091 }
7092 }
7093
7094 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
7095 *last_consec_insn = p;
7096 return v->benefit;
7097 }
7098 \f
7099 /* Return an rtx, if any, that expresses giv G2 as a function of the register
7100 represented by G1. If no such expression can be found, or it is clear that
7101 it cannot possibly be a valid address, 0 is returned.
7102
7103 To perform the computation, we note that
7104 G1 = x * v + a and
7105 G2 = y * v + b
7106 where `v' is the biv.
7107
7108 So G2 = (y/x) * G1 + (b - a*y/x).
7109
7110 Note that MULT = y/x.
7111
7112 Update: A and B are now allowed to be additive expressions such that
7113 B contains all variables in A. That is, computing B-A will not require
7114 subtracting variables. */
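/* For illustration (hypothetical constants): if G1 = 2*v + 3 and
   G2 = 4*v + 10, then MULT = y/x = 2 and the addend computed here is
   10 - 3*2 = 4, giving G2 = 2*G1 + 4.  */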
7115
7116 static rtx
7117 express_from_1 (rtx a, rtx b, rtx mult)
7118 {
7119 /* If MULT is zero, then A*MULT is zero, and our expression is B. */
7120
7121 if (mult == const0_rtx)
7122 return b;
7123
7124 /* If MULT is not 1, we cannot handle A with non-constants, since we
7125 would then be required to subtract multiples of the registers in A.
7126 This is theoretically possible, and may even apply to some Fortran
7127 constructs, but it is a lot of work and we do not attempt it here. */
7128
7129 if (mult != const1_rtx && GET_CODE (a) != CONST_INT)
7130 return NULL_RTX;
7131
7132 /* In general these structures are sorted top to bottom (down the PLUS
7133 chain), but not left to right across the PLUS. If B is a higher
7134 order giv than A, we can strip one level and recurse. If A is higher
7135 order, we'll eventually bail out, but won't know that until the end.
7136 If they are the same, we'll strip one level around this loop. */
7137
7138 while (GET_CODE (a) == PLUS && GET_CODE (b) == PLUS)
7139 {
7140 rtx ra, rb, oa, ob, tmp;
7141
7142 ra = XEXP (a, 0), oa = XEXP (a, 1);
7143 if (GET_CODE (ra) == PLUS)
7144 tmp = ra, ra = oa, oa = tmp;
7145
7146 rb = XEXP (b, 0), ob = XEXP (b, 1);
7147 if (GET_CODE (rb) == PLUS)
7148 tmp = rb, rb = ob, ob = tmp;
7149
7150 if (rtx_equal_p (ra, rb))
7151 /* We matched: remove one reg completely. */
7152 a = oa, b = ob;
7153 else if (GET_CODE (ob) != PLUS && rtx_equal_p (ra, ob))
7154 /* An alternate match. */
7155 a = oa, b = rb;
7156 else if (GET_CODE (oa) != PLUS && rtx_equal_p (oa, rb))
7157 /* An alternate match. */
7158 a = ra, b = ob;
7159 else
7160 {
7161 /* Indicates an extra register in B. Strip one level from B and
7162 recurse, hoping B was the higher order expression. */
7163 ob = express_from_1 (a, ob, mult);
7164 if (ob == NULL_RTX)
7165 return NULL_RTX;
7166 return gen_rtx_PLUS (GET_MODE (b), rb, ob);
7167 }
7168 }
7169
7170 /* Here we are at the last level of A, go through the cases hoping to
7171 get rid of everything but a constant. */
7172
7173 if (GET_CODE (a) == PLUS)
7174 {
7175 rtx ra, oa;
7176
7177 ra = XEXP (a, 0), oa = XEXP (a, 1);
7178 if (rtx_equal_p (oa, b))
7179 oa = ra;
7180 else if (!rtx_equal_p (ra, b))
7181 return NULL_RTX;
7182
7183 if (GET_CODE (oa) != CONST_INT)
7184 return NULL_RTX;
7185
7186 return GEN_INT (-INTVAL (oa) * INTVAL (mult));
7187 }
7188 else if (GET_CODE (a) == CONST_INT)
7189 {
7190 return plus_constant (b, -INTVAL (a) * INTVAL (mult));
7191 }
7192 else if (CONSTANT_P (a))
7193 {
7194 enum machine_mode mode_a = GET_MODE (a);
7195 enum machine_mode mode_b = GET_MODE (b);
7196 enum machine_mode mode = mode_b == VOIDmode ? mode_a : mode_b;
7197 return simplify_gen_binary (MINUS, mode, b, a);
7198 }
7199 else if (GET_CODE (b) == PLUS)
7200 {
7201 if (rtx_equal_p (a, XEXP (b, 0)))
7202 return XEXP (b, 1);
7203 else if (rtx_equal_p (a, XEXP (b, 1)))
7204 return XEXP (b, 0);
7205 else
7206 return NULL_RTX;
7207 }
7208 else if (rtx_equal_p (a, b))
7209 return const0_rtx;
7210
7211 return NULL_RTX;
7212 }
7213
7214 rtx
7215 express_from (struct induction *g1, struct induction *g2)
7216 {
7217 rtx mult, add;
7218
7219 /* The value that G1 will be multiplied by must be a constant integer. Also,
7220 the only chance we have of getting a valid address is if y/x (see above
7221 for notation) is also an integer. */
7222 if (GET_CODE (g1->mult_val) == CONST_INT
7223 && GET_CODE (g2->mult_val) == CONST_INT)
7224 {
7225 if (g1->mult_val == const0_rtx
7226 || (g1->mult_val == constm1_rtx
7227 && INTVAL (g2->mult_val)
7228 == (HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1))
7229 || INTVAL (g2->mult_val) % INTVAL (g1->mult_val) != 0)
7230 return NULL_RTX;
7231 mult = GEN_INT (INTVAL (g2->mult_val) / INTVAL (g1->mult_val));
7232 }
7233 else if (rtx_equal_p (g1->mult_val, g2->mult_val))
7234 mult = const1_rtx;
7235 else
7236 {
7237 /* ??? Find out if the one is a multiple of the other? */
7238 return NULL_RTX;
7239 }
7240
7241 add = express_from_1 (g1->add_val, g2->add_val, mult);
7242 if (add == NULL_RTX)
7243 {
7244 /* Failed. If we've got a multiplication factor between G1 and G2,
7245 scale G1's addend and try again. */
7246 if (INTVAL (mult) > 1)
7247 {
7248 rtx g1_add_val = g1->add_val;
7249 if (GET_CODE (g1_add_val) == MULT
7250 && GET_CODE (XEXP (g1_add_val, 1)) == CONST_INT)
7251 {
7252 HOST_WIDE_INT m;
7253 m = INTVAL (mult) * INTVAL (XEXP (g1_add_val, 1));
7254 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val),
7255 XEXP (g1_add_val, 0), GEN_INT (m));
7256 }
7257 else
7258 {
7259 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val), g1_add_val,
7260 mult);
7261 }
7262
7263 add = express_from_1 (g1_add_val, g2->add_val, const1_rtx);
7264 }
7265 }
7266 if (add == NULL_RTX)
7267 return NULL_RTX;
7268
7269 /* Form simplified final result. */
7270 if (mult == const0_rtx)
7271 return add;
7272 else if (mult == const1_rtx)
7273 mult = g1->dest_reg;
7274 else
7275 mult = gen_rtx_MULT (g2->mode, g1->dest_reg, mult);
7276
7277 if (add == const0_rtx)
7278 return mult;
7279 else
7280 {
7281 if (GET_CODE (add) == PLUS
7282 && CONSTANT_P (XEXP (add, 1)))
7283 {
7284 rtx tem = XEXP (add, 1);
7285 mult = gen_rtx_PLUS (g2->mode, mult, XEXP (add, 0));
7286 add = tem;
7287 }
7288
7289 return gen_rtx_PLUS (g2->mode, mult, add);
7290 }
7291 }
7292 \f
7293 /* Return an rtx, if any, that expresses giv G2 as a function of the register
7294 represented by G1. This indicates that G2 should be combined with G1 and
7295 that G2 can use (either directly or via an address expression) a register
7296 used to represent G1. */
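/* For illustration (hypothetical givs): if G1 lives in (reg 100) and
   express_from finds that G2 = G1 + 4, then a DEST_ADDR giv G2 can address
   its memory operand as (plus (reg 100) (const_int 4)), provided that form
   is a valid address for G2's MEM and no more expensive than a register.  */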
7297
7298 static rtx
7299 combine_givs_p (struct induction *g1, struct induction *g2)
7300 {
7301 rtx comb, ret;
7302
7303 /* With the introduction of ext dependent givs, we must be careful about modes.
7304 G2 must not use a wider mode than G1. */
7305 if (GET_MODE_SIZE (g1->mode) < GET_MODE_SIZE (g2->mode))
7306 return NULL_RTX;
7307
7308 ret = comb = express_from (g1, g2);
7309 if (comb == NULL_RTX)
7310 return NULL_RTX;
7311 if (g1->mode != g2->mode)
7312 ret = gen_lowpart (g2->mode, comb);
7313
7314 /* If these givs are identical, they can be combined. We use the results
7315 of express_from because the addends are not in a canonical form, so
7316 rtx_equal_p is a weaker test. */
7317 /* But don't combine a DEST_REG giv with a DEST_ADDR giv; we want the
7318 combination to be the other way round. */
7319 if (comb == g1->dest_reg
7320 && (g1->giv_type == DEST_REG || g2->giv_type == DEST_ADDR))
7321 {
7322 return ret;
7323 }
7324
7325 /* If G2 can be expressed as a function of G1 and that function is valid
7326 as an address and no more expensive than using a register for G2,
7327 the expression of G2 in terms of G1 can be used. */
7328 if (ret != NULL_RTX
7329 && g2->giv_type == DEST_ADDR
7330 && memory_address_p (GET_MODE (g2->mem), ret))
7331 return ret;
7332
7333 return NULL_RTX;
7334 }
7335 \f
7336 /* Check each extension dependent giv in this class to see if its
7337 root biv is safe from wrapping in the interior mode, which would
7338 make the giv illegal. */
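/* For illustration (hypothetical values): a QImode biv that starts at 0,
   is incremented by 1 and runs for a known 100 iterations ends at 100,
   which fits both the unsigned (0..255) and signed (-128..127) ranges of
   QImode, so givs that ZERO_EXTEND or SIGN_EXTEND it are safe; if it ran
   for 200 iterations, only the zero extension would remain safe.  */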
7339
7340 static void
7341 check_ext_dependent_givs (const struct loop *loop, struct iv_class *bl)
7342 {
7343 struct loop_info *loop_info = LOOP_INFO (loop);
7344 int ze_ok = 0, se_ok = 0, info_ok = 0;
7345 enum machine_mode biv_mode = GET_MODE (bl->biv->src_reg);
7346 HOST_WIDE_INT start_val;
7347 unsigned HOST_WIDE_INT u_end_val = 0;
7348 unsigned HOST_WIDE_INT u_start_val = 0;
7349 rtx incr = pc_rtx;
7350 struct induction *v;
7351
7352 /* Make sure the iteration data is available. We must have
7353 constants in order to be certain of no overflow. */
7354 if (loop_info->n_iterations > 0
7355 && bl->initial_value
7356 && GET_CODE (bl->initial_value) == CONST_INT
7357 && (incr = biv_total_increment (bl))
7358 && GET_CODE (incr) == CONST_INT
7359 /* Make sure the host can represent the arithmetic. */
7360 && HOST_BITS_PER_WIDE_INT >= GET_MODE_BITSIZE (biv_mode))
7361 {
7362 unsigned HOST_WIDE_INT abs_incr, total_incr;
7363 HOST_WIDE_INT s_end_val;
7364 int neg_incr;
7365
7366 info_ok = 1;
7367 start_val = INTVAL (bl->initial_value);
7368 u_start_val = start_val;
7369
7370 neg_incr = 0, abs_incr = INTVAL (incr);
7371 if (INTVAL (incr) < 0)
7372 neg_incr = 1, abs_incr = -abs_incr;
7373 total_incr = abs_incr * loop_info->n_iterations;
7374
7375 /* Check for host arithmetic overflow. */
7376 if (total_incr / loop_info->n_iterations == abs_incr)
7377 {
7378 unsigned HOST_WIDE_INT u_max;
7379 HOST_WIDE_INT s_max;
7380
7381 u_end_val = start_val + (neg_incr ? -total_incr : total_incr);
7382 s_end_val = u_end_val;
7383 u_max = GET_MODE_MASK (biv_mode);
7384 s_max = u_max >> 1;
7385
7386 /* Check zero extension of biv ok. */
7387 if (start_val >= 0
7388 /* Check for host arithmetic overflow. */
7389 && (neg_incr
7390 ? u_end_val < u_start_val
7391 : u_end_val > u_start_val)
7392 /* Check for target arithmetic overflow. */
7393 && (neg_incr
7394 ? 1 /* taken care of with host overflow */
7395 : u_end_val <= u_max))
7396 {
7397 ze_ok = 1;
7398 }
7399
7400 /* Check sign extension of biv ok. */
7401 /* ??? While it is true that overflow with signed and pointer
7402 arithmetic is undefined, I fear too many programmers don't
7403 keep this fact in mind -- myself included on occasion.
7404 So we are conservative with the signed overflow optimizations. */
7405 if (start_val >= -s_max - 1
7406 /* Check for host arithmetic overflow. */
7407 && (neg_incr
7408 ? s_end_val < start_val
7409 : s_end_val > start_val)
7410 /* Check for target arithmetic overflow. */
7411 && (neg_incr
7412 ? s_end_val >= -s_max - 1
7413 : s_end_val <= s_max))
7414 {
7415 se_ok = 1;
7416 }
7417 }
7418 }
7419
7420 /* If we know the BIV is compared at run-time against an
7421 invariant value, and the increment is +/- 1, we may also
7422 be able to prove that the BIV cannot overflow. */
7423 else if (bl->biv->src_reg == loop_info->iteration_var
7424 && loop_info->comparison_value
7425 && loop_invariant_p (loop, loop_info->comparison_value)
7426 && (incr = biv_total_increment (bl))
7427 && GET_CODE (incr) == CONST_INT)
7428 {
7429 /* If the increment is +1, and the exit test is a <,
7430 the BIV cannot overflow. (For <=, we have the
7431 problematic case that the comparison value might
7432 be the maximum value of the range.) */
7433 if (INTVAL (incr) == 1)
7434 {
7435 if (loop_info->comparison_code == LT)
7436 se_ok = ze_ok = 1;
7437 else if (loop_info->comparison_code == LTU)
7438 ze_ok = 1;
7439 }
7440
7441 /* Likewise for increment -1 and exit test >. */
7442 if (INTVAL (incr) == -1)
7443 {
7444 if (loop_info->comparison_code == GT)
7445 se_ok = ze_ok = 1;
7446 else if (loop_info->comparison_code == GTU)
7447 ze_ok = 1;
7448 }
7449 }
7450
7451 /* Invalidate givs that fail the tests. */
7452 for (v = bl->giv; v; v = v->next_iv)
7453 if (v->ext_dependent)
7454 {
7455 enum rtx_code code = GET_CODE (v->ext_dependent);
7456 int ok = 0;
7457
7458 switch (code)
7459 {
7460 case SIGN_EXTEND:
7461 ok = se_ok;
7462 break;
7463 case ZERO_EXTEND:
7464 ok = ze_ok;
7465 break;
7466
7467 case TRUNCATE:
7468 /* We don't know whether this value is being used as either
7469 signed or unsigned, so to safely truncate we must satisfy
7470 both. The initial check here verifies the BIV itself;
7471 once that is successful we may check its range wrt the
7472 derived GIV. This works only if we were able to determine
7473 constant start and end values above. */
7474 if (se_ok && ze_ok && info_ok)
7475 {
7476 enum machine_mode outer_mode = GET_MODE (v->ext_dependent);
7477 unsigned HOST_WIDE_INT max = GET_MODE_MASK (outer_mode) >> 1;
7478
7479 /* We know from the above that both endpoints are nonnegative,
7480 and that there is no wrapping. Verify that both endpoints
7481 are within the (signed) range of the outer mode. */
7482 if (u_start_val <= max && u_end_val <= max)
7483 ok = 1;
7484 }
7485 break;
7486
7487 default:
7488 abort ();
7489 }
7490
7491 if (ok)
7492 {
7493 if (loop_dump_stream)
7494 {
7495 fprintf (loop_dump_stream,
7496 "Verified ext dependent giv at %d of reg %d\n",
7497 INSN_UID (v->insn), bl->regno);
7498 }
7499 }
7500 else
7501 {
7502 if (loop_dump_stream)
7503 {
7504 const char *why;
7505
7506 if (info_ok)
7507 why = "biv iteration values overflowed";
7508 else
7509 {
7510 if (incr == pc_rtx)
7511 incr = biv_total_increment (bl);
7512 if (incr == const1_rtx)
7513 why = "biv iteration info incomplete; incr by 1";
7514 else
7515 why = "biv iteration info incomplete";
7516 }
7517
7518 fprintf (loop_dump_stream,
7519 "Failed ext dependent giv at %d, %s\n",
7520 INSN_UID (v->insn), why);
7521 }
7522 v->ignore = 1;
7523 bl->all_reduced = 0;
7524 }
7525 }
7526 }
7527
7528 /* Generate a version of VALUE in a mode appropriate for initializing V. */
7529
7530 rtx
7531 extend_value_for_giv (struct induction *v, rtx value)
7532 {
7533 rtx ext_dep = v->ext_dependent;
7534
7535 if (! ext_dep)
7536 return value;
7537
7538 /* Recall that check_ext_dependent_givs verified that the known bounds
7539 of a biv did not overflow or wrap with respect to the extension for
7540 the giv. Therefore, constants need no additional adjustment. */
7541 if (CONSTANT_P (value) && GET_MODE (value) == VOIDmode)
7542 return value;
7543
7544 /* Otherwise, we must adjust the value to compensate for the
7545 differing modes of the biv and the giv. */
7546 return gen_rtx_fmt_e (GET_CODE (ext_dep), GET_MODE (ext_dep), value);
7547 }
7548 \f
7549 struct combine_givs_stats
7550 {
7551 int giv_number;
7552 int total_benefit;
7553 };
7554
7555 static int
7556 cmp_combine_givs_stats (const void *xp, const void *yp)
7557 {
7558 const struct combine_givs_stats * const x =
7559 (const struct combine_givs_stats *) xp;
7560 const struct combine_givs_stats * const y =
7561 (const struct combine_givs_stats *) yp;
7562 int d;
7563 d = y->total_benefit - x->total_benefit;
7564 /* Stabilize the sort. */
7565 if (!d)
7566 d = x->giv_number - y->giv_number;
7567 return d;
7568 }
7569
7570 /* Check all pairs of givs for iv_class BL and see if any can be combined with
7571 any other. If so, point SAME to the giv combined with and set NEW_REG to
7572 be an expression (in terms of the other giv's DEST_REG) equivalent to the
7573 giv. Also, update BENEFIT and related fields for cost/benefit analysis. */
7574
7575 static void
7576 combine_givs (struct loop_regs *regs, struct iv_class *bl)
7577 {
7578 /* Additional benefit to add for being combined multiple times. */
7579 const int extra_benefit = 3;
7580
7581 struct induction *g1, *g2, **giv_array;
7582 int i, j, k, giv_count;
7583 struct combine_givs_stats *stats;
7584 rtx *can_combine;
7585
7586 /* Count givs, because bl->giv_count is incorrect here. */
7587 giv_count = 0;
7588 for (g1 = bl->giv; g1; g1 = g1->next_iv)
7589 if (!g1->ignore)
7590 giv_count++;
7591
7592 giv_array = alloca (giv_count * sizeof (struct induction *));
7593 i = 0;
7594 for (g1 = bl->giv; g1; g1 = g1->next_iv)
7595 if (!g1->ignore)
7596 giv_array[i++] = g1;
7597
7598 stats = xcalloc (giv_count, sizeof (*stats));
7599 can_combine = xcalloc (giv_count, giv_count * sizeof (rtx));
7600
7601 for (i = 0; i < giv_count; i++)
7602 {
7603 int this_benefit;
7604 rtx single_use;
7605
7606 g1 = giv_array[i];
7607 stats[i].giv_number = i;
7608
7609 /* If a DEST_REG GIV is used only once, do not allow it to combine
7610 with anything, for in doing so we will gain nothing that cannot
7611 be had by simply letting the GIV with which we would have combined
7612 be reduced on its own. The lossage shows up in particular with
7613 DEST_ADDR targets on hosts with reg+reg addressing, though it can
7614 be seen elsewhere as well. */
7615 if (g1->giv_type == DEST_REG
7616 && (single_use = regs->array[REGNO (g1->dest_reg)].single_usage)
7617 && single_use != const0_rtx)
7618 continue;
7619
7620 this_benefit = g1->benefit;
7621 /* Add an additional weight for zero addends. */
7622 if (g1->no_const_addval)
7623 this_benefit += 1;
7624
7625 for (j = 0; j < giv_count; j++)
7626 {
7627 rtx this_combine;
7628
7629 g2 = giv_array[j];
7630 if (g1 != g2
7631 && (this_combine = combine_givs_p (g1, g2)) != NULL_RTX)
7632 {
7633 can_combine[i * giv_count + j] = this_combine;
7634 this_benefit += g2->benefit + extra_benefit;
7635 }
7636 }
7637 stats[i].total_benefit = this_benefit;
7638 }
7639
7640 /* Iterate, combining until we can't. */
7641 restart:
7642 qsort (stats, giv_count, sizeof (*stats), cmp_combine_givs_stats);
7643
7644 if (loop_dump_stream)
7645 {
7646 fprintf (loop_dump_stream, "Sorted combine statistics:\n");
7647 for (k = 0; k < giv_count; k++)
7648 {
7649 g1 = giv_array[stats[k].giv_number];
7650 if (!g1->combined_with && !g1->same)
7651 fprintf (loop_dump_stream, " {%d, %d}",
7652 INSN_UID (giv_array[stats[k].giv_number]->insn),
7653 stats[k].total_benefit);
7654 }
7655 putc ('\n', loop_dump_stream);
7656 }
7657
7658 for (k = 0; k < giv_count; k++)
7659 {
7660 int g1_add_benefit = 0;
7661
7662 i = stats[k].giv_number;
7663 g1 = giv_array[i];
7664
7665 /* If it has already been combined, skip. */
7666 if (g1->combined_with || g1->same)
7667 continue;
7668
7669 for (j = 0; j < giv_count; j++)
7670 {
7671 g2 = giv_array[j];
7672 if (g1 != g2 && can_combine[i * giv_count + j]
7673 /* If it has already been combined, skip. */
7674 && ! g2->same && ! g2->combined_with)
7675 {
7676 int l;
7677
7678 g2->new_reg = can_combine[i * giv_count + j];
7679 g2->same = g1;
7680 /* For the destination, we may now substitute a memory expression
7681 for the register. This changes the costs considerably, so add the
7682 compensation. */
7683 if (g2->giv_type == DEST_ADDR)
7684 g2->benefit = (g2->benefit + reg_address_cost
7685 - address_cost (g2->new_reg,
7686 GET_MODE (g2->mem)));
7687 g1->combined_with++;
7688 g1->lifetime += g2->lifetime;
7689
7690 g1_add_benefit += g2->benefit;
7691
7692 /* ??? The new final_[bg]iv_value code does a much better job
7693 of finding replaceable giv's, and hence this code may no
7694 longer be necessary. */
7695 if (! g2->replaceable && REG_USERVAR_P (g2->dest_reg))
7696 g1_add_benefit -= copy_cost;
7697
7698 /* To help optimize the next set of combinations, remove
7699 this giv from the benefits of other potential mates. */
7700 for (l = 0; l < giv_count; ++l)
7701 {
7702 int m = stats[l].giv_number;
7703 if (can_combine[m * giv_count + j])
7704 stats[l].total_benefit -= g2->benefit + extra_benefit;
7705 }
7706
7707 if (loop_dump_stream)
7708 fprintf (loop_dump_stream,
7709 "giv at %d combined with giv at %d; new benefit %d + %d, lifetime %d\n",
7710 INSN_UID (g2->insn), INSN_UID (g1->insn),
7711 g1->benefit, g1_add_benefit, g1->lifetime);
7712 }
7713 }
7714
7715 /* To help optimize the next set of combinations, remove
7716 this giv from the benefits of other potential mates. */
7717 if (g1->combined_with)
7718 {
7719 for (j = 0; j < giv_count; ++j)
7720 {
7721 int m = stats[j].giv_number;
7722 if (can_combine[m * giv_count + i])
7723 stats[j].total_benefit -= g1->benefit + extra_benefit;
7724 }
7725
7726 g1->benefit += g1_add_benefit;
7727
7728 /* We've finished with this giv, and everything it touched.
7729 Restart the combination so that proper weights for the
7730 rest of the givs are properly taken into account. */
7731 /* ??? Ideally we would compact the arrays at this point, so
7732 as to not cover old ground. But sanely compacting
7733 can_combine is tricky. */
7734 goto restart;
7735 }
7736 }
7737
7738 /* Clean up. */
7739 free (stats);
7740 free (can_combine);
7741 }
7742 \f
7743 /* Generate sequence for REG = B * M + A. B is the initial value of
7744 the basic induction variable, M a multiplicative constant, A an
7745 additive constant and REG the destination register. */
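/* For illustration (hypothetical operands): with REG = (reg 200),
   B = (reg 100), M = (const_int 4) and A = (const_int 8), the emitted
   sequence might be a shift followed by an add,
       (set (reg 200) (ashift (reg 100) (const_int 2)))
       (set (reg 200) (plus (reg 200) (const_int 8)))
   depending on what expand_mult_add considers cheapest for the target.  */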
7746
7747 static rtx
7748 gen_add_mult (rtx b, rtx m, rtx a, rtx reg)
7749 {
7750 rtx seq;
7751 rtx result;
7752
7753 start_sequence ();
7754 /* Use unsigned arithmetic. */
7755 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7756 if (reg != result)
7757 emit_move_insn (reg, result);
7758 seq = get_insns ();
7759 end_sequence ();
7760
7761 return seq;
7762 }
7763
7764
7765 /* Update registers created in insn sequence SEQ. */
7766
7767 static void
7768 loop_regs_update (const struct loop *loop ATTRIBUTE_UNUSED, rtx seq)
7769 {
7770 rtx insn;
7771
7772 /* Update register info for alias analysis. */
7773
7774 insn = seq;
7775 while (insn != NULL_RTX)
7776 {
7777 rtx set = single_set (insn);
7778
7779 if (set && GET_CODE (SET_DEST (set)) == REG)
7780 record_base_value (REGNO (SET_DEST (set)), SET_SRC (set), 0);
7781
7782 insn = NEXT_INSN (insn);
7783 }
7784 }
7785
7786
7787 /* EMIT code before BEFORE_BB/BEFORE_INSN to set REG = B * M + A. B
7788 is the initial value of the basic induction variable, M a
7789 multiplicative constant, A an additive constant and REG the
7790 destination register. */
7791
7792 void
7793 loop_iv_add_mult_emit_before (const struct loop *loop, rtx b, rtx m, rtx a,
7794 rtx reg, basic_block before_bb, rtx before_insn)
7795 {
7796 rtx seq;
7797
7798 if (! before_insn)
7799 {
7800 loop_iv_add_mult_hoist (loop, b, m, a, reg);
7801 return;
7802 }
7803
7804 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7805 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7806
7807 /* Increase the lifetime of any invariants moved further in code. */
7808 update_reg_last_use (a, before_insn);
7809 update_reg_last_use (b, before_insn);
7810 update_reg_last_use (m, before_insn);
7811
7812 /* It is possible that the expansion created lots of new registers.
7813 Iterate over the sequence we just created and record them all. We
7814 must do this before inserting the sequence. */
7815 loop_regs_update (loop, seq);
7816
7817 loop_insn_emit_before (loop, before_bb, before_insn, seq);
7818 }
7819
7820
7821 /* Emit insns at the end of the loop to set REG = B * M + A. B is the
7822 initial value of the basic induction variable, M a multiplicative
7823 constant, A an additive constant and REG the destination
7824 register. */
7825
7826 void
7827 loop_iv_add_mult_sink (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
7828 {
7829 rtx seq;
7830
7831 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7832 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7833
7834 /* Increase the lifetime of any invariants moved further in code.
7835 ??? Is this really necessary? */
7836 update_reg_last_use (a, loop->sink);
7837 update_reg_last_use (b, loop->sink);
7838 update_reg_last_use (m, loop->sink);
7839
7840 /* It is possible that the expansion created lots of new registers.
7841 Iterate over the sequence we just created and record them all. We
7842 must do this before inserting the sequence. */
7843 loop_regs_update (loop, seq);
7844
7845 loop_insn_sink (loop, seq);
7846 }
7847
7848
7849 /* Emit insns in the loop pre-header to set REG = B * M + A. B is the
7850 initial value of the basic induction variable, M a multiplicative constant,
7851 A an additive constant and REG the destination register. */
7852
7853 void
7854 loop_iv_add_mult_hoist (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
7855 {
7856 rtx seq;
7857
7858 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7859 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7860
7861 /* It is possible that the expansion created lots of new registers.
7862 Iterate over the sequence we just created and record them all. We
7863 must do this before inserting the sequence. */
7864 loop_regs_update (loop, seq);
7865
7866 loop_insn_hoist (loop, seq);
7867 }
7868
7869
7870
7871 /* Similar to gen_add_mult, but compute cost rather than generating
7872 sequence. */
7873
7874 static int
7875 iv_add_mult_cost (rtx b, rtx m, rtx a, rtx reg)
7876 {
7877 int cost = 0;
7878 rtx last, result;
7879
7880 start_sequence ();
7881 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7882 if (reg != result)
7883 emit_move_insn (reg, result);
7884 last = get_last_insn ();
7885 while (last)
7886 {
7887 rtx t = single_set (last);
7888 if (t)
7889 cost += rtx_cost (SET_SRC (t), SET);
7890 last = PREV_INSN (last);
7891 }
7892 end_sequence ();
7893 return cost;
7894 }
7895 \f
7896 /* Test whether A * B can be computed without
7897 an actual multiply insn. Value is 1 if so.
7898
7899 ??? This function stinks because it generates a ton of wasted RTL
7900 ??? and as a result fragments GC memory to no end. There are other
7901 ??? places in the compiler which are invoked a lot and do the same
7902 ??? thing, generate wasted RTL just to see if something is possible. */
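/* For illustration (hypothetical operands): multiplying a register by the
   constant 5 usually expands to a shift and an add, which stays within the
   three-insn limit below and contains no MULT, so the product is cheap;
   multiplying by a constant such as 291 may instead expand to an actual
   MULT insn or a long shift/add chain, in which case it is not.  */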
7903
7904 static int
7905 product_cheap_p (rtx a, rtx b)
7906 {
7907 rtx tmp;
7908 int win, n_insns;
7909
7910 /* If only one is constant, make it B. */
7911 if (GET_CODE (a) == CONST_INT)
7912 tmp = a, a = b, b = tmp;
7913
7914 /* If first constant, both constant, so don't need multiply. */
7915 if (GET_CODE (a) == CONST_INT)
7916 return 1;
7917
7918 /* If second not constant, neither is constant, so would need multiply. */
7919 if (GET_CODE (b) != CONST_INT)
7920 return 0;
7921
7922 /* One operand is constant, so might not need multiply insn. Generate the
7923 code for the multiply and see if a call or multiply, or long sequence
7924 of insns is generated. */
7925
7926 start_sequence ();
7927 expand_mult (GET_MODE (a), a, b, NULL_RTX, 1);
7928 tmp = get_insns ();
7929 end_sequence ();
7930
7931 win = 1;
7932 if (INSN_P (tmp))
7933 {
7934 n_insns = 0;
7935 while (tmp != NULL_RTX)
7936 {
7937 rtx next = NEXT_INSN (tmp);
7938
7939 if (++n_insns > 3
7940 || GET_CODE (tmp) != INSN
7941 || (GET_CODE (PATTERN (tmp)) == SET
7942 && GET_CODE (SET_SRC (PATTERN (tmp))) == MULT)
7943 || (GET_CODE (PATTERN (tmp)) == PARALLEL
7944 && GET_CODE (XVECEXP (PATTERN (tmp), 0, 0)) == SET
7945 && GET_CODE (SET_SRC (XVECEXP (PATTERN (tmp), 0, 0))) == MULT))
7946 {
7947 win = 0;
7948 break;
7949 }
7950
7951 tmp = next;
7952 }
7953 }
7954 else if (GET_CODE (tmp) == SET
7955 && GET_CODE (SET_SRC (tmp)) == MULT)
7956 win = 0;
7957 else if (GET_CODE (tmp) == PARALLEL
7958 && GET_CODE (XVECEXP (tmp, 0, 0)) == SET
7959 && GET_CODE (SET_SRC (XVECEXP (tmp, 0, 0))) == MULT)
7960 win = 0;
7961
7962 return win;
7963 }
7964 \f
7965 /* Check to see if loop can be terminated by a "decrement and branch until
7966 zero" instruction. If so, add a REG_NONNEG note to the branch insn.
7967 Also try reversing an increment loop to a decrement loop
7968 to see if the optimization can be performed.
7969 Value is nonzero if optimization was performed. */
7970
7971 /* This is useful even if the architecture doesn't have such an insn,
7972 because it might change a loop which increments from 0 to n into a loop
7973 which decrements from n to 0. A loop that decrements to zero is usually
7974 faster than one that increments from zero. */
7975
7976 /* ??? This could be rewritten to use some of the loop unrolling procedures,
7977 such as approx_final_value, biv_total_increment, loop_iterations, and
7978 final_[bg]iv_value. */
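/* In source terms, the reversal turns a (hypothetical) counting loop

       for (i = 0; i < n; i++)
         body;

   into the equivalent

       for (i = n; --i >= 0; )
         body;

   when I is used only to count iterations, so that the exit test becomes a
   comparison against zero (or a decrement-and-branch insn).  */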
7979
7980 static int
7981 check_dbra_loop (struct loop *loop, int insn_count)
7982 {
7983 struct loop_info *loop_info = LOOP_INFO (loop);
7984 struct loop_regs *regs = LOOP_REGS (loop);
7985 struct loop_ivs *ivs = LOOP_IVS (loop);
7986 struct iv_class *bl;
7987 rtx reg;
7988 enum machine_mode mode;
7989 rtx jump_label;
7990 rtx final_value;
7991 rtx start_value;
7992 rtx new_add_val;
7993 rtx comparison;
7994 rtx before_comparison;
7995 rtx p;
7996 rtx jump;
7997 rtx first_compare;
7998 int compare_and_branch;
7999 rtx loop_start = loop->start;
8000 rtx loop_end = loop->end;
8001
8002 /* If last insn is a conditional branch, and the insn before tests a
8003 register value, try to optimize it. Otherwise, we can't do anything. */
8004
8005 jump = PREV_INSN (loop_end);
8006 comparison = get_condition_for_loop (loop, jump);
8007 if (comparison == 0)
8008 return 0;
8009 if (!onlyjump_p (jump))
8010 return 0;
8011
8012 /* Try to compute whether the compare/branch at the loop end is one or
8013 two instructions. */
8014 get_condition (jump, &first_compare, false);
8015 if (first_compare == jump)
8016 compare_and_branch = 1;
8017 else if (first_compare == prev_nonnote_insn (jump))
8018 compare_and_branch = 2;
8019 else
8020 return 0;
8021
8022 {
8023 /* If more than one condition is present to control the loop, then
8024 do not proceed, as this function does not know how to rewrite
8025 loop tests with more than one condition.
8026
8027 Look backwards from the first insn in the last comparison
8028 sequence and see if we've got another comparison sequence. */
8029
8030 rtx jump1;
8031 if ((jump1 = prev_nonnote_insn (first_compare)) != loop->cont)
8032 if (GET_CODE (jump1) == JUMP_INSN)
8033 return 0;
8034 }
8035
8036 /* Check all of the bivs to see if the compare uses one of them.
8037 Skip biv's set more than once because we can't guarantee that
8038 it will be zero on the last iteration. Also skip if the biv is
8039 used between its update and the test insn. */
8040
8041 for (bl = ivs->list; bl; bl = bl->next)
8042 {
8043 if (bl->biv_count == 1
8044 && ! bl->biv->maybe_multiple
8045 && bl->biv->dest_reg == XEXP (comparison, 0)
8046 && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
8047 first_compare))
8048 break;
8049 }
8050
8051 /* Try swapping the comparison to identify a suitable biv. */
8052 if (!bl)
8053 for (bl = ivs->list; bl; bl = bl->next)
8054 if (bl->biv_count == 1
8055 && ! bl->biv->maybe_multiple
8056 && bl->biv->dest_reg == XEXP (comparison, 1)
8057 && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
8058 first_compare))
8059 {
8060 comparison = gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)),
8061 VOIDmode,
8062 XEXP (comparison, 1),
8063 XEXP (comparison, 0));
8064 break;
8065 }
8066
8067 if (! bl)
8068 return 0;
8069
8070 /* Look for the case where the basic induction variable is always
8071 nonnegative, and equals zero on the last iteration.
8072 In this case, add a reg_note REG_NONNEG, which allows the
8073 m68k DBRA instruction to be used. */
8074
8075 if (((GET_CODE (comparison) == GT && XEXP (comparison, 1) == constm1_rtx)
8076 || (GET_CODE (comparison) == NE && XEXP (comparison, 1) == const0_rtx))
8077 && GET_CODE (bl->biv->add_val) == CONST_INT
8078 && INTVAL (bl->biv->add_val) < 0)
8079 {
8080 /* Initial value must be greater than 0,
8081 init_val % -dec_value == 0 to ensure that it equals zero on
8082 the last iteration */
8083
8084 if (GET_CODE (bl->initial_value) == CONST_INT
8085 && INTVAL (bl->initial_value) > 0
8086 && (INTVAL (bl->initial_value)
8087 % (-INTVAL (bl->biv->add_val))) == 0)
8088 {
8089 /* Register always nonnegative, add REG_NOTE to branch. */
8090 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
8091 REG_NOTES (jump)
8092 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
8093 REG_NOTES (jump));
8094 bl->nonneg = 1;
8095
8096 return 1;
8097 }
8098
8099 /* If the decrement is 1 and the value was tested as >= 0 before
8100 the loop, then we can safely optimize. */
8101 for (p = loop_start; p; p = PREV_INSN (p))
8102 {
8103 if (GET_CODE (p) == CODE_LABEL)
8104 break;
8105 if (GET_CODE (p) != JUMP_INSN)
8106 continue;
8107
8108 before_comparison = get_condition_for_loop (loop, p);
8109 if (before_comparison
8110 && XEXP (before_comparison, 0) == bl->biv->dest_reg
8111 && (GET_CODE (before_comparison) == LT
8112 || GET_CODE (before_comparison) == LTU)
8113 && XEXP (before_comparison, 1) == const0_rtx
8114 && ! reg_set_between_p (bl->biv->dest_reg, p, loop_start)
8115 && INTVAL (bl->biv->add_val) == -1)
8116 {
8117 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
8118 REG_NOTES (jump)
8119 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
8120 REG_NOTES (jump));
8121 bl->nonneg = 1;
8122
8123 return 1;
8124 }
8125 }
8126 }
8127 else if (GET_CODE (bl->biv->add_val) == CONST_INT
8128 && INTVAL (bl->biv->add_val) > 0)
8129 {
8130 /* Try to change inc to dec, so can apply above optimization. */
8131 /* Can do this if:
8132 all registers modified are induction variables or invariant,
8133 all memory references have non-overlapping addresses
8134 (obviously true if only one write)
8135 allow 2 insns for the compare/jump at the end of the loop. */
8136 /* Also, we must avoid any instructions which use both the reversed
8137 biv and another biv. Such instructions will fail if the loop is
8138 reversed. We meet this condition by requiring that either
8139 no_use_except_counting is true, or else that there is only
8140 one biv. */
8141 int num_nonfixed_reads = 0;
8142 /* 1 if the iteration var is used only to count iterations. */
8143 int no_use_except_counting = 0;
8144 /* 1 if the loop has no memory store, or it has a single memory store
8145 which is reversible. */
8146 int reversible_mem_store = 1;
8147
8148 if (bl->giv_count == 0
8149 && !loop->exit_count
8150 && !loop_info->has_multiple_exit_targets)
8151 {
8152 rtx bivreg = regno_reg_rtx[bl->regno];
8153 struct iv_class *blt;
8154
8155 /* If there are no givs for this biv, and the only exit is the
8156 fall through at the end of the loop, then
8157 see if perhaps there are no uses except to count. */
8158 no_use_except_counting = 1;
8159 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8160 if (INSN_P (p))
8161 {
8162 rtx set = single_set (p);
8163
8164 if (set && GET_CODE (SET_DEST (set)) == REG
8165 && REGNO (SET_DEST (set)) == bl->regno)
8166 /* An insn that sets the biv is okay. */
8167 ;
8168 else if (!reg_mentioned_p (bivreg, PATTERN (p)))
8169 /* An insn that doesn't mention the biv is okay. */
8170 ;
8171 else if (p == prev_nonnote_insn (prev_nonnote_insn (loop_end))
8172 || p == prev_nonnote_insn (loop_end))
8173 {
8174 /* If either of these insns uses the biv and sets a pseudo
8175 that has more than one usage, then the biv has uses
8176 other than counting since it's used to derive a value
8177 that is used more than one time. */
8178 note_stores (PATTERN (p), note_set_pseudo_multiple_uses,
8179 regs);
8180 if (regs->multiple_uses)
8181 {
8182 no_use_except_counting = 0;
8183 break;
8184 }
8185 }
8186 else
8187 {
8188 no_use_except_counting = 0;
8189 break;
8190 }
8191 }
8192
8193 /* A biv has uses besides counting if it is used to set
8194 another biv. */
8195 for (blt = ivs->list; blt; blt = blt->next)
8196 if (blt->init_set
8197 && reg_mentioned_p (bivreg, SET_SRC (blt->init_set)))
8198 {
8199 no_use_except_counting = 0;
8200 break;
8201 }
8202 }
8203
8204 if (no_use_except_counting)
8205 /* No need to worry about MEMs. */
8206 ;
8207 else if (loop_info->num_mem_sets <= 1)
8208 {
8209 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8210 if (INSN_P (p))
8211 num_nonfixed_reads += count_nonfixed_reads (loop, PATTERN (p));
8212
8213 /* If the loop has a single store, and the destination address is
8214 invariant, then we can't reverse the loop, because this address
8215 might then have the wrong value at loop exit.
8216 This would work if the source were invariant also; however, in that
8217 case, the insn should have been moved out of the loop. */
8218
8219 if (loop_info->num_mem_sets == 1)
8220 {
8221 struct induction *v;
8222
8223 /* If we could prove that each of the memory locations
8224 written to was different, then we could reverse the
8225 store -- but we don't presently have any way of
8226 knowing that. */
8227 reversible_mem_store = 0;
8228
8229 /* If the store depends on a register that is set after the
8230 store, it depends on the initial value, and is thus not
8231 reversible. */
8232 for (v = bl->giv; reversible_mem_store && v; v = v->next_iv)
8233 {
8234 if (v->giv_type == DEST_REG
8235 && reg_mentioned_p (v->dest_reg,
8236 PATTERN (loop_info->first_loop_store_insn))
8237 && loop_insn_first_p (loop_info->first_loop_store_insn,
8238 v->insn))
8239 reversible_mem_store = 0;
8240 }
8241 }
8242 }
8243 else
8244 return 0;
8245
8246 /* This code only acts for innermost loops. Also it simplifies
8247 the memory address check by only reversing loops with
8248 zero or one memory access.
8249 Two memory accesses could involve parts of the same array,
8250 and that can't be reversed.
8251 If the biv is used only for counting, then we don't need to worry
8252 about all these things. */
8253
8254 if ((num_nonfixed_reads <= 1
8255 && ! loop_info->has_nonconst_call
8256 && ! loop_info->has_prefetch
8257 && ! loop_info->has_volatile
8258 && reversible_mem_store
8259 && (bl->giv_count + bl->biv_count + loop_info->num_mem_sets
8260 + num_unmoved_movables (loop) + compare_and_branch == insn_count)
8261 && (bl == ivs->list && bl->next == 0))
8262 || (no_use_except_counting && ! loop_info->has_prefetch))
8263 {
8264 rtx tem;
8265
8266 /* Loop can be reversed. */
8267 if (loop_dump_stream)
8268 fprintf (loop_dump_stream, "Can reverse loop\n");
8269
8270 /* Now check other conditions:
8271
8272 The increment must be a constant, as must the initial value,
8273 and the comparison code must be LT.
8274
8275 This test can probably be improved since +/- 1 in the constant
8276 can be obtained by changing LT to LE and vice versa; this is
8277 confusing. */
8278
8279 if (comparison
8280 /* for constants, LE gets turned into LT */
8281 && (GET_CODE (comparison) == LT
8282 || (GET_CODE (comparison) == LE
8283 && no_use_except_counting)
8284 || GET_CODE (comparison) == LTU))
8285 {
8286 HOST_WIDE_INT add_val, add_adjust, comparison_val = 0;
8287 rtx initial_value, comparison_value;
8288 int nonneg = 0;
8289 enum rtx_code cmp_code;
8290 int comparison_const_width;
8291 unsigned HOST_WIDE_INT comparison_sign_mask;
8292
8293 add_val = INTVAL (bl->biv->add_val);
8294 comparison_value = XEXP (comparison, 1);
8295 if (GET_MODE (comparison_value) == VOIDmode)
8296 comparison_const_width
8297 = GET_MODE_BITSIZE (GET_MODE (XEXP (comparison, 0)));
8298 else
8299 comparison_const_width
8300 = GET_MODE_BITSIZE (GET_MODE (comparison_value));
8301 if (comparison_const_width > HOST_BITS_PER_WIDE_INT)
8302 comparison_const_width = HOST_BITS_PER_WIDE_INT;
8303 comparison_sign_mask
8304 = (unsigned HOST_WIDE_INT) 1 << (comparison_const_width - 1);
8305
8306 /* If the comparison value is not a loop invariant, then we
8307 cannot reverse this loop.
8308
8309 ??? If the insns which initialize the comparison value as
8310 a whole compute an invariant result, then we could move
8311 them out of the loop and proceed with loop reversal. */
8312 if (! loop_invariant_p (loop, comparison_value))
8313 return 0;
8314
8315 if (GET_CODE (comparison_value) == CONST_INT)
8316 comparison_val = INTVAL (comparison_value);
8317 initial_value = bl->initial_value;
8318
8319 /* Normalize the initial value if it is an integer and
8320 has no other use except as a counter. This will allow
8321 a few more loops to be reversed. */
8322 if (no_use_except_counting
8323 && GET_CODE (comparison_value) == CONST_INT
8324 && GET_CODE (initial_value) == CONST_INT)
8325 {
8326 comparison_val = comparison_val - INTVAL (bl->initial_value);
8327 /* The code below requires comparison_val to be a multiple
8328 of add_val in order to do the loop reversal, so
8329 round up comparison_val to a multiple of add_val.
8330 Since comparison_value is constant, we know that the
8331 current comparison code is LT. */
8332 comparison_val = comparison_val + add_val - 1;
8333 comparison_val
8334 -= (unsigned HOST_WIDE_INT) comparison_val % add_val;
8335 /* We postpone overflow checks for COMPARISON_VAL here;
8336 even if there is an overflow, we might still be able to
8337 reverse the loop, if converting the loop exit test to
8338 NE is possible. */
8339 initial_value = const0_rtx;
8340 }
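/* For illustration (hypothetical constants): with initial value 3,
   comparison value 17 and add_val 4, comparison_val becomes 17 - 3 = 14,
   rounded up to the next multiple of 4, i.e. 16, and the initial value
   is treated as 0; either way the loop runs four times.  */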
8341
8342 /* First check if we can do a vanilla loop reversal. */
8343 if (initial_value == const0_rtx
8344 /* If we have a decrement_and_branch_on_count,
8345 prefer the NE test, since this will allow that
8346 instruction to be generated. Note that we must
8347 use a vanilla loop reversal if the biv is used to
8348 calculate a giv or has a non-counting use. */
8349 #if ! defined (HAVE_decrement_and_branch_until_zero) \
8350 && defined (HAVE_decrement_and_branch_on_count)
8351 && (! (add_val == 1 && loop->vtop
8352 && (bl->biv_count == 0
8353 || no_use_except_counting)))
8354 #endif
8355 && GET_CODE (comparison_value) == CONST_INT
8356 /* Now do postponed overflow checks on COMPARISON_VAL. */
8357 && ! (((comparison_val - add_val) ^ INTVAL (comparison_value))
8358 & comparison_sign_mask))
8359 {
8360 /* Register will always be nonnegative, with value
8361 0 on last iteration */
8362 add_adjust = add_val;
8363 nonneg = 1;
8364 cmp_code = GE;
8365 }
8366 else if (add_val == 1 && loop->vtop
8367 && (bl->biv_count == 0
8368 || no_use_except_counting))
8369 {
8370 add_adjust = 0;
8371 cmp_code = NE;
8372 }
8373 else
8374 return 0;
8375
8376 if (GET_CODE (comparison) == LE)
8377 add_adjust -= add_val;
8378
8379 /* If the initial value is not zero, or if the comparison
8380 value is not an exact multiple of the increment, then we
8381 cannot reverse this loop. */
8382 if (initial_value == const0_rtx
8383 && GET_CODE (comparison_value) == CONST_INT)
8384 {
8385 if (((unsigned HOST_WIDE_INT) comparison_val % add_val) != 0)
8386 return 0;
8387 }
8388 else
8389 {
8390 if (! no_use_except_counting || add_val != 1)
8391 return 0;
8392 }
8393
8394 final_value = comparison_value;
8395
8396 /* Reset these in case we normalized the initial value
8397 and comparison value above. */
8398 if (GET_CODE (comparison_value) == CONST_INT
8399 && GET_CODE (initial_value) == CONST_INT)
8400 {
8401 comparison_value = GEN_INT (comparison_val);
8402 final_value
8403 = GEN_INT (comparison_val + INTVAL (bl->initial_value));
8404 }
8405 bl->initial_value = initial_value;
8406
8407 /* Save some info needed to produce the new insns. */
8408 reg = bl->biv->dest_reg;
8409 mode = GET_MODE (reg);
8410 jump_label = condjump_label (PREV_INSN (loop_end));
8411 new_add_val = GEN_INT (-INTVAL (bl->biv->add_val));
8412
8413 /* Set start_value; if this is not a CONST_INT, we need
8414 to generate a SUB.
8415 Initialize biv to start_value before loop start.
8416 The old initializing insn will be deleted as a
8417 dead store by flow.c. */
8418 if (initial_value == const0_rtx
8419 && GET_CODE (comparison_value) == CONST_INT)
8420 {
8421 start_value
8422 = gen_int_mode (comparison_val - add_adjust, mode);
8423 loop_insn_hoist (loop, gen_move_insn (reg, start_value));
8424 }
8425 else if (GET_CODE (initial_value) == CONST_INT)
8426 {
8427 rtx offset = GEN_INT (-INTVAL (initial_value) - add_adjust);
8428 rtx add_insn = gen_add3_insn (reg, comparison_value, offset);
8429
8430 if (add_insn == 0)
8431 return 0;
8432
8433 start_value
8434 = gen_rtx_PLUS (mode, comparison_value, offset);
8435 loop_insn_hoist (loop, add_insn);
8436 if (GET_CODE (comparison) == LE)
8437 final_value = gen_rtx_PLUS (mode, comparison_value,
8438 GEN_INT (add_val));
8439 }
8440 else if (! add_adjust)
8441 {
8442 rtx sub_insn = gen_sub3_insn (reg, comparison_value,
8443 initial_value);
8444
8445 if (sub_insn == 0)
8446 return 0;
8447 start_value
8448 = gen_rtx_MINUS (mode, comparison_value, initial_value);
8449 loop_insn_hoist (loop, sub_insn);
8450 }
8451 else
8452 /* We could handle the other cases too, but it'll be
8453 better to have a testcase first. */
8454 return 0;
8455
8456 /* We may not have a single insn which can increment a reg, so
8457 create a sequence to hold all the insns from expand_inc. */
8458 start_sequence ();
8459 expand_inc (reg, new_add_val);
8460 tem = get_insns ();
8461 end_sequence ();
8462
8463 p = loop_insn_emit_before (loop, 0, bl->biv->insn, tem);
8464 delete_insn (bl->biv->insn);
8465
8466 /* Update biv info to reflect its new status. */
8467 bl->biv->insn = p;
8468 bl->initial_value = start_value;
8469 bl->biv->add_val = new_add_val;
8470
8471 /* Update loop info. */
8472 loop_info->initial_value = reg;
8473 loop_info->initial_equiv_value = reg;
8474 loop_info->final_value = const0_rtx;
8475 loop_info->final_equiv_value = const0_rtx;
8476 loop_info->comparison_value = const0_rtx;
8477 loop_info->comparison_code = cmp_code;
8478 loop_info->increment = new_add_val;
8479
8480 /* Inc LABEL_NUSES so that delete_insn will
8481 not delete the label. */
8482 LABEL_NUSES (XEXP (jump_label, 0))++;
8483
8484 /* Emit an insn after the end of the loop to set the biv's
8485 proper exit value if it is used anywhere outside the loop. */
8486 if ((REGNO_LAST_UID (bl->regno) != INSN_UID (first_compare))
8487 || ! bl->init_insn
8488 || REGNO_FIRST_UID (bl->regno) != INSN_UID (bl->init_insn))
8489 loop_insn_sink (loop, gen_load_of_final_value (reg, final_value));
8490
8491 /* Delete compare/branch at end of loop. */
8492 delete_related_insns (PREV_INSN (loop_end));
8493 if (compare_and_branch == 2)
8494 delete_related_insns (first_compare);
8495
8496 /* Add new compare/branch insn at end of loop. */
8497 start_sequence ();
8498 emit_cmp_and_jump_insns (reg, const0_rtx, cmp_code, NULL_RTX,
8499 mode, 0,
8500 XEXP (jump_label, 0));
8501 tem = get_insns ();
8502 end_sequence ();
8503 emit_jump_insn_before (tem, loop_end);
8504
8505 for (tem = PREV_INSN (loop_end);
8506 tem && GET_CODE (tem) != JUMP_INSN;
8507 tem = PREV_INSN (tem))
8508 ;
8509
8510 if (tem)
8511 JUMP_LABEL (tem) = XEXP (jump_label, 0);
8512
8513 if (nonneg)
8514 {
8515 if (tem)
8516 {
8517 /* Increment of LABEL_NUSES done above. */
8518 /* Register is now always nonnegative,
8519 so add REG_NONNEG note to the branch. */
8520 REG_NOTES (tem) = gen_rtx_EXPR_LIST (REG_NONNEG, reg,
8521 REG_NOTES (tem));
8522 }
8523 bl->nonneg = 1;
8524 }
8525
8526 /* No insn may reference both the reversed and another biv or it
8527 will fail (see comment near the top of the loop reversal
8528 code).
8529 Earlier on, we have verified that the biv has no use except
8530 counting, or it is the only biv in this function.
8531 However, the code that computes no_use_except_counting does
8532 not verify reg notes. It's possible to have an insn that
8533 references another biv, and has a REG_EQUAL note with an
8534 expression based on the reversed biv. To avoid this case,
8535 remove all REG_EQUAL notes based on the reversed biv
8536 here. */
8537 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8538 if (INSN_P (p))
8539 {
8540 rtx *pnote;
8541 rtx set = single_set (p);
8542 /* If this is a set of a GIV based on the reversed biv, any
8543 REG_EQUAL notes should still be correct. */
8544 if (! set
8545 || GET_CODE (SET_DEST (set)) != REG
8546 || (size_t) REGNO (SET_DEST (set)) >= ivs->n_regs
8547 || REG_IV_TYPE (ivs, REGNO (SET_DEST (set))) != GENERAL_INDUCT
8548 || REG_IV_INFO (ivs, REGNO (SET_DEST (set)))->src_reg != bl->biv->src_reg)
8549 for (pnote = &REG_NOTES (p); *pnote;)
8550 {
8551 if (REG_NOTE_KIND (*pnote) == REG_EQUAL
8552 && reg_mentioned_p (regno_reg_rtx[bl->regno],
8553 XEXP (*pnote, 0)))
8554 *pnote = XEXP (*pnote, 1);
8555 else
8556 pnote = &XEXP (*pnote, 1);
8557 }
8558 }
8559
8560 /* Mark that this biv has been reversed. Each giv which depends
8561 on this biv, and which is also live past the end of the loop
8562 will have to be fixed up. */
8563
8564 bl->reversed = 1;
8565
8566 if (loop_dump_stream)
8567 {
8568 fprintf (loop_dump_stream, "Reversed loop");
8569 if (bl->nonneg)
8570 fprintf (loop_dump_stream, " and added reg_nonneg\n");
8571 else
8572 fprintf (loop_dump_stream, "\n");
8573 }
8574
8575 return 1;
8576 }
8577 }
8578 }
8579
8580 return 0;
8581 }
8582 \f
8583 /* Verify whether the biv BL appears to be eliminable,
8584 based on the insns in the loop that refer to it.
8585
8586 If ELIMINATE_P is nonzero, actually do the elimination.
8587
8588 THRESHOLD and INSN_COUNT are from loop_optimize and are used to
8589 determine whether invariant insns should be placed inside or at the
8590 start of the loop. */
8591
8592 static int
8593 maybe_eliminate_biv (const struct loop *loop, struct iv_class *bl,
8594 int eliminate_p, int threshold, int insn_count)
8595 {
8596 struct loop_ivs *ivs = LOOP_IVS (loop);
8597 rtx reg = bl->biv->dest_reg;
8598 rtx p;
8599
8600 /* Scan all insns in the loop, stopping if we find one that uses the
8601 biv in a way that we cannot eliminate. */
8602
8603 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
8604 {
8605 enum rtx_code code = GET_CODE (p);
8606 basic_block where_bb = 0;
8607 rtx where_insn = threshold >= insn_count ? 0 : p;
8608 rtx note;
8609
8610 /* If this is a libcall that sets a giv, skip ahead to its end. */
8611 if (INSN_P (p))
8612 {
8613 note = find_reg_note (p, REG_LIBCALL, NULL_RTX);
8614
8615 if (note)
8616 {
8617 rtx last = XEXP (note, 0);
8618 rtx set = single_set (last);
8619
8620 if (set && GET_CODE (SET_DEST (set)) == REG)
8621 {
8622 unsigned int regno = REGNO (SET_DEST (set));
8623
8624 if (regno < ivs->n_regs
8625 && REG_IV_TYPE (ivs, regno) == GENERAL_INDUCT
8626 && REG_IV_INFO (ivs, regno)->src_reg == bl->biv->src_reg)
8627 p = last;
8628 }
8629 }
8630 }
8631
8632 /* Closely examine the insn if the biv is mentioned. */
8633 if ((code == INSN || code == JUMP_INSN || code == CALL_INSN)
8634 && reg_mentioned_p (reg, PATTERN (p))
8635 && ! maybe_eliminate_biv_1 (loop, PATTERN (p), p, bl,
8636 eliminate_p, where_bb, where_insn))
8637 {
8638 if (loop_dump_stream)
8639 fprintf (loop_dump_stream,
8640 "Cannot eliminate biv %d: biv used in insn %d.\n",
8641 bl->regno, INSN_UID (p));
8642 break;
8643 }
8644
8645 /* If we are eliminating, kill REG_EQUAL notes mentioning the biv. */
8646 if (eliminate_p
8647 && (note = find_reg_note (p, REG_EQUAL, NULL_RTX)) != NULL_RTX
8648 && reg_mentioned_p (reg, XEXP (note, 0)))
8649 remove_note (p, note);
8650 }
8651
8652 if (p == loop->end)
8653 {
8654 if (loop_dump_stream)
8655 fprintf (loop_dump_stream, "biv %d %s eliminated.\n",
8656 bl->regno, eliminate_p ? "was" : "can be");
8657 return 1;
8658 }
8659
8660 return 0;
8661 }
8662 \f
8663 /* INSN and REFERENCE are instructions in the same insn chain.
8664 Return nonzero if INSN is first. */
8665
8666 int
8667 loop_insn_first_p (rtx insn, rtx reference)
8668 {
8669 rtx p, q;
8670
8671 for (p = insn, q = reference;;)
8672 {
8673 /* Start with test for not first so that INSN == REFERENCE yields not
8674 first. */
8675 if (q == insn || ! p)
8676 return 0;
8677 if (p == reference || ! q)
8678 return 1;
8679
8680 /* Either of P or Q might be a NOTE. Notes have the same LUID as the
8681 previous insn, hence the <= comparison below does not work if
8682 P is a note. */
8683 if (INSN_UID (p) < max_uid_for_loop
8684 && INSN_UID (q) < max_uid_for_loop
8685 && GET_CODE (p) != NOTE)
8686 return INSN_LUID (p) <= INSN_LUID (q);
8687
8688 if (INSN_UID (p) >= max_uid_for_loop
8689 || GET_CODE (p) == NOTE)
8690 p = NEXT_INSN (p);
8691 if (INSN_UID (q) >= max_uid_for_loop)
8692 q = NEXT_INSN (q);
8693 }
8694 }
8695
8696 /* We are trying to eliminate BIV in INSN using GIV. Return nonzero if
8697 the offset that we have to take into account due to auto-increment /
8698 div derivation is zero. */
8699 static int
8700 biv_elimination_giv_has_0_offset (struct induction *biv,
8701 struct induction *giv, rtx insn)
8702 {
8703 /* If the giv V had the auto-inc address optimization applied
8704 to it, and INSN occurs between the giv insn and the biv
8705 insn, then we'd have to adjust the value used here.
8706 This is rare, so we don't bother to make this possible. */
8707 if (giv->auto_inc_opt
8708 && ((loop_insn_first_p (giv->insn, insn)
8709 && loop_insn_first_p (insn, biv->insn))
8710 || (loop_insn_first_p (biv->insn, insn)
8711 && loop_insn_first_p (insn, giv->insn))))
8712 return 0;
8713
8714 return 1;
8715 }
8716
8717 /* If BL appears in X (part of the pattern of INSN), see if we can
8718 eliminate its use. If so, return 1. If not, return 0.
8719
8720 If BIV does not appear in X, return 1.
8721
8722 If ELIMINATE_P is nonzero, actually do the elimination.
8723 WHERE_INSN/WHERE_BB indicate where extra insns should be added.
8724 Depending on how many items have been moved out of the loop, it
8725 will either be before INSN (when WHERE_INSN is nonzero) or at the
8726 start of the loop (when WHERE_INSN is zero). */
8727
8728 static int
8729 maybe_eliminate_biv_1 (const struct loop *loop, rtx x, rtx insn,
8730 struct iv_class *bl, int eliminate_p,
8731 basic_block where_bb, rtx where_insn)
8732 {
8733 enum rtx_code code = GET_CODE (x);
8734 rtx reg = bl->biv->dest_reg;
8735 enum machine_mode mode = GET_MODE (reg);
8736 struct induction *v;
8737 rtx arg, tem;
8738 #ifdef HAVE_cc0
8739 rtx new;
8740 #endif
8741 int arg_operand;
8742 const char *fmt;
8743 int i, j;
8744
8745 switch (code)
8746 {
8747 case REG:
8748 /* If we haven't already been able to do something with this BIV,
8749 we can't eliminate it. */
8750 if (x == reg)
8751 return 0;
8752 return 1;
8753
8754 case SET:
8755 /* If this sets the BIV, it is not a problem. */
8756 if (SET_DEST (x) == reg)
8757 return 1;
8758
8759 /* If this is an insn that defines a giv, it is also ok because
8760 it will go away when the giv is reduced. */
8761 for (v = bl->giv; v; v = v->next_iv)
8762 if (v->giv_type == DEST_REG && SET_DEST (x) == v->dest_reg)
8763 return 1;
8764
8765 #ifdef HAVE_cc0
8766 if (SET_DEST (x) == cc0_rtx && SET_SRC (x) == reg)
8767 {
8768 /* Can replace with any giv that was reduced and
8769 that has (MULT_VAL != 0) and (ADD_VAL == 0).
8770 Require a constant for MULT_VAL, so we know it's nonzero.
8771 ??? We disable this optimization to avoid potential
8772 overflows. */
8773
8774 for (v = bl->giv; v; v = v->next_iv)
8775 if (GET_CODE (v->mult_val) == CONST_INT && v->mult_val != const0_rtx
8776 && v->add_val == const0_rtx
8777 && ! v->ignore && ! v->maybe_dead && v->always_computable
8778 && v->mode == mode
8779 && 0)
8780 {
8781 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8782 continue;
8783
8784 if (! eliminate_p)
8785 return 1;
8786
8787 /* If the giv has the opposite direction of change,
8788 then reverse the comparison. */
8789 if (INTVAL (v->mult_val) < 0)
8790 new = gen_rtx_COMPARE (GET_MODE (v->new_reg),
8791 const0_rtx, v->new_reg);
8792 else
8793 new = v->new_reg;
8794
8795 /* We can probably test that giv's reduced reg. */
8796 if (validate_change (insn, &SET_SRC (x), new, 0))
8797 return 1;
8798 }
8799
8800 /* Look for a giv with (MULT_VAL != 0) and (ADD_VAL != 0);
8801 replace test insn with a compare insn (cmp REDUCED_GIV ADD_VAL).
8802 Require a constant for MULT_VAL, so we know it's nonzero.
8803 ??? Do this only if ADD_VAL is a pointer to avoid a potential
8804 overflow problem. */
8805
8806 for (v = bl->giv; v; v = v->next_iv)
8807 if (GET_CODE (v->mult_val) == CONST_INT
8808 && v->mult_val != const0_rtx
8809 && ! v->ignore && ! v->maybe_dead && v->always_computable
8810 && v->mode == mode
8811 && (GET_CODE (v->add_val) == SYMBOL_REF
8812 || GET_CODE (v->add_val) == LABEL_REF
8813 || GET_CODE (v->add_val) == CONST
8814 || (GET_CODE (v->add_val) == REG
8815 && REG_POINTER (v->add_val))))
8816 {
8817 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8818 continue;
8819
8820 if (! eliminate_p)
8821 return 1;
8822
8823 /* If the giv has the opposite direction of change,
8824 then reverse the comparison. */
8825 if (INTVAL (v->mult_val) < 0)
8826 new = gen_rtx_COMPARE (VOIDmode, copy_rtx (v->add_val),
8827 v->new_reg);
8828 else
8829 new = gen_rtx_COMPARE (VOIDmode, v->new_reg,
8830 copy_rtx (v->add_val));
8831
8832 /* Replace biv with the giv's reduced register. */
8833 update_reg_last_use (v->add_val, insn);
8834 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8835 return 1;
8836
8837 /* The insn doesn't support that constant or invariant. Copy it
8838 into a register (it will be a loop invariant). */
8839 tem = gen_reg_rtx (GET_MODE (v->new_reg));
8840
8841 loop_insn_emit_before (loop, 0, where_insn,
8842 gen_move_insn (tem,
8843 copy_rtx (v->add_val)));
8844
8845 /* Substitute the new register for its invariant value in
8846 the compare expression. */
8847 XEXP (new, (INTVAL (v->mult_val) < 0) ? 0 : 1) = tem;
8848 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8849 return 1;
8850 }
8851 }
8852 #endif
8853 break;
8854
8855 case COMPARE:
8856 case EQ: case NE:
8857 case GT: case GE: case GTU: case GEU:
8858 case LT: case LE: case LTU: case LEU:
8859 /* See if either argument is the biv. */
8860 if (XEXP (x, 0) == reg)
8861 arg = XEXP (x, 1), arg_operand = 1;
8862 else if (XEXP (x, 1) == reg)
8863 arg = XEXP (x, 0), arg_operand = 0;
8864 else
8865 break;
8866
8867 if (CONSTANT_P (arg))
8868 {
8869 /* First try to replace with any giv that has constant positive
8870 mult_val and constant add_val. We might be able to support
8871 negative mult_val, but it seems complex to do it in general. */
8872
8873 for (v = bl->giv; v; v = v->next_iv)
8874 if (GET_CODE (v->mult_val) == CONST_INT
8875 && INTVAL (v->mult_val) > 0
8876 && (GET_CODE (v->add_val) == SYMBOL_REF
8877 || GET_CODE (v->add_val) == LABEL_REF
8878 || GET_CODE (v->add_val) == CONST
8879 || (GET_CODE (v->add_val) == REG
8880 && REG_POINTER (v->add_val)))
8881 && ! v->ignore && ! v->maybe_dead && v->always_computable
8882 && v->mode == mode)
8883 {
8884 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8885 continue;
8886
8887 /* Don't eliminate if the linear combination that makes up
8888 the giv overflows when it is applied to ARG. */
8889 if (GET_CODE (arg) == CONST_INT)
8890 {
8891 rtx add_val;
8892
8893 if (GET_CODE (v->add_val) == CONST_INT)
8894 add_val = v->add_val;
8895 else
8896 add_val = const0_rtx;
8897
8898 if (const_mult_add_overflow_p (arg, v->mult_val,
8899 add_val, mode, 1))
8900 continue;
8901 }
8902
8903 if (! eliminate_p)
8904 return 1;
8905
8906 /* Replace biv with the giv's reduced reg. */
8907 validate_change (insn, &XEXP (x, 1 - arg_operand), v->new_reg, 1);
8908
8909 /* If all constants are actually constant integers and
8910 the derived constant can be directly placed in the COMPARE,
8911 do so. */
8912 if (GET_CODE (arg) == CONST_INT
8913 && GET_CODE (v->add_val) == CONST_INT)
8914 {
8915 tem = expand_mult_add (arg, NULL_RTX, v->mult_val,
8916 v->add_val, mode, 1);
8917 }
8918 else
8919 {
8920 /* Otherwise, load it into a register. */
8921 tem = gen_reg_rtx (mode);
8922 loop_iv_add_mult_emit_before (loop, arg,
8923 v->mult_val, v->add_val,
8924 tem, where_bb, where_insn);
8925 }
8926
8927 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
8928
8929 if (apply_change_group ())
8930 return 1;
8931 }
8932
8933 /* Look for giv with positive constant mult_val and nonconst add_val.
8934 Insert insns to calculate new compare value.
8935 ??? Turn this off due to possible overflow. */
8936
8937 for (v = bl->giv; v; v = v->next_iv)
8938 if (GET_CODE (v->mult_val) == CONST_INT
8939 && INTVAL (v->mult_val) > 0
8940 && ! v->ignore && ! v->maybe_dead && v->always_computable
8941 && v->mode == mode
8942 && 0)
8943 {
8944 rtx tem;
8945
8946 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8947 continue;
8948
8949 if (! eliminate_p)
8950 return 1;
8951
8952 tem = gen_reg_rtx (mode);
8953
8954 /* Replace biv with giv's reduced register. */
8955 validate_change (insn, &XEXP (x, 1 - arg_operand),
8956 v->new_reg, 1);
8957
8958 /* Compute value to compare against. */
8959 loop_iv_add_mult_emit_before (loop, arg,
8960 v->mult_val, v->add_val,
8961 tem, where_bb, where_insn);
8962 /* Use it in this insn. */
8963 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
8964 if (apply_change_group ())
8965 return 1;
8966 }
8967 }
8968 else if (GET_CODE (arg) == REG || GET_CODE (arg) == MEM)
8969 {
8970 if (loop_invariant_p (loop, arg) == 1)
8971 {
8972 /* Look for giv with constant positive mult_val and nonconst
8973 add_val. Insert insns to compute new compare value.
8974 ??? Turn this off due to possible overflow. */
8975
8976 for (v = bl->giv; v; v = v->next_iv)
8977 if (GET_CODE (v->mult_val) == CONST_INT && INTVAL (v->mult_val) > 0
8978 && ! v->ignore && ! v->maybe_dead && v->always_computable
8979 && v->mode == mode
8980 && 0)
8981 {
8982 rtx tem;
8983
8984 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8985 continue;
8986
8987 if (! eliminate_p)
8988 return 1;
8989
8990 tem = gen_reg_rtx (mode);
8991
8992 /* Replace biv with giv's reduced register. */
8993 validate_change (insn, &XEXP (x, 1 - arg_operand),
8994 v->new_reg, 1);
8995
8996 /* Compute value to compare against. */
8997 loop_iv_add_mult_emit_before (loop, arg,
8998 v->mult_val, v->add_val,
8999 tem, where_bb, where_insn);
9000 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
9001 if (apply_change_group ())
9002 return 1;
9003 }
9004 }
9005
9006 /* This code has problems. Basically, when deciding whether we will
9007 eliminate BL, you can't know whether a particular giv
9008 of ARG will be reduced. If it isn't going to be reduced,
9009 we can't eliminate BL. We can try forcing it to be reduced,
9010 but that can generate poor code.
9011
9012 The problem is that the benefit of reducing TV, below, should
9013 be increased if BL can actually be eliminated, but this means
9014 we might have to do a topological sort of the order in which
9015 we try to process bivs. It doesn't seem worthwhile to do
9016 this sort of thing now. */
9017
9018 #if 0
9019 /* Otherwise the reg compared with had better be a biv. */
9020 if (GET_CODE (arg) != REG
9021 || REG_IV_TYPE (ivs, REGNO (arg)) != BASIC_INDUCT)
9022 return 0;
9023
9024 /* Look for a pair of givs, one for each biv,
9025 with identical coefficients. */
9026 for (v = bl->giv; v; v = v->next_iv)
9027 {
9028 struct induction *tv;
9029
9030 if (v->ignore || v->maybe_dead || v->mode != mode)
9031 continue;
9032
9033 for (tv = REG_IV_CLASS (ivs, REGNO (arg))->giv; tv;
9034 tv = tv->next_iv)
9035 if (! tv->ignore && ! tv->maybe_dead
9036 && rtx_equal_p (tv->mult_val, v->mult_val)
9037 && rtx_equal_p (tv->add_val, v->add_val)
9038 && tv->mode == mode)
9039 {
9040 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
9041 continue;
9042
9043 if (! eliminate_p)
9044 return 1;
9045
9046 /* Replace biv with its giv's reduced reg. */
9047 XEXP (x, 1 - arg_operand) = v->new_reg;
9048 /* Replace other operand with the other giv's
9049 reduced reg. */
9050 XEXP (x, arg_operand) = tv->new_reg;
9051 return 1;
9052 }
9053 }
9054 #endif
9055 }
9056
9057 /* If we get here, the biv can't be eliminated. */
9058 return 0;
9059
9060 case MEM:
9061 /* If this address is a DEST_ADDR giv, it doesn't matter if the
9062 biv is used in it, since it will be replaced. */
9063 for (v = bl->giv; v; v = v->next_iv)
9064 if (v->giv_type == DEST_ADDR && v->location == &XEXP (x, 0))
9065 return 1;
9066 break;
9067
9068 default:
9069 break;
9070 }
9071
9072 /* See if any subexpression fails elimination. */
9073 fmt = GET_RTX_FORMAT (code);
9074 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
9075 {
9076 switch (fmt[i])
9077 {
9078 case 'e':
9079 if (! maybe_eliminate_biv_1 (loop, XEXP (x, i), insn, bl,
9080 eliminate_p, where_bb, where_insn))
9081 return 0;
9082 break;
9083
9084 case 'E':
9085 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
9086 if (! maybe_eliminate_biv_1 (loop, XVECEXP (x, i, j), insn, bl,
9087 eliminate_p, where_bb, where_insn))
9088 return 0;
9089 break;
9090 }
9091 }
9092
9093 return 1;
9094 }
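
/* A rough source-level picture of what a successful biv elimination in a
   comparison buys us (a sketch only; the variable names are made up):

	int i;  char *p = a;             char *p = a;
	for (i = 0; i < n; i++)    =>    for (; p < a + n; p++)
	  *p++ = 0;                        *p = 0;

   Here i is the biv and p is a giv of i; once the exit test is rewritten
   in terms of p (i.e. compared against a + n), i has no remaining uses and
   its increment can be removed entirely. */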
9095 \f
9096 /* Return nonzero if the last use of REG
9097 is in an insn following INSN in the same basic block. */
9098
9099 static int
9100 last_use_this_basic_block (rtx reg, rtx insn)
9101 {
9102 rtx n;
9103 for (n = insn;
9104 n && GET_CODE (n) != CODE_LABEL && GET_CODE (n) != JUMP_INSN;
9105 n = NEXT_INSN (n))
9106 {
9107 if (REGNO_LAST_UID (REGNO (reg)) == INSN_UID (n))
9108 return 1;
9109 }
9110 return 0;
9111 }
9112 \f
9113 /* Called via `note_stores' to record the initial value of a biv. Here we
9114 just record the location of the set and process it later. */
9115
9116 static void
9117 record_initial (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
9118 {
9119 struct loop_ivs *ivs = (struct loop_ivs *) data;
9120 struct iv_class *bl;
9121
9122 if (GET_CODE (dest) != REG
9123 || REGNO (dest) >= ivs->n_regs
9124 || REG_IV_TYPE (ivs, REGNO (dest)) != BASIC_INDUCT)
9125 return;
9126
9127 bl = REG_IV_CLASS (ivs, REGNO (dest));
9128
9129 /* If this is the first set found, record it. */
9130 if (bl->init_insn == 0)
9131 {
9132 bl->init_insn = note_insn;
9133 bl->init_set = set;
9134 }
9135 }
9136 \f
9137 /* If any of the registers in X are "old" and currently have a last use earlier
9138 than INSN, update them to have a last use of INSN. Their actual last use
9139 will be the previous insn but it will not have a valid uid_luid so we can't
9140 use it. X must be a source expression only. */
9141
9142 static void
9143 update_reg_last_use (rtx x, rtx insn)
9144 {
9145 /* Check for the case where INSN does not have a valid luid. In this case,
9146 there is no need to modify the regno_last_uid, as this can only happen
9147 when code is inserted after the loop_end to set a pseudo's final value,
9148 and hence this insn will never be the last use of x.
9149 ???? This comment is not correct. See for example loop_givs_reduce.
9150 This may insert an insn before another new insn. */
9151 if (GET_CODE (x) == REG && REGNO (x) < max_reg_before_loop
9152 && INSN_UID (insn) < max_uid_for_loop
9153 && REGNO_LAST_LUID (REGNO (x)) < INSN_LUID (insn))
9154 {
9155 REGNO_LAST_UID (REGNO (x)) = INSN_UID (insn);
9156 }
9157 else
9158 {
9159 int i, j;
9160 const char *fmt = GET_RTX_FORMAT (GET_CODE (x));
9161 for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--)
9162 {
9163 if (fmt[i] == 'e')
9164 update_reg_last_use (XEXP (x, i), insn);
9165 else if (fmt[i] == 'E')
9166 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
9167 update_reg_last_use (XVECEXP (x, i, j), insn);
9168 }
9169 }
9170 }
9171 \f
9172 /* Given an insn INSN and condition COND, return the condition in a
9173 canonical form to simplify testing by callers. Specifically:
9174
9175 (1) The code will always be a comparison operation (EQ, NE, GT, etc.).
9176 (2) Both operands will be machine operands; (cc0) will have been replaced.
9177 (3) If an operand is a constant, it will be the second operand.
9178 (4) (LE x const) will be replaced with (LT x <const+1>) and similarly
9179 for GE, GEU, and LEU.
9180
9181 If the condition cannot be understood, or is an inequality floating-point
9182 comparison which needs to be reversed, 0 will be returned.
9183
9184 If REVERSE is nonzero, then reverse the condition prior to canonicalizing it.
9185
9186 If EARLIEST is nonzero, it is a pointer to a place where the earliest
9187 insn used in locating the condition was found. If a replacement test
9188 of the condition is desired, it should be placed in front of that
9189 insn and we will be sure that the inputs are still valid.
9190
9191 If WANT_REG is nonzero, we wish the condition to be relative to that
9192 register, if possible. Therefore, do not canonicalize the condition
9193 further. If ALLOW_CC_MODE is nonzero, allow the condition returned
9194 to be a compare to a CC mode register. */
9195
9196 rtx
9197 canonicalize_condition (rtx insn, rtx cond, int reverse, rtx *earliest,
9198 rtx want_reg, int allow_cc_mode)
9199 {
9200 enum rtx_code code;
9201 rtx prev = insn;
9202 rtx set;
9203 rtx tem;
9204 rtx op0, op1;
9205 int reverse_code = 0;
9206 enum machine_mode mode;
9207
9208 code = GET_CODE (cond);
9209 mode = GET_MODE (cond);
9210 op0 = XEXP (cond, 0);
9211 op1 = XEXP (cond, 1);
9212
9213 if (reverse)
9214 code = reversed_comparison_code (cond, insn);
9215 if (code == UNKNOWN)
9216 return 0;
9217
9218 if (earliest)
9219 *earliest = insn;
9220
9221 /* If we are comparing a register with zero, see if the register is set
9222 in the previous insn to a COMPARE or a comparison operation. Perform
9223 the same tests as a function of STORE_FLAG_VALUE as find_comparison_args
9224 in cse.c */
9225
9226 while ((GET_RTX_CLASS (code) == RTX_COMPARE
9227 || GET_RTX_CLASS (code) == RTX_COMM_COMPARE)
9228 && op1 == CONST0_RTX (GET_MODE (op0))
9229 && op0 != want_reg)
9230 {
9231 /* Set nonzero when we find something of interest. */
9232 rtx x = 0;
9233
9234 #ifdef HAVE_cc0
9235 /* If comparison with cc0, import actual comparison from compare
9236 insn. */
9237 if (op0 == cc0_rtx)
9238 {
9239 if ((prev = prev_nonnote_insn (prev)) == 0
9240 || GET_CODE (prev) != INSN
9241 || (set = single_set (prev)) == 0
9242 || SET_DEST (set) != cc0_rtx)
9243 return 0;
9244
9245 op0 = SET_SRC (set);
9246 op1 = CONST0_RTX (GET_MODE (op0));
9247 if (earliest)
9248 *earliest = prev;
9249 }
9250 #endif
9251
9252 /* If this is a COMPARE, pick up the two things being compared. */
9253 if (GET_CODE (op0) == COMPARE)
9254 {
9255 op1 = XEXP (op0, 1);
9256 op0 = XEXP (op0, 0);
9257 continue;
9258 }
9259 else if (GET_CODE (op0) != REG)
9260 break;
9261
9262 /* Go back to the previous insn. Stop if it is not an INSN. We also
9263 stop if it isn't a single set or if it has a REG_INC note because
9264 we don't want to bother dealing with it. */
9265
9266 if ((prev = prev_nonnote_insn (prev)) == 0
9267 || GET_CODE (prev) != INSN
9268 || FIND_REG_INC_NOTE (prev, NULL_RTX))
9269 break;
9270
9271 set = set_of (op0, prev);
9272
9273 if (set
9274 && (GET_CODE (set) != SET
9275 || !rtx_equal_p (SET_DEST (set), op0)))
9276 break;
9277
9278 /* If this is setting OP0, get what it sets it to if it looks
9279 relevant. */
9280 if (set)
9281 {
9282 enum machine_mode inner_mode = GET_MODE (SET_DEST (set));
9283 #ifdef FLOAT_STORE_FLAG_VALUE
9284 REAL_VALUE_TYPE fsfv;
9285 #endif
9286
9287 /* ??? We may not combine comparisons done in a CCmode with
9288 comparisons not done in a CCmode. This is to aid targets
9289 like Alpha that have an IEEE compliant EQ instruction, and
9290 a non-IEEE compliant BEQ instruction. The use of CCmode is
9291 actually artificial, simply to prevent the combination, but
9292 should not affect other platforms.
9293
9294 However, we must allow VOIDmode comparisons to match either
9295 CCmode or non-CCmode comparison, because some ports have
9296 modeless comparisons inside branch patterns.
9297
9298 ??? This mode check should perhaps look more like the mode check
9299 in simplify_comparison in combine. */
9300
9301 if ((GET_CODE (SET_SRC (set)) == COMPARE
9302 || (((code == NE
9303 || (code == LT
9304 && GET_MODE_CLASS (inner_mode) == MODE_INT
9305 && (GET_MODE_BITSIZE (inner_mode)
9306 <= HOST_BITS_PER_WIDE_INT)
9307 && (STORE_FLAG_VALUE
9308 & ((HOST_WIDE_INT) 1
9309 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9310 #ifdef FLOAT_STORE_FLAG_VALUE
9311 || (code == LT
9312 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9313 && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode),
9314 REAL_VALUE_NEGATIVE (fsfv)))
9315 #endif
9316 ))
9317 && COMPARISON_P (SET_SRC (set))))
9318 && (((GET_MODE_CLASS (mode) == MODE_CC)
9319 == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9320 || mode == VOIDmode || inner_mode == VOIDmode))
9321 x = SET_SRC (set);
9322 else if (((code == EQ
9323 || (code == GE
9324 && (GET_MODE_BITSIZE (inner_mode)
9325 <= HOST_BITS_PER_WIDE_INT)
9326 && GET_MODE_CLASS (inner_mode) == MODE_INT
9327 && (STORE_FLAG_VALUE
9328 & ((HOST_WIDE_INT) 1
9329 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9330 #ifdef FLOAT_STORE_FLAG_VALUE
9331 || (code == GE
9332 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9333 && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode),
9334 REAL_VALUE_NEGATIVE (fsfv)))
9335 #endif
9336 ))
9337 && COMPARISON_P (SET_SRC (set))
9338 && (((GET_MODE_CLASS (mode) == MODE_CC)
9339 == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9340 || mode == VOIDmode || inner_mode == VOIDmode))
9341
9342 {
9343 reverse_code = 1;
9344 x = SET_SRC (set);
9345 }
9346 else
9347 break;
9348 }
9349
9350 else if (reg_set_p (op0, prev))
9351 /* If this sets OP0, but not directly, we have to give up. */
9352 break;
9353
9354 if (x)
9355 {
9356 if (COMPARISON_P (x))
9357 code = GET_CODE (x);
9358 if (reverse_code)
9359 {
9360 code = reversed_comparison_code (x, prev);
9361 if (code == UNKNOWN)
9362 return 0;
9363 reverse_code = 0;
9364 }
9365
9366 op0 = XEXP (x, 0), op1 = XEXP (x, 1);
9367 if (earliest)
9368 *earliest = prev;
9369 }
9370 }
9371
9372 /* If constant is first, put it last. */
9373 if (CONSTANT_P (op0))
9374 code = swap_condition (code), tem = op0, op0 = op1, op1 = tem;
9375
9376 /* If OP0 is the result of a comparison, we weren't able to find what
9377 was really being compared, so fail. */
9378 if (!allow_cc_mode
9379 && GET_MODE_CLASS (GET_MODE (op0)) == MODE_CC)
9380 return 0;
9381
9382 /* Canonicalize any ordered comparison with integers involving equality
9383 if we can do computations in the relevant mode and we do not
9384 overflow. */
9385
9386 if (GET_MODE_CLASS (GET_MODE (op0)) != MODE_CC
9387 && GET_CODE (op1) == CONST_INT
9388 && GET_MODE (op0) != VOIDmode
9389 && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT)
9390 {
9391 HOST_WIDE_INT const_val = INTVAL (op1);
9392 unsigned HOST_WIDE_INT uconst_val = const_val;
9393 unsigned HOST_WIDE_INT max_val
9394 = (unsigned HOST_WIDE_INT) GET_MODE_MASK (GET_MODE (op0));
9395
9396 switch (code)
9397 {
9398 case LE:
9399 if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1)
9400 code = LT, op1 = gen_int_mode (const_val + 1, GET_MODE (op0));
9401 break;
9402
9403 /* When cross-compiling, const_val might be sign-extended from
9404 BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */
9405 case GE:
9406 if ((HOST_WIDE_INT) (const_val & max_val)
9407 != (((HOST_WIDE_INT) 1
9408 << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
9409 code = GT, op1 = gen_int_mode (const_val - 1, GET_MODE (op0));
9410 break;
9411
9412 case LEU:
9413 if (uconst_val < max_val)
9414 code = LTU, op1 = gen_int_mode (uconst_val + 1, GET_MODE (op0));
9415 break;
9416
9417 case GEU:
9418 if (uconst_val != 0)
9419 code = GTU, op1 = gen_int_mode (uconst_val - 1, GET_MODE (op0));
9420 break;
9421
9422 default:
9423 break;
9424 }
9425 }
9426
9427 /* Never return CC0; return zero instead. */
9428 if (CC0_P (op0))
9429 return 0;
9430
9431 return gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
9432 }
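
/* A few examples of the canonicalization above (sketches; the operands
   shown are arbitrary):

	(le (reg 100) (const_int 4))   =>  (lt (reg 100) (const_int 5))
	(geu (reg 100) (const_int 1))  =>  (gtu (reg 100) (const_int 0))
	(gt (const_int 0) (reg 100))   =>  (lt (reg 100) (const_int 0))

   The last line shows rule (3): a constant first operand is moved to the
   second position, with the comparison code swapped to compensate. */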
9433
9434 /* Given a jump insn JUMP, return the condition that will cause it to branch
9435 to its JUMP_LABEL. If the condition cannot be understood, or is an
9436 inequality floating-point comparison which needs to be reversed, 0 will
9437 be returned.
9438
9439 If EARLIEST is nonzero, it is a pointer to a place where the earliest
9440 insn used in locating the condition was found. If a replacement test
9441 of the condition is desired, it should be placed in front of that
9442 insn and we will be sure that the inputs are still valid.
9443
9444 If ALLOW_CC_MODE is nonzero, allow the condition returned to be a
9445 compare CC mode register. */
9446
9447 rtx
9448 get_condition (rtx jump, rtx *earliest, int allow_cc_mode)
9449 {
9450 rtx cond;
9451 int reverse;
9452 rtx set;
9453
9454 /* If this is not a standard conditional jump, we can't parse it. */
9455 if (GET_CODE (jump) != JUMP_INSN
9456 || ! any_condjump_p (jump))
9457 return 0;
9458 set = pc_set (jump);
9459
9460 cond = XEXP (SET_SRC (set), 0);
9461
9462 /* If this branches to JUMP_LABEL when the condition is false, reverse
9463 the condition. */
9464 reverse
9465 = GET_CODE (XEXP (SET_SRC (set), 2)) == LABEL_REF
9466 && XEXP (XEXP (SET_SRC (set), 2), 0) == JUMP_LABEL (jump);
9467
9468 return canonicalize_condition (jump, cond, reverse, earliest, NULL_RTX,
9469 allow_cc_mode);
9470 }
9471
9472 /* Similar to above routine, except that we also put an invariant last
9473 unless both operands are invariants. */
9474
9475 rtx
9476 get_condition_for_loop (const struct loop *loop, rtx x)
9477 {
9478 rtx comparison = get_condition (x, (rtx*) 0, false);
9479
9480 if (comparison == 0
9481 || ! loop_invariant_p (loop, XEXP (comparison, 0))
9482 || loop_invariant_p (loop, XEXP (comparison, 1)))
9483 return comparison;
9484
9485 return gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)), VOIDmode,
9486 XEXP (comparison, 1), XEXP (comparison, 0));
9487 }
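
/* For example (a sketch): if the exit test is (gt (reg 100) (reg 99))
   where reg 100 is loop-invariant and reg 99 is the loop counter, the
   result is rewritten as (lt (reg 99) (reg 100)), so callers can rely on
   the loop-variant operand appearing first. */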
9488
9489 /* Scan the function and determine whether it has indirect (computed) jumps.
9490
9491 This is taken mostly from flow.c; similar code exists elsewhere
9492 in the compiler. It may be useful to put this into rtlanal.c. */
9493 static int
9494 indirect_jump_in_function_p (rtx start)
9495 {
9496 rtx insn;
9497
9498 for (insn = start; insn; insn = NEXT_INSN (insn))
9499 if (computed_jump_p (insn))
9500 return 1;
9501
9502 return 0;
9503 }
9504
9505 /* Add MEM to the LOOP_MEMS array, if appropriate. See the
9506 documentation for LOOP_MEMS for the definition of `appropriate'.
9507 This function is called from prescan_loop via for_each_rtx. */
9508
9509 static int
9510 insert_loop_mem (rtx *mem, void *data ATTRIBUTE_UNUSED)
9511 {
9512 struct loop_info *loop_info = data;
9513 int i;
9514 rtx m = *mem;
9515
9516 if (m == NULL_RTX)
9517 return 0;
9518
9519 switch (GET_CODE (m))
9520 {
9521 case MEM:
9522 break;
9523
9524 case CLOBBER:
9525 /* We're not interested in MEMs that are only clobbered. */
9526 return -1;
9527
9528 case CONST_DOUBLE:
9529 /* We're not interested in the MEM associated with a
9530 CONST_DOUBLE, so there's no need to traverse into this. */
9531 return -1;
9532
9533 case EXPR_LIST:
9534 /* We're not interested in any MEMs that only appear in notes. */
9535 return -1;
9536
9537 default:
9538 /* This is not a MEM. */
9539 return 0;
9540 }
9541
9542 /* See if we've already seen this MEM. */
9543 for (i = 0; i < loop_info->mems_idx; ++i)
9544 if (rtx_equal_p (m, loop_info->mems[i].mem))
9545 {
9546 if (MEM_VOLATILE_P (m) && !MEM_VOLATILE_P (loop_info->mems[i].mem))
9547 loop_info->mems[i].mem = m;
9548 if (GET_MODE (m) != GET_MODE (loop_info->mems[i].mem))
9549 /* The modes of the two memory accesses are different. If
9550 this happens, something tricky is going on, and we just
9551 don't optimize accesses to this MEM. */
9552 loop_info->mems[i].optimize = 0;
9553
9554 return 0;
9555 }
9556
9557 /* Resize the array, if necessary. */
9558 if (loop_info->mems_idx == loop_info->mems_allocated)
9559 {
9560 if (loop_info->mems_allocated != 0)
9561 loop_info->mems_allocated *= 2;
9562 else
9563 loop_info->mems_allocated = 32;
9564
9565 loop_info->mems = xrealloc (loop_info->mems,
9566 loop_info->mems_allocated * sizeof (loop_mem_info));
9567 }
9568
9569 /* Actually insert the MEM. */
9570 loop_info->mems[loop_info->mems_idx].mem = m;
9571 /* We can't hoist this MEM out of the loop if it's a BLKmode MEM
9572 because we can't put it in a register. We still store it in the
9573 table, though, so that if we see the same address later, but in a
9574 non-BLK mode, we'll not think we can optimize it at that point. */
9575 loop_info->mems[loop_info->mems_idx].optimize = (GET_MODE (m) != BLKmode);
9576 loop_info->mems[loop_info->mems_idx].reg = NULL_RTX;
9577 ++loop_info->mems_idx;
9578
9579 return 0;
9580 }
9581
9582
9583 /* Allocate REGS->ARRAY or reallocate it if it is too small.
9584
9585 Increment REGS->ARRAY[I].SET_IN_LOOP at the index I of each
9586 register that is modified by an insn between FROM and TO. If the
9587 value of an element of REGS->array[I].SET_IN_LOOP becomes 127 or
9588 more, stop incrementing it, to avoid overflow.
9589
9590 Store in REGS->ARRAY[I].SINGLE_USAGE the single insn in which
9591 register I is used, if it is only used once. Otherwise, it is set
9592 to 0 (for no uses) or const0_rtx for more than one use. This
9593 parameter may be zero, in which case this processing is not done.
9594
9595 Set REGS->ARRAY[I].MAY_NOT_OPTIMIZE nonzero if we should not
9596 optimize register I. */
9597
9598 static void
9599 loop_regs_scan (const struct loop *loop, int extra_size)
9600 {
9601 struct loop_regs *regs = LOOP_REGS (loop);
9602 int old_nregs;
9603 /* last_set[n] is nonzero iff reg n has been set in the current
9604 basic block. In that case, it is the insn that last set reg n. */
9605 rtx *last_set;
9606 rtx insn;
9607 int i;
9608
9609 old_nregs = regs->num;
9610 regs->num = max_reg_num ();
9611
9612 /* Grow the regs array if not allocated or too small. */
9613 if (regs->num >= regs->size)
9614 {
9615 regs->size = regs->num + extra_size;
9616
9617 regs->array = xrealloc (regs->array, regs->size * sizeof (*regs->array));
9618
9619 /* Zero the new elements. */
9620 memset (regs->array + old_nregs, 0,
9621 (regs->size - old_nregs) * sizeof (*regs->array));
9622 }
9623
9624 /* Clear previously scanned fields but do not clear n_times_set. */
9625 for (i = 0; i < old_nregs; i++)
9626 {
9627 regs->array[i].set_in_loop = 0;
9628 regs->array[i].may_not_optimize = 0;
9629 regs->array[i].single_usage = NULL_RTX;
9630 }
9631
9632 last_set = xcalloc (regs->num, sizeof (rtx));
9633
9634 /* Scan the loop, recording register usage. */
9635 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9636 insn = NEXT_INSN (insn))
9637 {
9638 if (INSN_P (insn))
9639 {
9640 /* Record registers that have exactly one use. */
9641 find_single_use_in_loop (regs, insn, PATTERN (insn));
9642
9643 /* Include uses in REG_EQUAL notes. */
9644 if (REG_NOTES (insn))
9645 find_single_use_in_loop (regs, insn, REG_NOTES (insn));
9646
9647 if (GET_CODE (PATTERN (insn)) == SET
9648 || GET_CODE (PATTERN (insn)) == CLOBBER)
9649 count_one_set (regs, insn, PATTERN (insn), last_set);
9650 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
9651 {
9652 int i;
9653 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
9654 count_one_set (regs, insn, XVECEXP (PATTERN (insn), 0, i),
9655 last_set);
9656 }
9657 }
9658
9659 if (GET_CODE (insn) == CODE_LABEL || GET_CODE (insn) == JUMP_INSN)
9660 memset (last_set, 0, regs->num * sizeof (rtx));
9661
9662 /* Invalidate all registers used for function argument passing.
9663 We check rtx_varies_p for the same reason as below, to allow
9664 optimizing PIC calculations. */
9665 if (GET_CODE (insn) == CALL_INSN)
9666 {
9667 rtx link;
9668 for (link = CALL_INSN_FUNCTION_USAGE (insn);
9669 link;
9670 link = XEXP (link, 1))
9671 {
9672 rtx op, reg;
9673
9674 if (GET_CODE (op = XEXP (link, 0)) == USE
9675 && GET_CODE (reg = XEXP (op, 0)) == REG
9676 && rtx_varies_p (reg, 1))
9677 regs->array[REGNO (reg)].may_not_optimize = 1;
9678 }
9679 }
9680 }
9681
9682 /* Invalidate all hard registers clobbered by calls. With one exception:
9683 a call-clobbered PIC register is still function-invariant for our
9684 purposes, since we can hoist any PIC calculations out of the loop.
9685 Thus the call to rtx_varies_p. */
9686 if (LOOP_INFO (loop)->has_call)
9687 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
9688 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i)
9689 && rtx_varies_p (regno_reg_rtx[i], 1))
9690 {
9691 regs->array[i].may_not_optimize = 1;
9692 regs->array[i].set_in_loop = 1;
9693 }
9694
9695 #ifdef AVOID_CCMODE_COPIES
9696 /* Don't try to move insns which set CC registers if we should not
9697 create CCmode register copies. */
9698 for (i = regs->num - 1; i >= FIRST_PSEUDO_REGISTER; i--)
9699 if (GET_MODE_CLASS (GET_MODE (regno_reg_rtx[i])) == MODE_CC)
9700 regs->array[i].may_not_optimize = 1;
9701 #endif
9702
9703 /* Set regs->array[I].n_times_set for the new registers. */
9704 for (i = old_nregs; i < regs->num; i++)
9705 regs->array[i].n_times_set = regs->array[i].set_in_loop;
9706
9707 free (last_set);
9708 }
9709
9710 /* Returns the number of real INSNs in the LOOP. */
9711
9712 static int
9713 count_insns_in_loop (const struct loop *loop)
9714 {
9715 int count = 0;
9716 rtx insn;
9717
9718 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9719 insn = NEXT_INSN (insn))
9720 if (INSN_P (insn))
9721 ++count;
9722
9723 return count;
9724 }
9725
9726 /* Move MEMs into registers for the duration of the loop. */
9727
9728 static void
9729 load_mems (const struct loop *loop)
9730 {
9731 struct loop_info *loop_info = LOOP_INFO (loop);
9732 struct loop_regs *regs = LOOP_REGS (loop);
9733 int maybe_never = 0;
9734 int i;
9735 rtx p, prev_ebb_head;
9736 rtx label = NULL_RTX;
9737 rtx end_label;
9738 /* Nonzero if the next instruction may never be executed. */
9739 int next_maybe_never = 0;
9740 unsigned int last_max_reg = max_reg_num ();
9741
9742 if (loop_info->mems_idx == 0)
9743 return;
9744
9745 /* We cannot use next_label here because it skips over normal insns. */
9746 end_label = next_nonnote_insn (loop->end);
9747 if (end_label && GET_CODE (end_label) != CODE_LABEL)
9748 end_label = NULL_RTX;
9749
9750 /* Check to see if it's possible that some instructions in the loop are
9751 never executed. Also check if there is a goto out of the loop other
9752 than right after the end of the loop. */
9753 for (p = next_insn_in_loop (loop, loop->scan_start);
9754 p != NULL_RTX;
9755 p = next_insn_in_loop (loop, p))
9756 {
9757 if (GET_CODE (p) == CODE_LABEL)
9758 maybe_never = 1;
9759 else if (GET_CODE (p) == JUMP_INSN
9760 /* If we enter the loop in the middle, and scan
9761 around to the beginning, don't set maybe_never
9762 for that. This must be an unconditional jump,
9763 otherwise the code at the top of the loop might
9764 never be executed. Unconditional jumps are
9765 followed by a barrier and then the loop end. */
9766 && ! (GET_CODE (p) == JUMP_INSN
9767 && JUMP_LABEL (p) == loop->top
9768 && NEXT_INSN (NEXT_INSN (p)) == loop->end
9769 && any_uncondjump_p (p)))
9770 {
9771 /* If this is a jump outside of the loop but not right
9772 after the end of the loop, we would have to emit new fixup
9773 sequences for each such label. */
9774 if (/* If we can't tell where control might go when this
9775 JUMP_INSN is executed, we must be conservative. */
9776 !JUMP_LABEL (p)
9777 || (JUMP_LABEL (p) != end_label
9778 && (INSN_UID (JUMP_LABEL (p)) >= max_uid_for_loop
9779 || INSN_LUID (JUMP_LABEL (p)) < INSN_LUID (loop->start)
9780 || INSN_LUID (JUMP_LABEL (p)) > INSN_LUID (loop->end))))
9781 return;
9782
9783 if (!any_condjump_p (p))
9784 /* Something complicated. */
9785 maybe_never = 1;
9786 else
9787 /* If there are any more instructions in the loop, they
9788 might not be reached. */
9789 next_maybe_never = 1;
9790 }
9791 else if (next_maybe_never)
9792 maybe_never = 1;
9793 }
9794
9795 /* Find start of the extended basic block that enters the loop. */
9796 for (p = loop->start;
9797 PREV_INSN (p) && GET_CODE (p) != CODE_LABEL;
9798 p = PREV_INSN (p))
9799 ;
9800 prev_ebb_head = p;
9801
9802 cselib_init (true);
9803
9804 /* Build table of mems that get set to constant values before the
9805 loop. */
9806 for (; p != loop->start; p = NEXT_INSN (p))
9807 cselib_process_insn (p);
9808
9809 /* Actually move the MEMs. */
9810 for (i = 0; i < loop_info->mems_idx; ++i)
9811 {
9812 regset_head load_copies;
9813 regset_head store_copies;
9814 int written = 0;
9815 rtx reg;
9816 rtx mem = loop_info->mems[i].mem;
9817 rtx mem_list_entry;
9818
9819 if (MEM_VOLATILE_P (mem)
9820 || loop_invariant_p (loop, XEXP (mem, 0)) != 1)
9821 /* There's no telling whether or not MEM is modified. */
9822 loop_info->mems[i].optimize = 0;
9823
9824 /* Go through the MEMs written to in the loop to see if this
9825 one is aliased by one of them. */
9826 mem_list_entry = loop_info->store_mems;
9827 while (mem_list_entry)
9828 {
9829 if (rtx_equal_p (mem, XEXP (mem_list_entry, 0)))
9830 written = 1;
9831 else if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
9832 mem, rtx_varies_p))
9833 {
9834 /* MEM is indeed aliased by this store. */
9835 loop_info->mems[i].optimize = 0;
9836 break;
9837 }
9838 mem_list_entry = XEXP (mem_list_entry, 1);
9839 }
9840
9841 if (flag_float_store && written
9842 && GET_MODE_CLASS (GET_MODE (mem)) == MODE_FLOAT)
9843 loop_info->mems[i].optimize = 0;
9844
9845 /* If this MEM is written to, we must be sure that there
9846 are no reads from another MEM that aliases this one. */
9847 if (loop_info->mems[i].optimize && written)
9848 {
9849 int j;
9850
9851 for (j = 0; j < loop_info->mems_idx; ++j)
9852 {
9853 if (j == i)
9854 continue;
9855 else if (true_dependence (mem,
9856 VOIDmode,
9857 loop_info->mems[j].mem,
9858 rtx_varies_p))
9859 {
9860 /* It's not safe to hoist loop_info->mems[i] out of
9861 the loop because writes to it might not be
9862 seen by reads from loop_info->mems[j]. */
9863 loop_info->mems[i].optimize = 0;
9864 break;
9865 }
9866 }
9867 }
9868
9869 if (maybe_never && may_trap_p (mem))
9870 /* We can't access the MEM outside the loop; it might
9871 cause a trap that wouldn't have happened otherwise. */
9872 loop_info->mems[i].optimize = 0;
9873
9874 if (!loop_info->mems[i].optimize)
9875 /* We thought we were going to lift this MEM out of the
9876 loop, but later discovered that we could not. */
9877 continue;
9878
9879 INIT_REG_SET (&load_copies);
9880 INIT_REG_SET (&store_copies);
9881
9882 /* Allocate a pseudo for this MEM. We set REG_USERVAR_P in
9883 order to keep scan_loop from moving stores to this MEM
9884 out of the loop just because this REG is neither a
9885 user-variable nor used in the loop test. */
9886 reg = gen_reg_rtx (GET_MODE (mem));
9887 REG_USERVAR_P (reg) = 1;
9888 loop_info->mems[i].reg = reg;
9889
9890 /* Now, replace all references to the MEM with the
9891 corresponding pseudos. */
9892 maybe_never = 0;
9893 for (p = next_insn_in_loop (loop, loop->scan_start);
9894 p != NULL_RTX;
9895 p = next_insn_in_loop (loop, p))
9896 {
9897 if (INSN_P (p))
9898 {
9899 rtx set;
9900
9901 set = single_set (p);
9902
9903 /* See if this copies the mem into a register that isn't
9904 modified afterwards. We'll try to do copy propagation
9905 a little further on. */
9906 if (set
9907 /* @@@ This test is _way_ too conservative. */
9908 && ! maybe_never
9909 && GET_CODE (SET_DEST (set)) == REG
9910 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER
9911 && REGNO (SET_DEST (set)) < last_max_reg
9912 && regs->array[REGNO (SET_DEST (set))].n_times_set == 1
9913 && rtx_equal_p (SET_SRC (set), mem))
9914 SET_REGNO_REG_SET (&load_copies, REGNO (SET_DEST (set)));
9915
9916 /* See if this copies the mem from a register that isn't
9917 modified afterwards. We'll try to remove the
9918 redundant copy later on by doing a little register
9919 renaming and copy propagation. This will help
9920 to untangle things for the BIV detection code. */
9921 if (set
9922 && ! maybe_never
9923 && GET_CODE (SET_SRC (set)) == REG
9924 && REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER
9925 && REGNO (SET_SRC (set)) < last_max_reg
9926 && regs->array[REGNO (SET_SRC (set))].n_times_set == 1
9927 && rtx_equal_p (SET_DEST (set), mem))
9928 SET_REGNO_REG_SET (&store_copies, REGNO (SET_SRC (set)));
9929
9930 /* If this is a call which uses / clobbers this memory
9931 location, we must not change the interface here. */
9932 if (GET_CODE (p) == CALL_INSN
9933 && reg_mentioned_p (loop_info->mems[i].mem,
9934 CALL_INSN_FUNCTION_USAGE (p)))
9935 {
9936 cancel_changes (0);
9937 loop_info->mems[i].optimize = 0;
9938 break;
9939 }
9940 else
9941 /* Replace the memory reference with the shadow register. */
9942 replace_loop_mems (p, loop_info->mems[i].mem,
9943 loop_info->mems[i].reg, written);
9944 }
9945
9946 if (GET_CODE (p) == CODE_LABEL
9947 || GET_CODE (p) == JUMP_INSN)
9948 maybe_never = 1;
9949 }
9950
9951 if (! loop_info->mems[i].optimize)
9952 ; /* We found we couldn't do the replacement, so do nothing. */
9953 else if (! apply_change_group ())
9954 /* We couldn't replace all occurrences of the MEM. */
9955 loop_info->mems[i].optimize = 0;
9956 else
9957 {
9958 /* Load the memory immediately before LOOP->START, which is
9959 the NOTE_LOOP_BEG. */
9960 cselib_val *e = cselib_lookup (mem, VOIDmode, 0);
9961 rtx set;
9962 rtx best = mem;
9963 int j;
9964 struct elt_loc_list *const_equiv = 0;
9965
9966 if (e)
9967 {
9968 struct elt_loc_list *equiv;
9969 struct elt_loc_list *best_equiv = 0;
9970 for (equiv = e->locs; equiv; equiv = equiv->next)
9971 {
9972 if (CONSTANT_P (equiv->loc))
9973 const_equiv = equiv;
9974 else if (GET_CODE (equiv->loc) == REG
9975 /* Extending hard register lifetimes causes crashes
9976 on SRC targets. Doing so on non-SRC targets is
9977 probably also not a good idea, since we most
9978 probably have a pseudo-register equivalence as
9979 well. */
9980 && REGNO (equiv->loc) >= FIRST_PSEUDO_REGISTER)
9981 best_equiv = equiv;
9982 }
9983 /* Use the constant equivalence if that is cheap enough. */
9984 if (! best_equiv)
9985 best_equiv = const_equiv;
9986 else if (const_equiv
9987 && (rtx_cost (const_equiv->loc, SET)
9988 <= rtx_cost (best_equiv->loc, SET)))
9989 {
9990 best_equiv = const_equiv;
9991 const_equiv = 0;
9992 }
9993
9994 /* If best_equiv is nonzero, we know that MEM is set to a
9995 constant or register before the loop. We will use this
9996 knowledge to initialize the shadow register with that
9997 constant or reg rather than by loading from MEM. */
9998 if (best_equiv)
9999 best = copy_rtx (best_equiv->loc);
10000 }
10001
10002 set = gen_move_insn (reg, best);
10003 set = loop_insn_hoist (loop, set);
10004 if (REG_P (best))
10005 {
10006 for (p = prev_ebb_head; p != loop->start; p = NEXT_INSN (p))
10007 if (REGNO_LAST_UID (REGNO (best)) == INSN_UID (p))
10008 {
10009 REGNO_LAST_UID (REGNO (best)) = INSN_UID (set);
10010 break;
10011 }
10012 }
10013
10014 if (const_equiv)
10015 set_unique_reg_note (set, REG_EQUAL, copy_rtx (const_equiv->loc));
10016
10017 if (written)
10018 {
10019 if (label == NULL_RTX)
10020 {
10021 label = gen_label_rtx ();
10022 emit_label_after (label, loop->end);
10023 }
10024
10025 /* Store the memory immediately after END, which is
10026 the NOTE_LOOP_END. */
10027 set = gen_move_insn (copy_rtx (mem), reg);
10028 loop_insn_emit_after (loop, 0, label, set);
10029 }
10030
10031 if (loop_dump_stream)
10032 {
10033 fprintf (loop_dump_stream, "Hoisted regno %d %s from ",
10034 REGNO (reg), (written ? "r/w" : "r/o"));
10035 print_rtl (loop_dump_stream, mem);
10036 fputc ('\n', loop_dump_stream);
10037 }
10038
10039 /* Attempt a bit of copy propagation. This helps untangle the
10040 data flow, and enables {basic,general}_induction_var to find
10041 more bivs/givs. */
10042 EXECUTE_IF_SET_IN_REG_SET
10043 (&load_copies, FIRST_PSEUDO_REGISTER, j,
10044 {
10045 try_copy_prop (loop, reg, j);
10046 });
10047 CLEAR_REG_SET (&load_copies);
10048
10049 EXECUTE_IF_SET_IN_REG_SET
10050 (&store_copies, FIRST_PSEUDO_REGISTER, j,
10051 {
10052 try_swap_copy_prop (loop, reg, j);
10053 });
10054 CLEAR_REG_SET (&store_copies);
10055 }
10056 }
10057
10058 /* Now, we need to replace all references to the previous exit
10059 label with the new one. */
10060 if (label != NULL_RTX && end_label != NULL_RTX)
10061 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
10062 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p) == end_label)
10063 redirect_jump (p, label, false);
10064
10065 cselib_finish ();
10066 }
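
/* Source-level sketch of what load_mems accomplishes (the variables are
   hypothetical; the real transformation is on RTL MEMs):

	for (i = 0; i < n; i++)          tmp = *q;
	  s += *q;                  =>   for (i = 0; i < n; i++)
	                                   s += tmp;

   For a MEM that is also written in the loop, a store of the shadow
   register back to memory is emitted after the loop, and exit jumps are
   redirected to the new label so the store is always reached. */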
10067
10068 /* For communication between note_reg_stored and its caller. */
10069 struct note_reg_stored_arg
10070 {
10071 int set_seen;
10072 rtx reg;
10073 };
10074
10075 /* Called via note_stores, record in SET_SEEN whether X, which is written,
10076 is equal to ARG. */
10077 static void
10078 note_reg_stored (rtx x, rtx setter ATTRIBUTE_UNUSED, void *arg)
10079 {
10080 struct note_reg_stored_arg *t = (struct note_reg_stored_arg *) arg;
10081 if (t->reg == x)
10082 t->set_seen = 1;
10083 }
10084
10085 /* Try to replace every occurrence of pseudo REGNO with REPLACEMENT.
10086 There must be exactly one insn that sets this pseudo; it will be
10087 deleted if all replacements succeed and we can prove that the register
10088 is not used after the loop. */
10089
10090 static void
10091 try_copy_prop (const struct loop *loop, rtx replacement, unsigned int regno)
10092 {
10093 /* This is the reg that we are copying from. */
10094 rtx reg_rtx = regno_reg_rtx[regno];
10095 rtx init_insn = 0;
10096 rtx insn;
10097 /* These help keep track of whether we replaced all uses of the reg. */
10098 int replaced_last = 0;
10099 int store_is_first = 0;
10100
10101 for (insn = next_insn_in_loop (loop, loop->scan_start);
10102 insn != NULL_RTX;
10103 insn = next_insn_in_loop (loop, insn))
10104 {
10105 rtx set;
10106
10107 /* Only substitute within one extended basic block from the initializing
10108 insn. */
10109 if (GET_CODE (insn) == CODE_LABEL && init_insn)
10110 break;
10111
10112 if (! INSN_P (insn))
10113 continue;
10114
10115 /* Is this the initializing insn? */
10116 set = single_set (insn);
10117 if (set
10118 && GET_CODE (SET_DEST (set)) == REG
10119 && REGNO (SET_DEST (set)) == regno)
10120 {
10121 if (init_insn)
10122 abort ();
10123
10124 init_insn = insn;
10125 if (REGNO_FIRST_UID (regno) == INSN_UID (insn))
10126 store_is_first = 1;
10127 }
10128
10129 /* Only substitute after seeing the initializing insn. */
10130 if (init_insn && insn != init_insn)
10131 {
10132 struct note_reg_stored_arg arg;
10133
10134 replace_loop_regs (insn, reg_rtx, replacement);
10135 if (REGNO_LAST_UID (regno) == INSN_UID (insn))
10136 replaced_last = 1;
10137
10138 /* Stop replacing when REPLACEMENT is modified. */
10139 arg.reg = replacement;
10140 arg.set_seen = 0;
10141 note_stores (PATTERN (insn), note_reg_stored, &arg);
10142 if (arg.set_seen)
10143 {
10144 rtx note = find_reg_note (insn, REG_EQUAL, NULL);
10145
10146 /* It is possible that we've turned a previously valid REG_EQUAL note
10147 into an invalid one: we changed REGNO to REPLACEMENT, and since
10148 REPLACEMENT (unlike REGNO) is modified, the note's meaning changes. */
10149 if (note && reg_mentioned_p (replacement, XEXP (note, 0)))
10150 remove_note (insn, note);
10151 break;
10152 }
10153 }
10154 }
10155 if (! init_insn)
10156 abort ();
10157 if (apply_change_group ())
10158 {
10159 if (loop_dump_stream)
10160 fprintf (loop_dump_stream, " Replaced reg %d", regno);
10161 if (store_is_first && replaced_last)
10162 {
10163 rtx first;
10164 rtx retval_note;
10165
10166 /* Assume we're just deleting INIT_INSN. */
10167 first = init_insn;
10168 /* Look for REG_RETVAL note. If we're deleting the end of
10169 the libcall sequence, the whole sequence can go. */
10170 retval_note = find_reg_note (init_insn, REG_RETVAL, NULL_RTX);
10171 /* If we found a REG_RETVAL note, find the first instruction
10172 in the sequence. */
10173 if (retval_note)
10174 first = XEXP (retval_note, 0);
10175
10176 /* Delete the instructions. */
10177 loop_delete_insns (first, init_insn);
10178 }
10179 if (loop_dump_stream)
10180 fprintf (loop_dump_stream, ".\n");
10181 }
10182 }
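
/* Sketch of the substitution above (register numbers hypothetical):
   given, inside one extended basic block of the loop,

	(set (reg 100) (reg 200))     ; the single initializing insn
	... later uses of (reg 100) ...

   every use of (reg 100) after the initializing insn is rewritten to use
   (reg 200); if that covers both the first and the last use of reg 100,
   the initializing insn (or its whole libcall sequence) is deleted. */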
10183
10184 /* Replace all the instructions from FIRST up to and including LAST
10185 with NOTE_INSN_DELETED notes. */
10186
10187 static void
10188 loop_delete_insns (rtx first, rtx last)
10189 {
10190 while (1)
10191 {
10192 if (loop_dump_stream)
10193 fprintf (loop_dump_stream, ", deleting init_insn (%d)",
10194 INSN_UID (first));
10195 delete_insn (first);
10196
10197 /* If this was the LAST instruction we're supposed to delete,
10198 we're done. */
10199 if (first == last)
10200 break;
10201
10202 first = NEXT_INSN (first);
10203 }
10204 }
10205
10206 /* Try to replace occurrences of pseudo REGNO with REPLACEMENT within
10207 loop LOOP if the order of the sets of these registers can be
10208 swapped. There must be exactly one insn within the loop that sets
10209 this pseudo followed immediately by a move insn that sets
10210 REPLACEMENT with REGNO. */
10211 static void
10212 try_swap_copy_prop (const struct loop *loop, rtx replacement,
10213 unsigned int regno)
10214 {
10215 rtx insn;
10216 rtx set = NULL_RTX;
10217 unsigned int new_regno;
10218
10219 new_regno = REGNO (replacement);
10220
10221 for (insn = next_insn_in_loop (loop, loop->scan_start);
10222 insn != NULL_RTX;
10223 insn = next_insn_in_loop (loop, insn))
10224 {
10225 /* Search for the insn that copies REGNO to NEW_REGNO. */
10226 if (INSN_P (insn)
10227 && (set = single_set (insn))
10228 && GET_CODE (SET_DEST (set)) == REG
10229 && REGNO (SET_DEST (set)) == new_regno
10230 && GET_CODE (SET_SRC (set)) == REG
10231 && REGNO (SET_SRC (set)) == regno)
10232 break;
10233 }
10234
10235 if (insn != NULL_RTX)
10236 {
10237 rtx prev_insn;
10238 rtx prev_set;
10239
10240 /* Some DEF-USE info would come in handy here to make this
10241 function more general. For now, just check the previous insn
10242 which is the most likely candidate for setting REGNO. */
10243
10244 prev_insn = PREV_INSN (insn);
10245
10246 if (INSN_P (insn)
10247 && (prev_set = single_set (prev_insn))
10248 && GET_CODE (SET_DEST (prev_set)) == REG
10249 && REGNO (SET_DEST (prev_set)) == regno)
10250 {
10251 /* We have:
10252 (set (reg regno) (expr))
10253 (set (reg new_regno) (reg regno))
10254
10255 so try converting this to:
10256 (set (reg new_regno) (expr))
10257 (set (reg regno) (reg new_regno))
10258
10259 The former construct is often generated when a global
10260 variable used for an induction variable is shadowed by a
10261 register (NEW_REGNO). The latter construct improves the
10262 chances of GIV replacement and BIV elimination. */
10263
10264 validate_change (prev_insn, &SET_DEST (prev_set),
10265 replacement, 1);
10266 validate_change (insn, &SET_DEST (set),
10267 SET_SRC (set), 1);
10268 validate_change (insn, &SET_SRC (set),
10269 replacement, 1);
10270
10271 if (apply_change_group ())
10272 {
10273 if (loop_dump_stream)
10274 fprintf (loop_dump_stream,
10275 " Swapped set of reg %d at %d with reg %d at %d.\n",
10276 regno, INSN_UID (insn),
10277 new_regno, INSN_UID (prev_insn));
10278
10279 /* Update first use of REGNO. */
10280 if (REGNO_FIRST_UID (regno) == INSN_UID (prev_insn))
10281 REGNO_FIRST_UID (regno) = INSN_UID (insn);
10282
10283 /* Now perform copy propagation to hopefully
10284 remove all uses of REGNO within the loop. */
10285 try_copy_prop (loop, replacement, regno);
10286 }
10287 }
10288 }
10289 }
10290
10291 /* Worker function for find_mem_in_note, called via for_each_rtx. */
10292
10293 static int
10294 find_mem_in_note_1 (rtx *x, void *data)
10295 {
10296 if (*x != NULL_RTX && GET_CODE (*x) == MEM)
10297 {
10298 rtx *res = (rtx *) data;
10299 *res = *x;
10300 return 1;
10301 }
10302 return 0;
10303 }
10304
10305 /* Returns the first MEM found in NOTE by depth-first search. */
10306
10307 static rtx
10308 find_mem_in_note (rtx note)
10309 {
10310 if (note && for_each_rtx (&note, find_mem_in_note_1, &note))
10311 return note;
10312 return NULL_RTX;
10313 }
10314
10315 /* Replace MEM with its associated pseudo register. This function is
10316 called from load_mems via for_each_rtx. DATA is actually a pointer
10317 to a structure describing the instruction currently being scanned
10318 and the MEM we are currently replacing. */
10319
10320 static int
10321 replace_loop_mem (rtx *mem, void *data)
10322 {
10323 loop_replace_args *args = (loop_replace_args *) data;
10324 rtx m = *mem;
10325
10326 if (m == NULL_RTX)
10327 return 0;
10328
10329 switch (GET_CODE (m))
10330 {
10331 case MEM:
10332 break;
10333
10334 case CONST_DOUBLE:
10335 /* We're not interested in the MEM associated with a
10336 CONST_DOUBLE, so there's no need to traverse into one. */
10337 return -1;
10338
10339 default:
10340 /* This is not a MEM. */
10341 return 0;
10342 }
10343
10344 if (!rtx_equal_p (args->match, m))
10345 /* This is not the MEM we are currently replacing. */
10346 return 0;
10347
10348 /* Actually replace the MEM. */
10349 validate_change (args->insn, mem, args->replacement, 1);
10350
10351 return 0;
10352 }
10353
10354 static void
10355 replace_loop_mems (rtx insn, rtx mem, rtx reg, int written)
10356 {
10357 loop_replace_args args;
10358
10359 args.insn = insn;
10360 args.match = mem;
10361 args.replacement = reg;
10362
10363 for_each_rtx (&insn, replace_loop_mem, &args);
10364
10365 /* If we hoist a mem write out of the loop, then REG_EQUAL
10366 notes referring to the mem are no longer valid. */
10367 if (written)
10368 {
10369 rtx note, sub;
10370 rtx *link;
10371
10372 for (link = &REG_NOTES (insn); (note = *link); link = &XEXP (note, 1))
10373 {
10374 if (REG_NOTE_KIND (note) == REG_EQUAL
10375 && (sub = find_mem_in_note (note))
10376 && true_dependence (mem, VOIDmode, sub, rtx_varies_p))
10377 {
10378 /* Remove the note. */
10379 validate_change (NULL_RTX, link, XEXP (note, 1), 1);
10380 break;
10381 }
10382 }
10383 }
10384 }
10385
10386 /* Replace one register with another. Called through for_each_rtx; PX points
10387 to the rtx being scanned. DATA is actually a pointer to
10388 a structure of arguments. */
10389
10390 static int
10391 replace_loop_reg (rtx *px, void *data)
10392 {
10393 rtx x = *px;
10394 loop_replace_args *args = (loop_replace_args *) data;
10395
10396 if (x == NULL_RTX)
10397 return 0;
10398
10399 if (x == args->match)
10400 validate_change (args->insn, px, args->replacement, 1);
10401
10402 return 0;
10403 }
10404
10405 static void
10406 replace_loop_regs (rtx insn, rtx reg, rtx replacement)
10407 {
10408 loop_replace_args args;
10409
10410 args.insn = insn;
10411 args.match = reg;
10412 args.replacement = replacement;
10413
10414 for_each_rtx (&insn, replace_loop_reg, &args);
10415 }
10416 \f
10417 /* Emit insn for PATTERN after WHERE_INSN in basic block WHERE_BB
10418 (ignored in the interim). */
10419
10420 static rtx
10421 loop_insn_emit_after (const struct loop *loop ATTRIBUTE_UNUSED,
10422 basic_block where_bb ATTRIBUTE_UNUSED, rtx where_insn,
10423 rtx pattern)
10424 {
10425 return emit_insn_after (pattern, where_insn);
10426 }
10427
10428
10429 /* If WHERE_INSN is nonzero, emit an insn for PATTERN before WHERE_INSN
10430 in basic block WHERE_BB (ignored in the interim) within the loop;
10431 otherwise hoist PATTERN into the loop pre-header. */
10432
10433 rtx
10434 loop_insn_emit_before (const struct loop *loop,
10435 basic_block where_bb ATTRIBUTE_UNUSED,
10436 rtx where_insn, rtx pattern)
10437 {
10438 if (! where_insn)
10439 return loop_insn_hoist (loop, pattern);
10440 return emit_insn_before (pattern, where_insn);
10441 }
10442
10443
10444 /* Emit call insn for PATTERN before WHERE_INSN in basic block
10445 WHERE_BB (ignored in the interim) within the loop. */
10446
10447 static rtx
10448 loop_call_insn_emit_before (const struct loop *loop ATTRIBUTE_UNUSED,
10449 basic_block where_bb ATTRIBUTE_UNUSED,
10450 rtx where_insn, rtx pattern)
10451 {
10452 return emit_call_insn_before (pattern, where_insn);
10453 }
10454
10455
10456 /* Hoist insn for PATTERN into the loop pre-header. */
10457
10458 rtx
10459 loop_insn_hoist (const struct loop *loop, rtx pattern)
10460 {
10461 return loop_insn_emit_before (loop, 0, loop->start, pattern);
10462 }
10463
10464
10465 /* Hoist call insn for PATTERN into the loop pre-header. */
10466
10467 static rtx
10468 loop_call_insn_hoist (const struct loop *loop, rtx pattern)
10469 {
10470 return loop_call_insn_emit_before (loop, 0, loop->start, pattern);
10471 }
10472
10473
10474 /* Sink insn for PATTERN after the loop end. */
10475
10476 rtx
10477 loop_insn_sink (const struct loop *loop, rtx pattern)
10478 {
10479 return loop_insn_emit_before (loop, 0, loop->sink, pattern);
10480 }
10481
10482 /* bl->final_value can be either general_operand or PLUS of general_operand
10483 and constant. Emit sequence of instructions to load it into REG. */
10484 static rtx
10485 gen_load_of_final_value (rtx reg, rtx final_value)
10486 {
10487 rtx seq;
10488 start_sequence ();
10489 final_value = force_operand (final_value, reg);
10490 if (final_value != reg)
10491 emit_move_insn (reg, final_value);
10492 seq = get_insns ();
10493 end_sequence ();
10494 return seq;
10495 }
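
/* For instance (a sketch), with a final value of the form
   (plus (reg 100) (const_int 16)), the returned sequence computes
   reg 100 + 16 into REG; force_operand takes care of emitting whatever
   add or move insns the target requires. */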
10496
10497 /* If the loop has multiple exits, emit insn for PATTERN before the
10498 loop to ensure that it will always be executed no matter how the
10499 loop exits. Otherwise, emit the insn for PATTERN after the loop,
10500 since this is slightly more efficient. */
10501
10502 static rtx
10503 loop_insn_sink_or_swim (const struct loop *loop, rtx pattern)
10504 {
10505 if (loop->exit_count)
10506 return loop_insn_hoist (loop, pattern);
10507 else
10508 return loop_insn_sink (loop, pattern);
10509 }
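
/* For instance (a sketch), when emitting the insn that sets a biv's
   loop-invariant final value: with a single exit it can simply be sunk
   after the loop, but if the loop also has an early exit the insn is
   hoisted into the pre-header so it executes no matter which exit is
   taken. */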
10510 \f
10511 static void
10512 loop_ivs_dump (const struct loop *loop, FILE *file, int verbose)
10513 {
10514 struct iv_class *bl;
10515 int iv_num = 0;
10516
10517 if (! loop || ! file)
10518 return;
10519
10520 for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10521 iv_num++;
10522
10523 fprintf (file, "Loop %d: %d IV classes\n", loop->num, iv_num);
10524
10525 for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10526 {
10527 loop_iv_class_dump (bl, file, verbose);
10528 fputc ('\n', file);
10529 }
10530 }
10531
10532
10533 static void
10534 loop_iv_class_dump (const struct iv_class *bl, FILE *file,
10535 int verbose ATTRIBUTE_UNUSED)
10536 {
10537 struct induction *v;
10538 rtx incr;
10539 int i;
10540
10541 if (! bl || ! file)
10542 return;
10543
10544 fprintf (file, "IV class for reg %d, benefit %d\n",
10545 bl->regno, bl->total_benefit);
10546
10547 fprintf (file, " Init insn %d", INSN_UID (bl->init_insn));
10548 if (bl->initial_value)
10549 {
10550 fprintf (file, ", init val: ");
10551 print_simple_rtl (file, bl->initial_value);
10552 }
10553 if (bl->initial_test)
10554 {
10555 fprintf (file, ", init test: ");
10556 print_simple_rtl (file, bl->initial_test);
10557 }
10558 fputc ('\n', file);
10559
10560 if (bl->final_value)
10561 {
10562 fprintf (file, " Final val: ");
10563 print_simple_rtl (file, bl->final_value);
10564 fputc ('\n', file);
10565 }
10566
10567 if ((incr = biv_total_increment (bl)))
10568 {
10569 fprintf (file, " Total increment: ");
10570 print_simple_rtl (file, incr);
10571 fputc ('\n', file);
10572 }
10573
10574 /* List the increments. */
10575 for (i = 0, v = bl->biv; v; v = v->next_iv, i++)
10576 {
10577 fprintf (file, " Inc%d: insn %d, incr: ", i, INSN_UID (v->insn));
10578 print_simple_rtl (file, v->add_val);
10579 fputc ('\n', file);
10580 }
10581
10582 /* List the givs. */
10583 for (i = 0, v = bl->giv; v; v = v->next_iv, i++)
10584 {
10585 fprintf (file, " Giv%d: insn %d, benefit %d, ",
10586 i, INSN_UID (v->insn), v->benefit);
10587 if (v->giv_type == DEST_ADDR)
10588 print_simple_rtl (file, v->mem);
10589 else
10590 print_simple_rtl (file, single_set (v->insn));
10591 fputc ('\n', file);
10592 }
10593 }
10594
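/* For orientation, the output of loop_iv_class_dump has roughly this shape
   (all register, insn and benefit numbers are made up and the RTL is
   abbreviated):

     IV class for reg 64, benefit 12
      Init insn 23, init val: (const_int 0)
      Total increment: (const_int 4)
      Inc0: insn 31, incr: (const_int 4)
      Giv0: insn 35, benefit 6, (set (reg 65) (plus (reg 64) (reg 70)))  */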
10595
10596 static void
10597 loop_biv_dump (const struct induction *v, FILE *file, int verbose)
10598 {
10599 if (! v || ! file)
10600 return;
10601
10602 fprintf (file,
10603 "Biv %d: insn %d",
10604 REGNO (v->dest_reg), INSN_UID (v->insn));
10605 fprintf (file, " const ");
10606 print_simple_rtl (file, v->add_val);
10607
10608 if (verbose && v->final_value)
10609 {
10610 fputc ('\n', file);
10611 fprintf (file, " final ");
10612 print_simple_rtl (file, v->final_value);
10613 }
10614
10615 fputc ('\n', file);
10616 }
10617
10618
10619 static void
10620 loop_giv_dump (const struct induction *v, FILE *file, int verbose)
10621 {
10622 if (! v || ! file)
10623 return;
10624
10625 if (v->giv_type == DEST_REG)
10626 fprintf (file, "Giv %d: insn %d",
10627 REGNO (v->dest_reg), INSN_UID (v->insn));
10628 else
10629 fprintf (file, "Dest address: insn %d",
10630 INSN_UID (v->insn));
10631
10632 fprintf (file, " src reg %d benefit %d",
10633 REGNO (v->src_reg), v->benefit);
10634 fprintf (file, " lifetime %d",
10635 v->lifetime);
10636
10637 if (v->replaceable)
10638 fprintf (file, " replaceable");
10639
10640 if (v->no_const_addval)
10641 fprintf (file, " ncav");
10642
10643 if (v->ext_dependent)
10644 {
10645 switch (GET_CODE (v->ext_dependent))
10646 {
10647 case SIGN_EXTEND:
10648 fprintf (file, " ext se");
10649 break;
10650 case ZERO_EXTEND:
10651 fprintf (file, " ext ze");
10652 break;
10653 case TRUNCATE:
10654 fprintf (file, " ext tr");
10655 break;
10656 default:
10657 abort ();
10658 }
10659 }
10660
10661 fputc ('\n', file);
10662 fprintf (file, " mult ");
10663 print_simple_rtl (file, v->mult_val);
10664
10665 fputc ('\n', file);
10666 fprintf (file, " add ");
10667 print_simple_rtl (file, v->add_val);
10668
10669 if (verbose && v->final_value)
10670 {
10671 fputc ('\n', file);
10672 fprintf (file, " final ");
10673 print_simple_rtl (file, v->final_value);
10674 }
10675
10676 fputc ('\n', file);
10677 }
10678
10679
10680 void
10681 debug_ivs (const struct loop *loop)
10682 {
10683 loop_ivs_dump (loop, stderr, 1);
10684 }
10685
10686
10687 void
10688 debug_iv_class (const struct iv_class *bl)
10689 {
10690 loop_iv_class_dump (bl, stderr, 1);
10691 }
10692
10693
10694 void
10695 debug_biv (const struct induction *v)
10696 {
10697 loop_biv_dump (v, stderr, 1);
10698 }
10699
10700
10701 void
10702 debug_giv (const struct induction *v)
10703 {
10704 loop_giv_dump (v, stderr, 1);
10705 }
10706
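/* The debug_* entry points above are intended to be called by hand from a
   debugger while stopped inside this pass; for example, under gdb a command
   such as "call debug_iv_class (bl)" or "call debug_loop (loop)" (the
   variable names depend on the frame you are stopped in) writes the
   corresponding dump to stderr.  */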
10707
10708 #define LOOP_BLOCK_NUM_1(INSN) \
10709 ((INSN) ? (BLOCK_FOR_INSN (INSN) ? BLOCK_NUM (INSN) : -1) : -1)
10710
10711 /* The notes do not have an assigned block, so look at the next insn. */
10712 #define LOOP_BLOCK_NUM(INSN) \
10713 ((INSN) ? (GET_CODE (INSN) == NOTE \
10714 ? LOOP_BLOCK_NUM_1 (next_nonnote_insn (INSN)) \
10715 : LOOP_BLOCK_NUM_1 (INSN)) \
10716 : -1)
10717
10718 #define LOOP_INSN_UID(INSN) ((INSN) ? INSN_UID (INSN) : -1)
10719
10720 static void
10721 loop_dump_aux (const struct loop *loop, FILE *file,
10722 int verbose ATTRIBUTE_UNUSED)
10723 {
10724 rtx label;
10725
10726 if (! loop || ! file)
10727 return;
10728
10729 /* Print diagnostics to compare our concept of a loop with
10730 what the loop notes say. */
10731 if (! PREV_INSN (BB_HEAD (loop->first))
10732 || GET_CODE (PREV_INSN (BB_HEAD (loop->first))) != NOTE
10733 || NOTE_LINE_NUMBER (PREV_INSN (BB_HEAD (loop->first)))
10734 != NOTE_INSN_LOOP_BEG)
10735 fprintf (file, ";; No NOTE_INSN_LOOP_BEG at %d\n",
10736 INSN_UID (PREV_INSN (BB_HEAD (loop->first))));
10737 if (! NEXT_INSN (BB_END (loop->last))
10738 || GET_CODE (NEXT_INSN (BB_END (loop->last))) != NOTE
10739 || NOTE_LINE_NUMBER (NEXT_INSN (BB_END (loop->last)))
10740 != NOTE_INSN_LOOP_END)
10741 fprintf (file, ";; No NOTE_INSN_LOOP_END at %d\n",
10742 INSN_UID (NEXT_INSN (BB_END (loop->last))));
10743
10744 if (loop->start)
10745 {
10746 fprintf (file,
10747 ";; start %d (%d), cont dom %d (%d), cont %d (%d), vtop %d (%d), end %d (%d)\n",
10748 LOOP_BLOCK_NUM (loop->start),
10749 LOOP_INSN_UID (loop->start),
10750 LOOP_BLOCK_NUM (loop->cont),
10751 LOOP_INSN_UID (loop->cont),
10752 LOOP_BLOCK_NUM (loop->cont),
10753 LOOP_INSN_UID (loop->cont),
10754 LOOP_BLOCK_NUM (loop->vtop),
10755 LOOP_INSN_UID (loop->vtop),
10756 LOOP_BLOCK_NUM (loop->end),
10757 LOOP_INSN_UID (loop->end));
10758 fprintf (file, ";; top %d (%d), scan start %d (%d)\n",
10759 LOOP_BLOCK_NUM (loop->top),
10760 LOOP_INSN_UID (loop->top),
10761 LOOP_BLOCK_NUM (loop->scan_start),
10762 LOOP_INSN_UID (loop->scan_start));
10763 fprintf (file, ";; exit_count %d", loop->exit_count);
10764 if (loop->exit_count)
10765 {
10766 fputs (", labels:", file);
10767 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
10768 {
10769 fprintf (file, " %d ",
10770 LOOP_INSN_UID (XEXP (label, 0)));
10771 }
10772 }
10773 fputs ("\n", file);
10774
10775 /* This can happen when a marked loop appears as two nested loops,
10776 say from while (a || b) {}. The inner loop won't match
10777 the loop markers but the outer one will. */
10778 if (LOOP_BLOCK_NUM (loop->cont) != loop->latch->index)
10779 fprintf (file, ";; NOTE_INSN_LOOP_CONT not in loop latch\n");
10780 }
10781 }
10782
10783 /* Call this function from the debugger to dump LOOP. */
10784
10785 void
10786 debug_loop (const struct loop *loop)
10787 {
10788 flow_loop_dump (loop, stderr, loop_dump_aux, 1);
10789 }
10790
10791 /* Call this function from the debugger to dump LOOPS. */
10792
10793 void
10794 debug_loops (const struct loops *loops)
10795 {
10796 flow_loops_dump (loops, stderr, loop_dump_aux, 1);
10797 }