]> git.ipfire.org Git - thirdparty/gcc.git/blame - gcc/gimple-ssa-strength-reduction.c
Automated conversion of passes to C++ classes
[thirdparty/gcc.git] / gcc / gimple-ssa-strength-reduction.c
CommitLineData
4502f5d0 1/* Straight-line strength reduction.
711789cc 2 Copyright (C) 2012-2013 Free Software Foundation, Inc.
4502f5d0 3 Contributed by Bill Schmidt, IBM <wschmidt@linux.ibm.com>
4
5This file is part of GCC.
6
7GCC is free software; you can redistribute it and/or modify it under
8the terms of the GNU General Public License as published by the Free
9Software Foundation; either version 3, or (at your option) any later
10version.
11
12GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13WARRANTY; without even the implied warranty of MERCHANTABILITY or
14FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15for more details.
16
17You should have received a copy of the GNU General Public License
18along with GCC; see the file COPYING3. If not see
19<http://www.gnu.org/licenses/>. */
20
21/* There are many algorithms for performing strength reduction on
22 loops. This is not one of them. IVOPTS handles strength reduction
23 of induction variables just fine. This pass is intended to pick
24 up the crumbs it leaves behind, by considering opportunities for
25 strength reduction along dominator paths.
26
1168caca 27 Strength reduction addresses explicit multiplies, and certain
28 multiplies implicit in addressing expressions. It would also be
29 possible to apply strength reduction to divisions and modulos,
30 but such opportunities are relatively uncommon.
4502f5d0 31
32 Strength reduction is also currently restricted to integer operations.
33 If desired, it could be extended to floating-point operations under
34 control of something like -funsafe-math-optimizations. */
35
36#include "config.h"
37#include "system.h"
38#include "coretypes.h"
39#include "tree.h"
40#include "gimple.h"
41#include "basic-block.h"
42#include "tree-pass.h"
4502f5d0 43#include "cfgloop.h"
4502f5d0 44#include "gimple-pretty-print.h"
45#include "tree-flow.h"
46#include "domwalk.h"
47#include "pointer-set.h"
72655676 48#include "expmed.h"
df4c32b3 49#include "params.h"
d9dd21a8 50#include "hash-table.h"
4502f5d0 51\f
52/* Information about a strength reduction candidate. Each statement
53 in the candidate table represents an expression of one of the
54 following forms (the special case of CAND_REF will be described
55 later):
56
57 (CAND_MULT) S1: X = (B + i) * S
58 (CAND_ADD) S1: X = B + (i * S)
59
60 Here X and B are SSA names, i is an integer constant, and S is
61 either an SSA name or a constant. We call B the "base," i the
62 "index", and S the "stride."
63
64 Any statement S0 that dominates S1 and is of the form:
65
66 (CAND_MULT) S0: Y = (B + i') * S
67 (CAND_ADD) S0: Y = B + (i' * S)
68
69 is called a "basis" for S1. In both cases, S1 may be replaced by
70
71 S1': X = Y + (i - i') * S,
72
73 where (i - i') * S is folded to the extent possible.
74
75 All gimple statements are visited in dominator order, and each
76 statement that may contribute to one of the forms of S1 above is
77 given at least one entry in the candidate table. Such statements
78 include addition, pointer addition, subtraction, multiplication,
79 negation, copies, and nontrivial type casts. If a statement may
80 represent more than one expression of the forms of S1 above,
81 multiple "interpretations" are stored in the table and chained
82 together. Examples:
83
84 * An add of two SSA names may treat either operand as the base.
85 * A multiply of two SSA names, likewise.
86 * A copy or cast may be thought of as either a CAND_MULT with
87 i = 0 and S = 1, or as a CAND_ADD with i = 0 or S = 0.
88
89 Candidate records are allocated from an obstack. They are addressed
90 both from a hash table keyed on S1, and from a vector of candidate
91 pointers arranged in predominator order.
92
93 Opportunity note
94 ----------------
95 Currently we don't recognize:
96
97 S0: Y = (S * i') - B
98 S1: X = (S * i) - B
99
100 as a strength reduction opportunity, even though this S1 would
101 also be replaceable by the S1' above. This can be added if it
070bf980 102 comes up in practice.
103
104 Strength reduction in addressing
105 --------------------------------
106 There is another kind of candidate known as CAND_REF. A CAND_REF
107 describes a statement containing a memory reference having
108 complex addressing that might benefit from strength reduction.
109 Specifically, we are interested in references for which
110 get_inner_reference returns a base address, offset, and bitpos as
111 follows:
112
113 base: MEM_REF (T1, C1)
114 offset: MULT_EXPR (PLUS_EXPR (T2, C2), C3)
115 bitpos: C4 * BITS_PER_UNIT
116
117 Here T1 and T2 are arbitrary trees, and C1, C2, C3, C4 are
118 arbitrary integer constants. Note that C2 may be zero, in which
119 case the offset will be MULT_EXPR (T2, C3).
120
121 When this pattern is recognized, the original memory reference
122 can be replaced with:
123
124 MEM_REF (POINTER_PLUS_EXPR (T1, MULT_EXPR (T2, C3)),
125 C1 + (C2 * C3) + C4)
126
127 which distributes the multiply to allow constant folding. When
128 two or more addressing expressions can be represented by MEM_REFs
129 of this form, differing only in the constants C1, C2, and C4,
130 making this substitution produces more efficient addressing during
131 the RTL phases. When there are not at least two expressions with
132 the same values of T1, T2, and C3, there is nothing to be gained
133 by the replacement.
134
135 Strength reduction of CAND_REFs uses the same infrastructure as
136 that used by CAND_MULTs and CAND_ADDs. We record T1 in the base (B)
137 field, MULT_EXPR (T2, C3) in the stride (S) field, and
138 C1 + (C2 * C3) + C4 in the index (i) field. A basis for a CAND_REF
139 is thus another CAND_REF with the same B and S values. When at
140 least two CAND_REFs are chained together using the basis relation,
141 each of them is replaced as above, resulting in improved code
1168caca 142 generation for addressing.
143
144 Conditional candidates
145 ======================
146
147 Conditional candidates are best illustrated with an example.
148 Consider the code sequence:
149
150 (1) x_0 = ...;
151 (2) a_0 = x_0 * 5; MULT (B: x_0; i: 0; S: 5)
152 if (...)
153 (3) x_1 = x_0 + 1; ADD (B: x_0, i: 1; S: 1)
154 (4) x_2 = PHI <x_0, x_1>; PHI (B: x_0, i: 0, S: 1)
155 (5) x_3 = x_2 + 1; ADD (B: x_2, i: 1, S: 1)
156 (6) a_1 = x_3 * 5; MULT (B: x_2, i: 1; S: 5)
157
158 Here strength reduction is complicated by the uncertain value of x_2.
159 A legitimate transformation is:
160
161 (1) x_0 = ...;
162 (2) a_0 = x_0 * 5;
163 if (...)
164 {
165 (3) [x_1 = x_0 + 1;]
166 (3a) t_1 = a_0 + 5;
167 }
168 (4) [x_2 = PHI <x_0, x_1>;]
169 (4a) t_2 = PHI <a_0, t_1>;
170 (5) [x_3 = x_2 + 1;]
171 (6r) a_1 = t_2 + 5;
172
173 where the bracketed instructions may go dead.
174
175 To recognize this opportunity, we have to observe that statement (6)
176 has a "hidden basis" (2). The hidden basis is unlike a normal basis
177 in that the statement and the hidden basis have different base SSA
178 names (x_2 and x_0, respectively). The relationship is established
179 when a statement's base name (x_2) is defined by a phi statement (4),
180 each argument of which (x_0, x_1) has an identical "derived base name."
181 If the argument is defined by a candidate (as x_1 is by (3)) that is a
182 CAND_ADD having a stride of 1, the derived base name of the argument is
183 the base name of the candidate (x_0). Otherwise, the argument itself
184 is its derived base name (as is the case with argument x_0).
185
186 The hidden basis for statement (6) is the nearest dominating candidate
187 whose base name is the derived base name (x_0) of the feeding phi (4),
188 and whose stride is identical to that of the statement. We can then
189 create the new "phi basis" (4a) and feeding adds along incoming arcs (3a),
190 allowing the final replacement of (6) by the strength-reduced (6r).
191
192 To facilitate this, a new kind of candidate (CAND_PHI) is introduced.
193 A CAND_PHI is not a candidate for replacement, but is maintained in the
194 candidate table to ease discovery of hidden bases. Any phi statement
195 whose arguments share a common derived base name is entered into the
196 table with the derived base name, an (arbitrary) index of zero, and a
197 stride of 1. A statement with a hidden basis can then be detected by
198 simply looking up its feeding phi definition in the candidate table,
199 extracting the derived base name, and searching for a basis in the
200 usual manner after substituting the derived base name.
201
202 Note that the transformation is only valid when the original phi and
203 the statements that define the phi's arguments are all at the same
204 position in the loop hierarchy. */
4502f5d0 205
206
207/* Index into the candidate vector, offset by 1. VECs are zero-based,
208 while cand_idx's are one-based, with zero indicating null. */
209typedef unsigned cand_idx;
210
211/* The kind of candidate. */
212enum cand_kind
213{
214 CAND_MULT,
070bf980 215 CAND_ADD,
1168caca 216 CAND_REF,
217 CAND_PHI
4502f5d0 218};
219
220struct slsr_cand_d
221{
222 /* The candidate statement S1. */
223 gimple cand_stmt;
224
c99e471e 225 /* The base expression B: often an SSA name, but not always. */
226 tree base_expr;
4502f5d0 227
228 /* The stride S. */
229 tree stride;
230
231 /* The index constant i. */
232 double_int index;
233
c99e471e 234 /* The type of the candidate. This is normally the type of base_expr,
4502f5d0 235 but casts may have occurred when combining feeding instructions.
070bf980 236 A candidate can only be a basis for candidates of the same final type.
237 (For CAND_REFs, this is the type to be used for operand 1 of the
238 replacement MEM_REF.) */
4502f5d0 239 tree cand_type;
240
241 /* The kind of candidate (CAND_MULT, etc.). */
242 enum cand_kind kind;
243
244 /* Index of this candidate in the candidate vector. */
245 cand_idx cand_num;
246
247 /* Index of the next candidate record for the same statement.
248 A statement may be useful in more than one way (e.g., due to
249 commutativity). So we can have multiple "interpretations"
250 of a statement. */
251 cand_idx next_interp;
252
253 /* Index of the basis statement S0, if any, in the candidate vector. */
254 cand_idx basis;
255
256 /* First candidate for which this candidate is a basis, if one exists. */
257 cand_idx dependent;
258
259 /* Next candidate having the same basis as this one. */
260 cand_idx sibling;
261
1168caca 262 /* If this is a conditional candidate, the CAND_PHI candidate
263 that defines the base SSA name B. */
264 cand_idx def_phi;
4502f5d0 265
266 /* Savings that can be expected from eliminating dead code if this
267 candidate is replaced. */
268 int dead_savings;
269};
270
271typedef struct slsr_cand_d slsr_cand, *slsr_cand_t;
272typedef const struct slsr_cand_d *const_slsr_cand_t;
273
274/* Pointers to candidates are chained together as part of a mapping
c99e471e 275 from base expressions to the candidates that use them. */
4502f5d0 276
277struct cand_chain_d
278{
c99e471e 279 /* Base expression for the chain of candidates: often, but not
280 always, an SSA name. */
281 tree base_expr;
4502f5d0 282
283 /* Pointer to a candidate. */
284 slsr_cand_t cand;
285
286 /* Chain pointer. */
287 struct cand_chain_d *next;
288
289};
290
291typedef struct cand_chain_d cand_chain, *cand_chain_t;
292typedef const struct cand_chain_d *const_cand_chain_t;
293
9ce0359e 294/* Information about a unique "increment" associated with candidates
295 having an SSA name for a stride. An increment is the difference
296 between the index of the candidate and the index of its basis,
297 i.e., (i - i') as discussed in the module commentary.
298
299 When we are not going to generate address arithmetic we treat
300 increments that differ only in sign as the same, allowing sharing
301 of the cost of initializers. The absolute value of the increment
302 is stored in the incr_info. */
303
304struct incr_info_d
305{
306 /* The increment that relates a candidate to its basis. */
307 double_int incr;
308
309 /* How many times the increment occurs in the candidate tree. */
310 unsigned count;
311
312 /* Cost of replacing candidates using this increment. Negative and
313 zero costs indicate replacement should be performed. */
314 int cost;
315
316 /* If this increment is profitable but is not -1, 0, or 1, it requires
317 an initializer T_0 = stride * incr to be found or introduced in the
318 nearest common dominator of all candidates. This field holds T_0
319 for subsequent use. */
320 tree initializer;
321
322 /* If the initializer was found to already exist, this is the block
323 where it was found. */
324 basic_block init_bb;
325};
326
327typedef struct incr_info_d incr_info, *incr_info_t;
328
4502f5d0 329/* Candidates are maintained in a vector. If candidate X dominates
330 candidate Y, then X appears before Y in the vector; but the
331 converse does not necessarily hold. */
f1f41a6c 332static vec<slsr_cand_t> cand_vec;
4502f5d0 333
334enum cost_consts
335{
336 COST_NEUTRAL = 0,
337 COST_INFINITE = 1000
338};
339
1168caca 340enum stride_status
341{
342 UNKNOWN_STRIDE = 0,
343 KNOWN_STRIDE = 1
344};
345
346enum phi_adjust_status
347{
348 NOT_PHI_ADJUST = 0,
349 PHI_ADJUST = 1
350};
351
352enum count_phis_status
353{
354 DONT_COUNT_PHIS = 0,
355 COUNT_PHIS = 1
356};
357
4502f5d0 358/* Pointer map embodying a mapping from statements to candidates. */
359static struct pointer_map_t *stmt_cand_map;
360
361/* Obstack for candidates. */
362static struct obstack cand_obstack;
363
4502f5d0 364/* Obstack for candidate chains. */
365static struct obstack chain_obstack;
9ce0359e 366
367/* An array INCR_VEC of incr_infos is used during analysis of related
368 candidates having an SSA name for a stride. INCR_VEC_LEN describes
d62a8480 369 its current length. MAX_INCR_VEC_LEN is used to avoid costly
370 pathological cases. */
9ce0359e 371static incr_info_t incr_vec;
372static unsigned incr_vec_len;
d62a8480 373const int MAX_INCR_VEC_LEN = 16;
9ce0359e 374
375/* For a chain of candidates with unknown stride, indicates whether or not
376 we must generate pointer arithmetic when replacing statements. */
377static bool address_arithmetic_p;
1168caca 378
379/* Forward function declarations. */
380static slsr_cand_t base_cand_from_table (tree);
d54ab372 381static tree introduce_cast_before_cand (slsr_cand_t, tree, tree);
4502f5d0 382\f
383/* Produce a pointer to the IDX'th candidate in the candidate vector. */
384
385static slsr_cand_t
386lookup_cand (cand_idx idx)
387{
f1f41a6c 388 return cand_vec[idx - 1];
4502f5d0 389}
390
d9dd21a8 391/* Helper for hashing a candidate chain header. */
070bf980 392
d9dd21a8 393struct cand_chain_hasher : typed_noop_remove <cand_chain>
070bf980 394{
d9dd21a8 395 typedef cand_chain value_type;
396 typedef cand_chain compare_type;
397 static inline hashval_t hash (const value_type *);
398 static inline bool equal (const value_type *, const compare_type *);
399};
070bf980 400
d9dd21a8 401inline hashval_t
402cand_chain_hasher::hash (const value_type *p)
070bf980 403{
d9dd21a8 404 tree base_expr = p->base_expr;
405 return iterative_hash_expr (base_expr, 0);
070bf980 406}
407
d9dd21a8 408inline bool
409cand_chain_hasher::equal (const value_type *chain1, const compare_type *chain2)
070bf980 410{
c99e471e 411 return operand_equal_p (chain1->base_expr, chain2->base_expr, 0);
070bf980 412}
d9dd21a8 413
414/* Hash table embodying a mapping from base exprs to chains of candidates. */
415static hash_table <cand_chain_hasher> base_cand_map;
070bf980 416\f
1168caca 417/* Look in the candidate table for a CAND_PHI that defines BASE and
8858a76d 418 return it if found; otherwise return NULL. */
4502f5d0 419
1168caca 420static cand_idx
8858a76d 421find_phi_def (tree base)
1168caca 422{
423 slsr_cand_t c;
424
425 if (TREE_CODE (base) != SSA_NAME)
426 return 0;
cebae8f7 427
1168caca 428 c = base_cand_from_table (base);
429
430 if (!c || c->kind != CAND_PHI)
431 return 0;
432
433 return c->cand_num;
434}
435
436/* Helper routine for find_basis_for_candidate. May be called twice:
437 once for the candidate's base expr, and optionally again for the
438 candidate's phi definition. */
439
440static slsr_cand_t
441find_basis_for_base_expr (slsr_cand_t c, tree base_expr)
4502f5d0 442{
070bf980 443 cand_chain mapping_key;
4502f5d0 444 cand_chain_t chain;
445 slsr_cand_t basis = NULL;
446
df4c32b3 447 // Limit potential of N^2 behavior for long candidate chains.
448 int iters = 0;
449 int max_iters = PARAM_VALUE (PARAM_MAX_SLSR_CANDIDATE_SCAN);
450
1168caca 451 mapping_key.base_expr = base_expr;
d9dd21a8 452 chain = base_cand_map.find (&mapping_key);
4502f5d0 453
df4c32b3 454 for (; chain && iters < max_iters; chain = chain->next, ++iters)
4502f5d0 455 {
456 slsr_cand_t one_basis = chain->cand;
457
458 if (one_basis->kind != c->kind
9cc0ec41 459 || one_basis->cand_stmt == c->cand_stmt
4502f5d0 460 || !operand_equal_p (one_basis->stride, c->stride, 0)
461 || !types_compatible_p (one_basis->cand_type, c->cand_type)
462 || !dominated_by_p (CDI_DOMINATORS,
463 gimple_bb (c->cand_stmt),
464 gimple_bb (one_basis->cand_stmt)))
465 continue;
466
467 if (!basis || basis->cand_num < one_basis->cand_num)
468 basis = one_basis;
469 }
470
1168caca 471 return basis;
472}
473
474/* Use the base expr from candidate C to look for possible candidates
475 that can serve as a basis for C. Each potential basis must also
476 appear in a block that dominates the candidate statement and have
477 the same stride and type. If more than one possible basis exists,
478 the one with highest index in the vector is chosen; this will be
479 the most immediately dominating basis. */
480
481static int
482find_basis_for_candidate (slsr_cand_t c)
483{
484 slsr_cand_t basis = find_basis_for_base_expr (c, c->base_expr);
485
486 /* If a candidate doesn't have a basis using its base expression,
487 it may have a basis hidden by one or more intervening phis. */
488 if (!basis && c->def_phi)
489 {
490 basic_block basis_bb, phi_bb;
491 slsr_cand_t phi_cand = lookup_cand (c->def_phi);
492 basis = find_basis_for_base_expr (c, phi_cand->base_expr);
493
494 if (basis)
495 {
496 /* A hidden basis must dominate the phi-definition of the
497 candidate's base name. */
498 phi_bb = gimple_bb (phi_cand->cand_stmt);
499 basis_bb = gimple_bb (basis->cand_stmt);
500
501 if (phi_bb == basis_bb
502 || !dominated_by_p (CDI_DOMINATORS, phi_bb, basis_bb))
503 {
504 basis = NULL;
505 c->basis = 0;
506 }
507
508 /* If we found a hidden basis, estimate additional dead-code
509 savings if the phi and its feeding statements can be removed. */
510 if (basis && has_single_use (gimple_phi_result (phi_cand->cand_stmt)))
511 c->dead_savings += phi_cand->dead_savings;
512 }
513 }
514
4502f5d0 515 if (basis)
516 {
517 c->sibling = basis->dependent;
518 basis->dependent = c->cand_num;
519 return basis->cand_num;
520 }
521
522 return 0;
523}
524
c99e471e 525/* Record a mapping from the base expression of C to C itself, indicating that
526 C may potentially serve as a basis using that base expression. */
4502f5d0 527
528static void
529record_potential_basis (slsr_cand_t c)
530{
070bf980 531 cand_chain_t node;
d9dd21a8 532 cand_chain **slot;
4502f5d0 533
534 node = (cand_chain_t) obstack_alloc (&chain_obstack, sizeof (cand_chain));
c99e471e 535 node->base_expr = c->base_expr;
4502f5d0 536 node->cand = c;
537 node->next = NULL;
d9dd21a8 538 slot = base_cand_map.find_slot (node, INSERT);
4502f5d0 539
070bf980 540 if (*slot)
4502f5d0 541 {
070bf980 542 cand_chain_t head = (cand_chain_t) (*slot);
4502f5d0 543 node->next = head->next;
544 head->next = node;
545 }
546 else
070bf980 547 *slot = node;
4502f5d0 548}
549
550/* Allocate storage for a new candidate and initialize its fields.
551 Attempt to find a basis for the candidate. */
552
553static slsr_cand_t
554alloc_cand_and_find_basis (enum cand_kind kind, gimple gs, tree base,
555 double_int index, tree stride, tree ctype,
556 unsigned savings)
557{
558 slsr_cand_t c = (slsr_cand_t) obstack_alloc (&cand_obstack,
559 sizeof (slsr_cand));
560 c->cand_stmt = gs;
c99e471e 561 c->base_expr = base;
4502f5d0 562 c->stride = stride;
563 c->index = index;
564 c->cand_type = ctype;
565 c->kind = kind;
f1f41a6c 566 c->cand_num = cand_vec.length () + 1;
4502f5d0 567 c->next_interp = 0;
568 c->dependent = 0;
569 c->sibling = 0;
8858a76d 570 c->def_phi = kind == CAND_MULT ? find_phi_def (base) : 0;
4502f5d0 571 c->dead_savings = savings;
572
f1f41a6c 573 cand_vec.safe_push (c);
1168caca 574
575 if (kind == CAND_PHI)
576 c->basis = 0;
577 else
578 c->basis = find_basis_for_candidate (c);
579
4502f5d0 580 record_potential_basis (c);
581
582 return c;
583}
584
585/* Determine the target cost of statement GS when compiling according
586 to SPEED. */
587
588static int
589stmt_cost (gimple gs, bool speed)
590{
591 tree lhs, rhs1, rhs2;
592 enum machine_mode lhs_mode;
593
594 gcc_assert (is_gimple_assign (gs));
595 lhs = gimple_assign_lhs (gs);
596 rhs1 = gimple_assign_rhs1 (gs);
597 lhs_mode = TYPE_MODE (TREE_TYPE (lhs));
598
599 switch (gimple_assign_rhs_code (gs))
600 {
601 case MULT_EXPR:
602 rhs2 = gimple_assign_rhs2 (gs);
603
604 if (host_integerp (rhs2, 0))
72655676 605 return mult_by_coeff_cost (TREE_INT_CST_LOW (rhs2), lhs_mode, speed);
4502f5d0 606
607 gcc_assert (TREE_CODE (rhs1) != INTEGER_CST);
49a71e58 608 return mul_cost (speed, lhs_mode);
4502f5d0 609
610 case PLUS_EXPR:
611 case POINTER_PLUS_EXPR:
612 case MINUS_EXPR:
49a71e58 613 return add_cost (speed, lhs_mode);
4502f5d0 614
615 case NEGATE_EXPR:
49a71e58 616 return neg_cost (speed, lhs_mode);
4502f5d0 617
618 case NOP_EXPR:
72655676 619 return convert_cost (lhs_mode, TYPE_MODE (TREE_TYPE (rhs1)), speed);
4502f5d0 620
621 /* Note that we don't assign costs to copies that in most cases
622 will go away. */
623 default:
624 ;
625 }
626
627 gcc_unreachable ();
628 return 0;
629}
630
631/* Look up the defining statement for BASE_IN and return a pointer
632 to its candidate in the candidate table, if any; otherwise NULL.
633 Only CAND_ADD and CAND_MULT candidates are returned. */
634
635static slsr_cand_t
636base_cand_from_table (tree base_in)
637{
638 slsr_cand_t *result;
639
640 gimple def = SSA_NAME_DEF_STMT (base_in);
641 if (!def)
642 return (slsr_cand_t) NULL;
643
644 result = (slsr_cand_t *) pointer_map_contains (stmt_cand_map, def);
070bf980 645
646 if (result && (*result)->kind != CAND_REF)
647 return *result;
4502f5d0 648
070bf980 649 return (slsr_cand_t) NULL;
4502f5d0 650}
651
652/* Add an entry to the statement-to-candidate mapping. */
653
654static void
655add_cand_for_stmt (gimple gs, slsr_cand_t c)
656{
657 void **slot = pointer_map_insert (stmt_cand_map, gs);
658 gcc_assert (!*slot);
659 *slot = c;
660}
661\f
1168caca 662/* Given PHI which contains a phi statement, determine whether it
663 satisfies all the requirements of a phi candidate. If so, create
664 a candidate. Note that a CAND_PHI never has a basis itself, but
665 is used to help find a basis for subsequent candidates. */
666
667static void
668slsr_process_phi (gimple phi, bool speed)
669{
670 unsigned i;
671 tree arg0_base = NULL_TREE, base_type;
672 slsr_cand_t c;
673 struct loop *cand_loop = gimple_bb (phi)->loop_father;
674 unsigned savings = 0;
675
676 /* A CAND_PHI requires each of its arguments to have the same
677 derived base name. (See the module header commentary for a
678 definition of derived base names.) Furthermore, all feeding
679 definitions must be in the same position in the loop hierarchy
680 as PHI. */
681
682 for (i = 0; i < gimple_phi_num_args (phi); i++)
683 {
684 slsr_cand_t arg_cand;
685 tree arg = gimple_phi_arg_def (phi, i);
686 tree derived_base_name = NULL_TREE;
687 gimple arg_stmt = NULL;
688 basic_block arg_bb = NULL;
689
690 if (TREE_CODE (arg) != SSA_NAME)
691 return;
692
693 arg_cand = base_cand_from_table (arg);
694
695 if (arg_cand)
696 {
697 while (arg_cand->kind != CAND_ADD && arg_cand->kind != CAND_PHI)
698 {
699 if (!arg_cand->next_interp)
700 return;
701
702 arg_cand = lookup_cand (arg_cand->next_interp);
703 }
704
705 if (!integer_onep (arg_cand->stride))
706 return;
707
708 derived_base_name = arg_cand->base_expr;
709 arg_stmt = arg_cand->cand_stmt;
710 arg_bb = gimple_bb (arg_stmt);
711
712 /* Gather potential dead code savings if the phi statement
713 can be removed later on. */
714 if (has_single_use (arg))
715 {
716 if (gimple_code (arg_stmt) == GIMPLE_PHI)
717 savings += arg_cand->dead_savings;
718 else
719 savings += stmt_cost (arg_stmt, speed);
720 }
721 }
722 else
723 {
724 derived_base_name = arg;
725
726 if (SSA_NAME_IS_DEFAULT_DEF (arg))
727 arg_bb = single_succ (ENTRY_BLOCK_PTR);
728 else
729 gimple_bb (SSA_NAME_DEF_STMT (arg));
730 }
731
732 if (!arg_bb || arg_bb->loop_father != cand_loop)
733 return;
734
735 if (i == 0)
736 arg0_base = derived_base_name;
737 else if (!operand_equal_p (derived_base_name, arg0_base, 0))
738 return;
739 }
740
741 /* Create the candidate. "alloc_cand_and_find_basis" is named
742 misleadingly for this case, as no basis will be sought for a
743 CAND_PHI. */
744 base_type = TREE_TYPE (arg0_base);
745
746 c = alloc_cand_and_find_basis (CAND_PHI, phi, arg0_base, double_int_zero,
747 integer_one_node, base_type, savings);
748
749 /* Add the candidate to the statement-candidate mapping. */
750 add_cand_for_stmt (phi, c);
751}
752
070bf980 753/* Look for the following pattern:
754
755 *PBASE: MEM_REF (T1, C1)
756
757 *POFFSET: MULT_EXPR (T2, C3) [C2 is zero]
758 or
759 MULT_EXPR (PLUS_EXPR (T2, C2), C3)
760 or
761 MULT_EXPR (MINUS_EXPR (T2, -C2), C3)
762
763 *PINDEX: C4 * BITS_PER_UNIT
764
765 If not present, leave the input values unchanged and return FALSE.
766 Otherwise, modify the input values as follows and return TRUE:
767
768 *PBASE: T1
769 *POFFSET: MULT_EXPR (T2, C3)
770 *PINDEX: C1 + (C2 * C3) + C4 */
771
772static bool
773restructure_reference (tree *pbase, tree *poffset, double_int *pindex,
774 tree *ptype)
775{
776 tree base = *pbase, offset = *poffset;
777 double_int index = *pindex;
cf8f0e63 778 double_int bpu = double_int::from_uhwi (BITS_PER_UNIT);
070bf980 779 tree mult_op0, mult_op1, t1, t2, type;
780 double_int c1, c2, c3, c4;
781
782 if (!base
783 || !offset
784 || TREE_CODE (base) != MEM_REF
785 || TREE_CODE (offset) != MULT_EXPR
786 || TREE_CODE (TREE_OPERAND (offset, 1)) != INTEGER_CST
cf8f0e63 787 || !index.umod (bpu, FLOOR_MOD_EXPR).is_zero ())
070bf980 788 return false;
789
790 t1 = TREE_OPERAND (base, 0);
791 c1 = mem_ref_offset (base);
792 type = TREE_TYPE (TREE_OPERAND (base, 1));
793
794 mult_op0 = TREE_OPERAND (offset, 0);
795 mult_op1 = TREE_OPERAND (offset, 1);
796
797 c3 = tree_to_double_int (mult_op1);
798
799 if (TREE_CODE (mult_op0) == PLUS_EXPR)
800
801 if (TREE_CODE (TREE_OPERAND (mult_op0, 1)) == INTEGER_CST)
802 {
803 t2 = TREE_OPERAND (mult_op0, 0);
804 c2 = tree_to_double_int (TREE_OPERAND (mult_op0, 1));
805 }
806 else
807 return false;
808
809 else if (TREE_CODE (mult_op0) == MINUS_EXPR)
810
811 if (TREE_CODE (TREE_OPERAND (mult_op0, 1)) == INTEGER_CST)
812 {
813 t2 = TREE_OPERAND (mult_op0, 0);
cf8f0e63 814 c2 = -tree_to_double_int (TREE_OPERAND (mult_op0, 1));
070bf980 815 }
816 else
817 return false;
818
819 else
820 {
821 t2 = mult_op0;
822 c2 = double_int_zero;
823 }
824
cf8f0e63 825 c4 = index.udiv (bpu, FLOOR_DIV_EXPR);
070bf980 826
827 *pbase = t1;
828 *poffset = fold_build2 (MULT_EXPR, sizetype, t2,
829 double_int_to_tree (sizetype, c3));
cf8f0e63 830 *pindex = c1 + c2 * c3 + c4;
070bf980 831 *ptype = type;
832
833 return true;
834}
835
836/* Given GS which contains a data reference, create a CAND_REF entry in
837 the candidate table and attempt to find a basis. */
838
839static void
840slsr_process_ref (gimple gs)
841{
842 tree ref_expr, base, offset, type;
843 HOST_WIDE_INT bitsize, bitpos;
844 enum machine_mode mode;
845 int unsignedp, volatilep;
846 double_int index;
847 slsr_cand_t c;
848
849 if (gimple_vdef (gs))
850 ref_expr = gimple_assign_lhs (gs);
851 else
852 ref_expr = gimple_assign_rhs1 (gs);
853
854 if (!handled_component_p (ref_expr)
855 || TREE_CODE (ref_expr) == BIT_FIELD_REF
856 || (TREE_CODE (ref_expr) == COMPONENT_REF
857 && DECL_BIT_FIELD (TREE_OPERAND (ref_expr, 1))))
858 return;
859
860 base = get_inner_reference (ref_expr, &bitsize, &bitpos, &offset, &mode,
861 &unsignedp, &volatilep, false);
cf8f0e63 862 index = double_int::from_uhwi (bitpos);
070bf980 863
864 if (!restructure_reference (&base, &offset, &index, &type))
865 return;
866
867 c = alloc_cand_and_find_basis (CAND_REF, gs, base, index, offset,
868 type, 0);
869
870 /* Add the candidate to the statement-candidate mapping. */
871 add_cand_for_stmt (gs, c);
872}
873
4502f5d0 874/* Create a candidate entry for a statement GS, where GS multiplies
875 two SSA names BASE_IN and STRIDE_IN. Propagate any known information
876 about the two SSA names into the new candidate. Return the new
877 candidate. */
878
879static slsr_cand_t
880create_mul_ssa_cand (gimple gs, tree base_in, tree stride_in, bool speed)
881{
882 tree base = NULL_TREE, stride = NULL_TREE, ctype = NULL_TREE;
883 double_int index;
884 unsigned savings = 0;
885 slsr_cand_t c;
886 slsr_cand_t base_cand = base_cand_from_table (base_in);
887
888 /* Look at all interpretations of the base candidate, if necessary,
889 to find information to propagate into this candidate. */
1168caca 890 while (base_cand && !base && base_cand->kind != CAND_PHI)
4502f5d0 891 {
892
1168caca 893 if (base_cand->kind == CAND_MULT && integer_onep (base_cand->stride))
4502f5d0 894 {
895 /* Y = (B + i') * 1
896 X = Y * Z
897 ================
898 X = (B + i') * Z */
c99e471e 899 base = base_cand->base_expr;
4502f5d0 900 index = base_cand->index;
901 stride = stride_in;
902 ctype = base_cand->cand_type;
903 if (has_single_use (base_in))
904 savings = (base_cand->dead_savings
905 + stmt_cost (base_cand->cand_stmt, speed));
906 }
907 else if (base_cand->kind == CAND_ADD
908 && TREE_CODE (base_cand->stride) == INTEGER_CST)
909 {
910 /* Y = B + (i' * S), S constant
911 X = Y * Z
912 ============================
913 X = B + ((i' * S) * Z) */
c99e471e 914 base = base_cand->base_expr;
cf8f0e63 915 index = base_cand->index * tree_to_double_int (base_cand->stride);
4502f5d0 916 stride = stride_in;
917 ctype = base_cand->cand_type;
918 if (has_single_use (base_in))
919 savings = (base_cand->dead_savings
920 + stmt_cost (base_cand->cand_stmt, speed));
921 }
922
923 if (base_cand->next_interp)
924 base_cand = lookup_cand (base_cand->next_interp);
925 else
926 base_cand = NULL;
927 }
928
929 if (!base)
930 {
931 /* No interpretations had anything useful to propagate, so
932 produce X = (Y + 0) * Z. */
933 base = base_in;
934 index = double_int_zero;
935 stride = stride_in;
3b652cc1 936 ctype = TREE_TYPE (base_in);
4502f5d0 937 }
938
939 c = alloc_cand_and_find_basis (CAND_MULT, gs, base, index, stride,
940 ctype, savings);
941 return c;
942}
943
944/* Create a candidate entry for a statement GS, where GS multiplies
945 SSA name BASE_IN by constant STRIDE_IN. Propagate any known
946 information about BASE_IN into the new candidate. Return the new
947 candidate. */
948
949static slsr_cand_t
950create_mul_imm_cand (gimple gs, tree base_in, tree stride_in, bool speed)
951{
952 tree base = NULL_TREE, stride = NULL_TREE, ctype = NULL_TREE;
953 double_int index, temp;
954 unsigned savings = 0;
955 slsr_cand_t c;
956 slsr_cand_t base_cand = base_cand_from_table (base_in);
957
958 /* Look at all interpretations of the base candidate, if necessary,
959 to find information to propagate into this candidate. */
1168caca 960 while (base_cand && !base && base_cand->kind != CAND_PHI)
4502f5d0 961 {
962 if (base_cand->kind == CAND_MULT
963 && TREE_CODE (base_cand->stride) == INTEGER_CST)
964 {
965 /* Y = (B + i') * S, S constant
966 X = Y * c
967 ============================
968 X = (B + i') * (S * c) */
c99e471e 969 base = base_cand->base_expr;
4502f5d0 970 index = base_cand->index;
cf8f0e63 971 temp = tree_to_double_int (base_cand->stride)
972 * tree_to_double_int (stride_in);
4502f5d0 973 stride = double_int_to_tree (TREE_TYPE (stride_in), temp);
974 ctype = base_cand->cand_type;
975 if (has_single_use (base_in))
976 savings = (base_cand->dead_savings
977 + stmt_cost (base_cand->cand_stmt, speed));
978 }
1168caca 979 else if (base_cand->kind == CAND_ADD && integer_onep (base_cand->stride))
4502f5d0 980 {
981 /* Y = B + (i' * 1)
982 X = Y * c
983 ===========================
984 X = (B + i') * c */
c99e471e 985 base = base_cand->base_expr;
4502f5d0 986 index = base_cand->index;
987 stride = stride_in;
988 ctype = base_cand->cand_type;
989 if (has_single_use (base_in))
990 savings = (base_cand->dead_savings
991 + stmt_cost (base_cand->cand_stmt, speed));
992 }
993 else if (base_cand->kind == CAND_ADD
cf8f0e63 994 && base_cand->index.is_one ()
4502f5d0 995 && TREE_CODE (base_cand->stride) == INTEGER_CST)
996 {
997 /* Y = B + (1 * S), S constant
998 X = Y * c
999 ===========================
1000 X = (B + S) * c */
c99e471e 1001 base = base_cand->base_expr;
4502f5d0 1002 index = tree_to_double_int (base_cand->stride);
1003 stride = stride_in;
1004 ctype = base_cand->cand_type;
1005 if (has_single_use (base_in))
1006 savings = (base_cand->dead_savings
1007 + stmt_cost (base_cand->cand_stmt, speed));
1008 }
1009
1010 if (base_cand->next_interp)
1011 base_cand = lookup_cand (base_cand->next_interp);
1012 else
1013 base_cand = NULL;
1014 }
1015
1016 if (!base)
1017 {
1018 /* No interpretations had anything useful to propagate, so
1019 produce X = (Y + 0) * c. */
1020 base = base_in;
1021 index = double_int_zero;
1022 stride = stride_in;
3b652cc1 1023 ctype = TREE_TYPE (base_in);
4502f5d0 1024 }
1025
1026 c = alloc_cand_and_find_basis (CAND_MULT, gs, base, index, stride,
1027 ctype, savings);
1028 return c;
1029}
1030
1031/* Given GS which is a multiply of scalar integers, make an appropriate
1032 entry in the candidate table. If this is a multiply of two SSA names,
1033 create two CAND_MULT interpretations and attempt to find a basis for
1034 each of them. Otherwise, create a single CAND_MULT and attempt to
1035 find a basis. */
1036
1037static void
1038slsr_process_mul (gimple gs, tree rhs1, tree rhs2, bool speed)
1039{
1040 slsr_cand_t c, c2;
1041
1042 /* If this is a multiply of an SSA name with itself, it is highly
1043 unlikely that we will get a strength reduction opportunity, so
1044 don't record it as a candidate. This simplifies the logic for
1045 finding a basis, so if this is removed that must be considered. */
1046 if (rhs1 == rhs2)
1047 return;
1048
1049 if (TREE_CODE (rhs2) == SSA_NAME)
1050 {
1051 /* Record an interpretation of this statement in the candidate table
c99e471e 1052 assuming RHS1 is the base expression and RHS2 is the stride. */
4502f5d0 1053 c = create_mul_ssa_cand (gs, rhs1, rhs2, speed);
1054
1055 /* Add the first interpretation to the statement-candidate mapping. */
1056 add_cand_for_stmt (gs, c);
1057
1058 /* Record another interpretation of this statement assuming RHS1
c99e471e 1059 is the stride and RHS2 is the base expression. */
4502f5d0 1060 c2 = create_mul_ssa_cand (gs, rhs2, rhs1, speed);
1061 c->next_interp = c2->cand_num;
1062 }
1063 else
1064 {
1065 /* Record an interpretation for the multiply-immediate. */
1066 c = create_mul_imm_cand (gs, rhs1, rhs2, speed);
1067
1068 /* Add the interpretation to the statement-candidate mapping. */
1069 add_cand_for_stmt (gs, c);
1070 }
1071}
1072
1073/* Create a candidate entry for a statement GS, where GS adds two
1074 SSA names BASE_IN and ADDEND_IN if SUBTRACT_P is false, and
1075 subtracts ADDEND_IN from BASE_IN otherwise. Propagate any known
1076 information about the two SSA names into the new candidate.
1077 Return the new candidate. */
1078
1079static slsr_cand_t
1080create_add_ssa_cand (gimple gs, tree base_in, tree addend_in,
1081 bool subtract_p, bool speed)
1082{
1083 tree base = NULL_TREE, stride = NULL_TREE, ctype = NULL;
1084 double_int index;
1085 unsigned savings = 0;
1086 slsr_cand_t c;
1087 slsr_cand_t base_cand = base_cand_from_table (base_in);
1088 slsr_cand_t addend_cand = base_cand_from_table (addend_in);
1089
1090 /* The most useful transformation is a multiply-immediate feeding
1091 an add or subtract. Look for that first. */
1168caca 1092 while (addend_cand && !base && addend_cand->kind != CAND_PHI)
4502f5d0 1093 {
1094 if (addend_cand->kind == CAND_MULT
cf8f0e63 1095 && addend_cand->index.is_zero ()
4502f5d0 1096 && TREE_CODE (addend_cand->stride) == INTEGER_CST)
1097 {
1098 /* Z = (B + 0) * S, S constant
1099 X = Y +/- Z
1100 ===========================
1101 X = Y + ((+/-1 * S) * B) */
1102 base = base_in;
1103 index = tree_to_double_int (addend_cand->stride);
1104 if (subtract_p)
cf8f0e63 1105 index = -index;
c99e471e 1106 stride = addend_cand->base_expr;
3b652cc1 1107 ctype = TREE_TYPE (base_in);
4502f5d0 1108 if (has_single_use (addend_in))
1109 savings = (addend_cand->dead_savings
1110 + stmt_cost (addend_cand->cand_stmt, speed));
1111 }
1112
1113 if (addend_cand->next_interp)
1114 addend_cand = lookup_cand (addend_cand->next_interp);
1115 else
1116 addend_cand = NULL;
1117 }
1118
1168caca 1119 while (base_cand && !base && base_cand->kind != CAND_PHI)
4502f5d0 1120 {
1121 if (base_cand->kind == CAND_ADD
cf8f0e63 1122 && (base_cand->index.is_zero ()
4502f5d0 1123 || operand_equal_p (base_cand->stride,
1124 integer_zero_node, 0)))
1125 {
1126 /* Y = B + (i' * S), i' * S = 0
1127 X = Y +/- Z
1128 ============================
1129 X = B + (+/-1 * Z) */
c99e471e 1130 base = base_cand->base_expr;
4502f5d0 1131 index = subtract_p ? double_int_minus_one : double_int_one;
1132 stride = addend_in;
1133 ctype = base_cand->cand_type;
1134 if (has_single_use (base_in))
1135 savings = (base_cand->dead_savings
1136 + stmt_cost (base_cand->cand_stmt, speed));
1137 }
1138 else if (subtract_p)
1139 {
1140 slsr_cand_t subtrahend_cand = base_cand_from_table (addend_in);
1141
1168caca 1142 while (subtrahend_cand && !base && subtrahend_cand->kind != CAND_PHI)
4502f5d0 1143 {
1144 if (subtrahend_cand->kind == CAND_MULT
cf8f0e63 1145 && subtrahend_cand->index.is_zero ()
4502f5d0 1146 && TREE_CODE (subtrahend_cand->stride) == INTEGER_CST)
1147 {
1148 /* Z = (B + 0) * S, S constant
1149 X = Y - Z
1150 ===========================
1151 Value: X = Y + ((-1 * S) * B) */
1152 base = base_in;
1153 index = tree_to_double_int (subtrahend_cand->stride);
cf8f0e63 1154 index = -index;
c99e471e 1155 stride = subtrahend_cand->base_expr;
3b652cc1 1156 ctype = TREE_TYPE (base_in);
4502f5d0 1157 if (has_single_use (addend_in))
1158 savings = (subtrahend_cand->dead_savings
1159 + stmt_cost (subtrahend_cand->cand_stmt, speed));
1160 }
1161
1162 if (subtrahend_cand->next_interp)
1163 subtrahend_cand = lookup_cand (subtrahend_cand->next_interp);
1164 else
1165 subtrahend_cand = NULL;
1166 }
1167 }
1168
1169 if (base_cand->next_interp)
1170 base_cand = lookup_cand (base_cand->next_interp);
1171 else
1172 base_cand = NULL;
1173 }
1174
1175 if (!base)
1176 {
1177 /* No interpretations had anything useful to propagate, so
1178 produce X = Y + (1 * Z). */
1179 base = base_in;
1180 index = subtract_p ? double_int_minus_one : double_int_one;
1181 stride = addend_in;
3b652cc1 1182 ctype = TREE_TYPE (base_in);
4502f5d0 1183 }
1184
1185 c = alloc_cand_and_find_basis (CAND_ADD, gs, base, index, stride,
1186 ctype, savings);
1187 return c;
1188}
1189
1190/* Create a candidate entry for a statement GS, where GS adds SSA
1191 name BASE_IN to constant INDEX_IN. Propagate any known information
1192 about BASE_IN into the new candidate. Return the new candidate. */
1193
1194static slsr_cand_t
1195create_add_imm_cand (gimple gs, tree base_in, double_int index_in, bool speed)
1196{
1197 enum cand_kind kind = CAND_ADD;
1198 tree base = NULL_TREE, stride = NULL_TREE, ctype = NULL_TREE;
1199 double_int index, multiple;
1200 unsigned savings = 0;
1201 slsr_cand_t c;
1202 slsr_cand_t base_cand = base_cand_from_table (base_in);
1203
1168caca 1204 while (base_cand && !base && base_cand->kind != CAND_PHI)
4502f5d0 1205 {
1206 bool unsigned_p = TYPE_UNSIGNED (TREE_TYPE (base_cand->stride));
1207
1208 if (TREE_CODE (base_cand->stride) == INTEGER_CST
cf8f0e63 1209 && index_in.multiple_of (tree_to_double_int (base_cand->stride),
1210 unsigned_p, &multiple))
4502f5d0 1211 {
1212 /* Y = (B + i') * S, S constant, c = kS for some integer k
1213 X = Y + c
1214 ============================
1215 X = (B + (i'+ k)) * S
1216 OR
1217 Y = B + (i' * S), S constant, c = kS for some integer k
1218 X = Y + c
1219 ============================
1220 X = (B + (i'+ k)) * S */
1221 kind = base_cand->kind;
c99e471e 1222 base = base_cand->base_expr;
cf8f0e63 1223 index = base_cand->index + multiple;
4502f5d0 1224 stride = base_cand->stride;
1225 ctype = base_cand->cand_type;
1226 if (has_single_use (base_in))
1227 savings = (base_cand->dead_savings
1228 + stmt_cost (base_cand->cand_stmt, speed));
1229 }
1230
1231 if (base_cand->next_interp)
1232 base_cand = lookup_cand (base_cand->next_interp);
1233 else
1234 base_cand = NULL;
1235 }
1236
1237 if (!base)
1238 {
1239 /* No interpretations had anything useful to propagate, so
1240 produce X = Y + (c * 1). */
1241 kind = CAND_ADD;
1242 base = base_in;
1243 index = index_in;
1244 stride = integer_one_node;
3b652cc1 1245 ctype = TREE_TYPE (base_in);
4502f5d0 1246 }
1247
1248 c = alloc_cand_and_find_basis (kind, gs, base, index, stride,
1249 ctype, savings);
1250 return c;
1251}
1252
1253/* Given GS which is an add or subtract of scalar integers or pointers,
1254 make at least one appropriate entry in the candidate table. */
1255
1256static void
1257slsr_process_add (gimple gs, tree rhs1, tree rhs2, bool speed)
1258{
1259 bool subtract_p = gimple_assign_rhs_code (gs) == MINUS_EXPR;
1260 slsr_cand_t c = NULL, c2;
1261
1262 if (TREE_CODE (rhs2) == SSA_NAME)
1263 {
c99e471e 1264 /* First record an interpretation assuming RHS1 is the base expression
4502f5d0 1265 and RHS2 is the stride. But it doesn't make sense for the
1266 stride to be a pointer, so don't record a candidate in that case. */
3b652cc1 1267 if (!POINTER_TYPE_P (TREE_TYPE (rhs2)))
4502f5d0 1268 {
1269 c = create_add_ssa_cand (gs, rhs1, rhs2, subtract_p, speed);
1270
1271 /* Add the first interpretation to the statement-candidate
1272 mapping. */
1273 add_cand_for_stmt (gs, c);
1274 }
1275
1276 /* If the two RHS operands are identical, or this is a subtract,
1277 we're done. */
1278 if (operand_equal_p (rhs1, rhs2, 0) || subtract_p)
1279 return;
1280
1281 /* Otherwise, record another interpretation assuming RHS2 is the
c99e471e 1282 base expression and RHS1 is the stride, again provided that the
4502f5d0 1283 stride is not a pointer. */
3b652cc1 1284 if (!POINTER_TYPE_P (TREE_TYPE (rhs1)))
4502f5d0 1285 {
1286 c2 = create_add_ssa_cand (gs, rhs2, rhs1, false, speed);
1287 if (c)
1288 c->next_interp = c2->cand_num;
1289 else
1290 add_cand_for_stmt (gs, c2);
1291 }
1292 }
1293 else
1294 {
1295 double_int index;
1296
1297 /* Record an interpretation for the add-immediate. */
1298 index = tree_to_double_int (rhs2);
1299 if (subtract_p)
cf8f0e63 1300 index = -index;
4502f5d0 1301
1302 c = create_add_imm_cand (gs, rhs1, index, speed);
1303
1304 /* Add the interpretation to the statement-candidate mapping. */
1305 add_cand_for_stmt (gs, c);
1306 }
1307}
1308
1309/* Given GS which is a negate of a scalar integer, make an appropriate
1310 entry in the candidate table. A negate is equivalent to a multiply
1311 by -1. */
1312
1313static void
1314slsr_process_neg (gimple gs, tree rhs1, bool speed)
1315{
1316 /* Record a CAND_MULT interpretation for the multiply by -1. */
1317 slsr_cand_t c = create_mul_imm_cand (gs, rhs1, integer_minus_one_node, speed);
1318
1319 /* Add the interpretation to the statement-candidate mapping. */
1320 add_cand_for_stmt (gs, c);
1321}
1322
38304570 1323/* Help function for legal_cast_p, operating on two trees. Checks
1324 whether it's allowable to cast from RHS to LHS. See legal_cast_p
1325 for more details. */
1326
1327static bool
1328legal_cast_p_1 (tree lhs, tree rhs)
1329{
1330 tree lhs_type, rhs_type;
1331 unsigned lhs_size, rhs_size;
1332 bool lhs_wraps, rhs_wraps;
1333
1334 lhs_type = TREE_TYPE (lhs);
1335 rhs_type = TREE_TYPE (rhs);
1336 lhs_size = TYPE_PRECISION (lhs_type);
1337 rhs_size = TYPE_PRECISION (rhs_type);
1338 lhs_wraps = TYPE_OVERFLOW_WRAPS (lhs_type);
1339 rhs_wraps = TYPE_OVERFLOW_WRAPS (rhs_type);
1340
1341 if (lhs_size < rhs_size
1342 || (rhs_wraps && !lhs_wraps)
1343 || (rhs_wraps && lhs_wraps && rhs_size != lhs_size))
1344 return false;
1345
1346 return true;
1347}
1348
4502f5d0 1349/* Return TRUE if GS is a statement that defines an SSA name from
1350 a conversion and is legal for us to combine with an add and multiply
1351 in the candidate table. For example, suppose we have:
1352
1353 A = B + i;
1354 C = (type) A;
1355 D = C * S;
1356
1357 Without the type-cast, we would create a CAND_MULT for D with base B,
1358 index i, and stride S. We want to record this candidate only if it
1359 is equivalent to apply the type cast following the multiply:
1360
1361 A = B + i;
1362 E = A * S;
1363 D = (type) E;
1364
1365 We will record the type with the candidate for D. This allows us
1366 to use a similar previous candidate as a basis. If we have earlier seen
1367
1368 A' = B + i';
1369 C' = (type) A';
1370 D' = C' * S;
1371
1372 we can replace D with
1373
1374 D = D' + (i - i') * S;
1375
1376 But if moving the type-cast would change semantics, we mustn't do this.
1377
1378 This is legitimate for casts from a non-wrapping integral type to
1379 any integral type of the same or larger size. It is not legitimate
1380 to convert a wrapping type to a non-wrapping type, or to a wrapping
1381 type of a different size. I.e., with a wrapping type, we must
1382 assume that the addition B + i could wrap, in which case performing
1383 the multiply before or after one of the "illegal" type casts will
1384 have different semantics. */
1385
1386static bool
1387legal_cast_p (gimple gs, tree rhs)
1388{
4502f5d0 1389 if (!is_gimple_assign (gs)
1390 || !CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (gs)))
1391 return false;
1392
38304570 1393 return legal_cast_p_1 (gimple_assign_lhs (gs), rhs);
4502f5d0 1394}
1395
1396/* Given GS which is a cast to a scalar integer type, determine whether
1397 the cast is legal for strength reduction. If so, make at least one
1398 appropriate entry in the candidate table. */
1399
1400static void
1401slsr_process_cast (gimple gs, tree rhs1, bool speed)
1402{
1403 tree lhs, ctype;
1404 slsr_cand_t base_cand, c, c2;
1405 unsigned savings = 0;
1406
1407 if (!legal_cast_p (gs, rhs1))
1408 return;
1409
1410 lhs = gimple_assign_lhs (gs);
1411 base_cand = base_cand_from_table (rhs1);
1412 ctype = TREE_TYPE (lhs);
1413
1168caca 1414 if (base_cand && base_cand->kind != CAND_PHI)
4502f5d0 1415 {
1416 while (base_cand)
1417 {
1418 /* Propagate all data from the base candidate except the type,
1419 which comes from the cast, and the base candidate's cast,
1420 which is no longer applicable. */
1421 if (has_single_use (rhs1))
1422 savings = (base_cand->dead_savings
1423 + stmt_cost (base_cand->cand_stmt, speed));
1424
1425 c = alloc_cand_and_find_basis (base_cand->kind, gs,
c99e471e 1426 base_cand->base_expr,
4502f5d0 1427 base_cand->index, base_cand->stride,
1428 ctype, savings);
1429 if (base_cand->next_interp)
1430 base_cand = lookup_cand (base_cand->next_interp);
1431 else
1432 base_cand = NULL;
1433 }
1434 }
1435 else
1436 {
1437 /* If nothing is known about the RHS, create fresh CAND_ADD and
1438 CAND_MULT interpretations:
1439
1440 X = Y + (0 * 1)
1441 X = (Y + 0) * 1
1442
1443 The first of these is somewhat arbitrary, but the choice of
1444 1 for the stride simplifies the logic for propagating casts
1445 into their uses. */
1446 c = alloc_cand_and_find_basis (CAND_ADD, gs, rhs1, double_int_zero,
1447 integer_one_node, ctype, 0);
1448 c2 = alloc_cand_and_find_basis (CAND_MULT, gs, rhs1, double_int_zero,
1449 integer_one_node, ctype, 0);
1450 c->next_interp = c2->cand_num;
1451 }
1452
1453 /* Add the first (or only) interpretation to the statement-candidate
1454 mapping. */
1455 add_cand_for_stmt (gs, c);
1456}
1457
1458/* Given GS which is a copy of a scalar integer type, make at least one
1459 appropriate entry in the candidate table.
1460
1461 This interface is included for completeness, but is unnecessary
1462 if this pass immediately follows a pass that performs copy
1463 propagation, such as DOM. */
1464
1465static void
1466slsr_process_copy (gimple gs, tree rhs1, bool speed)
1467{
1468 slsr_cand_t base_cand, c, c2;
1469 unsigned savings = 0;
1470
1471 base_cand = base_cand_from_table (rhs1);
1472
1168caca 1473 if (base_cand && base_cand->kind != CAND_PHI)
4502f5d0 1474 {
1475 while (base_cand)
1476 {
1477 /* Propagate all data from the base candidate. */
1478 if (has_single_use (rhs1))
1479 savings = (base_cand->dead_savings
1480 + stmt_cost (base_cand->cand_stmt, speed));
1481
1482 c = alloc_cand_and_find_basis (base_cand->kind, gs,
c99e471e 1483 base_cand->base_expr,
4502f5d0 1484 base_cand->index, base_cand->stride,
1485 base_cand->cand_type, savings);
1486 if (base_cand->next_interp)
1487 base_cand = lookup_cand (base_cand->next_interp);
1488 else
1489 base_cand = NULL;
1490 }
1491 }
1492 else
1493 {
1494 /* If nothing is known about the RHS, create fresh CAND_ADD and
1495 CAND_MULT interpretations:
1496
1497 X = Y + (0 * 1)
1498 X = (Y + 0) * 1
1499
1500 The first of these is somewhat arbitrary, but the choice of
1501 1 for the stride simplifies the logic for propagating casts
1502 into their uses. */
1503 c = alloc_cand_and_find_basis (CAND_ADD, gs, rhs1, double_int_zero,
1504 integer_one_node, TREE_TYPE (rhs1), 0);
1505 c2 = alloc_cand_and_find_basis (CAND_MULT, gs, rhs1, double_int_zero,
1506 integer_one_node, TREE_TYPE (rhs1), 0);
1507 c->next_interp = c2->cand_num;
1508 }
1509
1510 /* Add the first (or only) interpretation to the statement-candidate
1511 mapping. */
1512 add_cand_for_stmt (gs, c);
1513}
1514\f
1515/* Find strength-reduction candidates in block BB. */
1516
1517static void
1518find_candidates_in_block (struct dom_walk_data *walk_data ATTRIBUTE_UNUSED,
1519 basic_block bb)
1520{
1521 bool speed = optimize_bb_for_speed_p (bb);
1522 gimple_stmt_iterator gsi;
1523
1168caca 1524 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1525 slsr_process_phi (gsi_stmt (gsi), speed);
1526
4502f5d0 1527 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1528 {
1529 gimple gs = gsi_stmt (gsi);
1530
070bf980 1531 if (gimple_vuse (gs) && gimple_assign_single_p (gs))
1532 slsr_process_ref (gs);
1533
1534 else if (is_gimple_assign (gs)
1535 && SCALAR_INT_MODE_P
1536 (TYPE_MODE (TREE_TYPE (gimple_assign_lhs (gs)))))
4502f5d0 1537 {
1538 tree rhs1 = NULL_TREE, rhs2 = NULL_TREE;
1539
1540 switch (gimple_assign_rhs_code (gs))
1541 {
1542 case MULT_EXPR:
1543 case PLUS_EXPR:
1544 rhs1 = gimple_assign_rhs1 (gs);
1545 rhs2 = gimple_assign_rhs2 (gs);
1546 /* Should never happen, but currently some buggy situations
1547 in earlier phases put constants in rhs1. */
1548 if (TREE_CODE (rhs1) != SSA_NAME)
1549 continue;
1550 break;
1551
1552 /* Possible future opportunity: rhs1 of a ptr+ can be
1553 an ADDR_EXPR. */
1554 case POINTER_PLUS_EXPR:
1555 case MINUS_EXPR:
1556 rhs2 = gimple_assign_rhs2 (gs);
1557 /* Fall-through. */
1558
1559 case NOP_EXPR:
1560 case MODIFY_EXPR:
1561 case NEGATE_EXPR:
1562 rhs1 = gimple_assign_rhs1 (gs);
1563 if (TREE_CODE (rhs1) != SSA_NAME)
1564 continue;
1565 break;
1566
1567 default:
1568 ;
1569 }
1570
1571 switch (gimple_assign_rhs_code (gs))
1572 {
1573 case MULT_EXPR:
1574 slsr_process_mul (gs, rhs1, rhs2, speed);
1575 break;
1576
1577 case PLUS_EXPR:
1578 case POINTER_PLUS_EXPR:
1579 case MINUS_EXPR:
1580 slsr_process_add (gs, rhs1, rhs2, speed);
1581 break;
1582
1583 case NEGATE_EXPR:
1584 slsr_process_neg (gs, rhs1, speed);
1585 break;
1586
1587 case NOP_EXPR:
1588 slsr_process_cast (gs, rhs1, speed);
1589 break;
1590
1591 case MODIFY_EXPR:
1592 slsr_process_copy (gs, rhs1, speed);
1593 break;
1594
1595 default:
1596 ;
1597 }
1598 }
1599 }
1600}
1601\f
1602/* Dump a candidate for debug. */
1603
1604static void
1605dump_candidate (slsr_cand_t c)
1606{
1607 fprintf (dump_file, "%3d [%d] ", c->cand_num,
1608 gimple_bb (c->cand_stmt)->index);
1609 print_gimple_stmt (dump_file, c->cand_stmt, 0, 0);
1610 switch (c->kind)
1611 {
1612 case CAND_MULT:
1613 fputs (" MULT : (", dump_file);
c99e471e 1614 print_generic_expr (dump_file, c->base_expr, 0);
4502f5d0 1615 fputs (" + ", dump_file);
1616 dump_double_int (dump_file, c->index, false);
1617 fputs (") * ", dump_file);
1618 print_generic_expr (dump_file, c->stride, 0);
1619 fputs (" : ", dump_file);
1620 break;
1621 case CAND_ADD:
1622 fputs (" ADD : ", dump_file);
c99e471e 1623 print_generic_expr (dump_file, c->base_expr, 0);
4502f5d0 1624 fputs (" + (", dump_file);
1625 dump_double_int (dump_file, c->index, false);
1626 fputs (" * ", dump_file);
1627 print_generic_expr (dump_file, c->stride, 0);
1628 fputs (") : ", dump_file);
1629 break;
070bf980 1630 case CAND_REF:
1631 fputs (" REF : ", dump_file);
c99e471e 1632 print_generic_expr (dump_file, c->base_expr, 0);
070bf980 1633 fputs (" + (", dump_file);
1634 print_generic_expr (dump_file, c->stride, 0);
1635 fputs (") + ", dump_file);
1636 dump_double_int (dump_file, c->index, false);
1637 fputs (" : ", dump_file);
1638 break;
1168caca 1639 case CAND_PHI:
1640 fputs (" PHI : ", dump_file);
1641 print_generic_expr (dump_file, c->base_expr, 0);
1642 fputs (" + (unknown * ", dump_file);
1643 print_generic_expr (dump_file, c->stride, 0);
1644 fputs (") : ", dump_file);
1645 break;
4502f5d0 1646 default:
1647 gcc_unreachable ();
1648 }
1649 print_generic_expr (dump_file, c->cand_type, 0);
1650 fprintf (dump_file, "\n basis: %d dependent: %d sibling: %d\n",
1651 c->basis, c->dependent, c->sibling);
1652 fprintf (dump_file, " next-interp: %d dead-savings: %d\n",
1653 c->next_interp, c->dead_savings);
1654 if (c->def_phi)
1168caca 1655 fprintf (dump_file, " phi: %d\n", c->def_phi);
4502f5d0 1656 fputs ("\n", dump_file);
1657}
1658
1659/* Dump the candidate vector for debug. */
1660
1661static void
1662dump_cand_vec (void)
1663{
1664 unsigned i;
1665 slsr_cand_t c;
1666
1667 fprintf (dump_file, "\nStrength reduction candidate vector:\n\n");
1668
f1f41a6c 1669 FOR_EACH_VEC_ELT (cand_vec, i, c)
4502f5d0 1670 dump_candidate (c);
1671}
1672
070bf980 1673/* Callback used to dump the candidate chains hash table. */
4502f5d0 1674
d9dd21a8 1675int
1676ssa_base_cand_dump_callback (cand_chain **slot, void *ignored ATTRIBUTE_UNUSED)
4502f5d0 1677{
d9dd21a8 1678 const_cand_chain_t chain = *slot;
070bf980 1679 cand_chain_t p;
4502f5d0 1680
c99e471e 1681 print_generic_expr (dump_file, chain->base_expr, 0);
070bf980 1682 fprintf (dump_file, " -> %d", chain->cand->cand_num);
4502f5d0 1683
070bf980 1684 for (p = chain->next; p; p = p->next)
1685 fprintf (dump_file, " -> %d", p->cand->cand_num);
4502f5d0 1686
070bf980 1687 fputs ("\n", dump_file);
1688 return 1;
1689}
4502f5d0 1690
070bf980 1691/* Dump the candidate chains. */
4502f5d0 1692
070bf980 1693static void
1694dump_cand_chains (void)
1695{
1696 fprintf (dump_file, "\nStrength reduction candidate chains:\n\n");
d9dd21a8 1697 base_cand_map.traverse_noresize <void *, ssa_base_cand_dump_callback> (NULL);
4502f5d0 1698 fputs ("\n", dump_file);
1699}
9ce0359e 1700
1701/* Dump the increment vector for debug. */
1702
1703static void
1704dump_incr_vec (void)
1705{
1706 if (dump_file && (dump_flags & TDF_DETAILS))
1707 {
1708 unsigned i;
1709
1710 fprintf (dump_file, "\nIncrement vector:\n\n");
1711
1712 for (i = 0; i < incr_vec_len; i++)
1713 {
1714 fprintf (dump_file, "%3d increment: ", i);
1715 dump_double_int (dump_file, incr_vec[i].incr, false);
1716 fprintf (dump_file, "\n count: %d", incr_vec[i].count);
1717 fprintf (dump_file, "\n cost: %d", incr_vec[i].cost);
1718 fputs ("\n initializer: ", dump_file);
1719 print_generic_expr (dump_file, incr_vec[i].initializer, 0);
1720 fputs ("\n\n", dump_file);
1721 }
1722 }
1723}
4502f5d0 1724\f
070bf980 1725/* Replace *EXPR in candidate C with an equivalent strength-reduced
1726 data reference. */
1727
1728static void
1729replace_ref (tree *expr, slsr_cand_t c)
1730{
c99e471e 1731 tree add_expr = fold_build2 (POINTER_PLUS_EXPR, TREE_TYPE (c->base_expr),
1732 c->base_expr, c->stride);
070bf980 1733 tree mem_ref = fold_build2 (MEM_REF, TREE_TYPE (*expr), add_expr,
1734 double_int_to_tree (c->cand_type, c->index));
1735
1736 /* Gimplify the base addressing expression for the new MEM_REF tree. */
1737 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
1738 TREE_OPERAND (mem_ref, 0)
1739 = force_gimple_operand_gsi (&gsi, TREE_OPERAND (mem_ref, 0),
1740 /*simple_p=*/true, NULL,
1741 /*before=*/true, GSI_SAME_STMT);
1742 copy_ref_info (mem_ref, *expr);
1743 *expr = mem_ref;
1744 update_stmt (c->cand_stmt);
1745}
1746
1747/* Replace CAND_REF candidate C, each sibling of candidate C, and each
1748 dependent of candidate C with an equivalent strength-reduced data
1749 reference. */
1750
1751static void
1752replace_refs (slsr_cand_t c)
1753{
1754 if (gimple_vdef (c->cand_stmt))
1755 {
1756 tree *lhs = gimple_assign_lhs_ptr (c->cand_stmt);
1757 replace_ref (lhs, c);
1758 }
1759 else
1760 {
1761 tree *rhs = gimple_assign_rhs1_ptr (c->cand_stmt);
1762 replace_ref (rhs, c);
1763 }
1764
1765 if (c->sibling)
1766 replace_refs (lookup_cand (c->sibling));
1767
1768 if (c->dependent)
1769 replace_refs (lookup_cand (c->dependent));
1770}
1771
1168caca 1772/* Return TRUE if candidate C is dependent upon a PHI. */
1773
1774static bool
1775phi_dependent_cand_p (slsr_cand_t c)
1776{
1777 /* A candidate is not necessarily dependent upon a PHI just because
1778 it has a phi definition for its base name. It may have a basis
1779 that relies upon the same phi definition, in which case the PHI
1780 is irrelevant to this candidate. */
1781 return (c->def_phi
1782 && c->basis
1783 && lookup_cand (c->basis)->def_phi != c->def_phi);
1784}
1785
4502f5d0 1786/* Calculate the increment required for candidate C relative to
1787 its basis. */
1788
1789static double_int
1790cand_increment (slsr_cand_t c)
1791{
1792 slsr_cand_t basis;
1793
1794 /* If the candidate doesn't have a basis, just return its own
1795 index. This is useful in record_increments to help us find
1168caca 1796 an existing initializer. Also, if the candidate's basis is
1797 hidden by a phi, then its own index will be the increment
1798 from the newly introduced phi basis. */
1799 if (!c->basis || phi_dependent_cand_p (c))
4502f5d0 1800 return c->index;
1801
1802 basis = lookup_cand (c->basis);
c99e471e 1803 gcc_assert (operand_equal_p (c->base_expr, basis->base_expr, 0));
cf8f0e63 1804 return c->index - basis->index;
4502f5d0 1805}
1806
9ce0359e 1807/* Calculate the increment required for candidate C relative to
1808 its basis. If we aren't going to generate pointer arithmetic
1809 for this candidate, return the absolute value of that increment
1810 instead. */
1811
1812static inline double_int
1813cand_abs_increment (slsr_cand_t c)
1814{
1815 double_int increment = cand_increment (c);
1816
cf8f0e63 1817 if (!address_arithmetic_p && increment.is_negative ())
1818 increment = -increment;
9ce0359e 1819
1820 return increment;
1821}
1822
4502f5d0 1823/* Return TRUE iff candidate C has already been replaced under
1824 another interpretation. */
1825
1826static inline bool
1827cand_already_replaced (slsr_cand_t c)
1828{
1829 return (gimple_bb (c->cand_stmt) == 0);
1830}
1831
1168caca 1832/* Common logic used by replace_unconditional_candidate and
1833 replace_conditional_candidate. */
4502f5d0 1834
1835static void
d54ab372 1836replace_mult_candidate (slsr_cand_t c, tree basis_name, double_int bump)
4502f5d0 1837{
1168caca 1838 tree target_type = TREE_TYPE (gimple_assign_lhs (c->cand_stmt));
1839 enum tree_code cand_code = gimple_assign_rhs_code (c->cand_stmt);
1840
4502f5d0 1841 /* It is highly unlikely, but possible, that the resulting
1842 bump doesn't fit in a HWI. Abandon the replacement
1168caca 1843 in this case. This does not affect siblings or dependents
1844 of C. Restriction to signed HWI is conservative for unsigned
1845 types but allows for safe negation without twisted logic. */
1846 if (bump.fits_shwi ()
1847 && bump.to_shwi () != HOST_WIDE_INT_MIN
1848 /* It is not useful to replace casts, copies, or adds of
1849 an SSA name and a constant. */
1850 && cand_code != MODIFY_EXPR
1851 && cand_code != NOP_EXPR
1852 && cand_code != PLUS_EXPR
1853 && cand_code != POINTER_PLUS_EXPR
1854 && cand_code != MINUS_EXPR)
1855 {
1856 enum tree_code code = PLUS_EXPR;
1857 tree bump_tree;
1858 gimple stmt_to_print = NULL;
1859
1860 /* If the basis name and the candidate's LHS have incompatible
1861 types, introduce a cast. */
1862 if (!useless_type_conversion_p (target_type, TREE_TYPE (basis_name)))
d54ab372 1863 basis_name = introduce_cast_before_cand (c, target_type, basis_name);
1168caca 1864 if (bump.is_negative ())
1865 {
1866 code = MINUS_EXPR;
1867 bump = -bump;
1868 }
1869
1870 bump_tree = double_int_to_tree (target_type, bump);
1871
1872 if (dump_file && (dump_flags & TDF_DETAILS))
1873 {
1874 fputs ("Replacing: ", dump_file);
1875 print_gimple_stmt (dump_file, c->cand_stmt, 0, 0);
1876 }
1877
1878 if (bump.is_zero ())
1879 {
1880 tree lhs = gimple_assign_lhs (c->cand_stmt);
1881 gimple copy_stmt = gimple_build_assign (lhs, basis_name);
1882 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
1883 gimple_set_location (copy_stmt, gimple_location (c->cand_stmt));
1884 gsi_replace (&gsi, copy_stmt, false);
8f0676e4 1885 c->cand_stmt = copy_stmt;
1168caca 1886 if (dump_file && (dump_flags & TDF_DETAILS))
1887 stmt_to_print = copy_stmt;
1888 }
1889 else
1890 {
1891 tree rhs1, rhs2;
1892 if (cand_code != NEGATE_EXPR) {
1893 rhs1 = gimple_assign_rhs1 (c->cand_stmt);
1894 rhs2 = gimple_assign_rhs2 (c->cand_stmt);
1895 }
1896 if (cand_code != NEGATE_EXPR
1897 && ((operand_equal_p (rhs1, basis_name, 0)
1898 && operand_equal_p (rhs2, bump_tree, 0))
1899 || (operand_equal_p (rhs1, bump_tree, 0)
1900 && operand_equal_p (rhs2, basis_name, 0))))
1901 {
1902 if (dump_file && (dump_flags & TDF_DETAILS))
1903 {
1904 fputs ("(duplicate, not actually replacing)", dump_file);
1905 stmt_to_print = c->cand_stmt;
1906 }
1907 }
1908 else
1909 {
1910 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
1911 gimple_assign_set_rhs_with_ops (&gsi, code,
1912 basis_name, bump_tree);
1913 update_stmt (gsi_stmt (gsi));
dc77dea1 1914 c->cand_stmt = gsi_stmt (gsi);
1168caca 1915 if (dump_file && (dump_flags & TDF_DETAILS))
1916 stmt_to_print = gsi_stmt (gsi);
1917 }
1918 }
1919
1920 if (dump_file && (dump_flags & TDF_DETAILS))
1921 {
1922 fputs ("With: ", dump_file);
1923 print_gimple_stmt (dump_file, stmt_to_print, 0, 0);
1924 fputs ("\n", dump_file);
1925 }
1926 }
1927}
1928
1929/* Replace candidate C with an add or subtract. Note that we only
1930 operate on CAND_MULTs with known strides, so we will never generate
1931 a POINTER_PLUS_EXPR. Each candidate X = (B + i) * S is replaced by
1932 X = Y + ((i - i') * S), as described in the module commentary. The
1933 folded value ((i - i') * S) is referred to here as the "bump." */
1934
1935static void
1936replace_unconditional_candidate (slsr_cand_t c)
1937{
1938 slsr_cand_t basis;
1939 double_int stride, bump;
1168caca 1940
1941 if (cand_already_replaced (c))
4502f5d0 1942 return;
1943
1944 basis = lookup_cand (c->basis);
1168caca 1945 stride = tree_to_double_int (c->stride);
1946 bump = cand_increment (c) * stride;
1947
d54ab372 1948 replace_mult_candidate (c, gimple_assign_lhs (basis->cand_stmt), bump);
1168caca 1949}
1950\f
d62a8480 1951/* Return the index in the increment vector of the given INCREMENT,
1952 or -1 if not found. The latter can occur if more than
1953 MAX_INCR_VEC_LEN increments have been found. */
1168caca 1954
d62a8480 1955static inline int
1168caca 1956incr_vec_index (double_int increment)
1957{
1958 unsigned i;
1959
1960 for (i = 0; i < incr_vec_len && increment != incr_vec[i].incr; i++)
1961 ;
1962
d62a8480 1963 if (i < incr_vec_len)
1964 return i;
1965 else
1966 return -1;
1168caca 1967}
1968
1969/* Create a new statement along edge E to add BASIS_NAME to the product
1970 of INCREMENT and the stride of candidate C. Create and return a new
1971 SSA name from *VAR to be used as the LHS of the new statement.
1972 KNOWN_STRIDE is true iff C's stride is a constant. */
1973
1974static tree
1975create_add_on_incoming_edge (slsr_cand_t c, tree basis_name,
1976 double_int increment, edge e, location_t loc,
1977 bool known_stride)
1978{
1979 basic_block insert_bb;
1980 gimple_stmt_iterator gsi;
1981 tree lhs, basis_type;
1982 gimple new_stmt;
1983
1984 /* If the add candidate along this incoming edge has the same
1985 index as C's hidden basis, the hidden basis represents this
1986 edge correctly. */
1987 if (increment.is_zero ())
1988 return basis_name;
1989
1990 basis_type = TREE_TYPE (basis_name);
1991 lhs = make_temp_ssa_name (basis_type, NULL, "slsr");
1992
1993 if (known_stride)
8e6331c6 1994 {
1168caca 1995 tree bump_tree;
1996 enum tree_code code = PLUS_EXPR;
1997 double_int bump = increment * tree_to_double_int (c->stride);
1998 if (bump.is_negative ())
1999 {
2000 code = MINUS_EXPR;
2001 bump = -bump;
2002 }
2003
2004 bump_tree = double_int_to_tree (basis_type, bump);
2005 new_stmt = gimple_build_assign_with_ops (code, lhs, basis_name,
2006 bump_tree);
8e6331c6 2007 }
2008 else
2009 {
d62a8480 2010 int i;
1168caca 2011 bool negate_incr = (!address_arithmetic_p && increment.is_negative ());
2012 i = incr_vec_index (negate_incr ? -increment : increment);
d62a8480 2013 gcc_assert (i >= 0);
4502f5d0 2014
1168caca 2015 if (incr_vec[i].initializer)
2016 {
2017 enum tree_code code = negate_incr ? MINUS_EXPR : PLUS_EXPR;
2018 new_stmt = gimple_build_assign_with_ops (code, lhs, basis_name,
2019 incr_vec[i].initializer);
2020 }
2021 else if (increment.is_one ())
2022 new_stmt = gimple_build_assign_with_ops (PLUS_EXPR, lhs, basis_name,
2023 c->stride);
2024 else if (increment.is_minus_one ())
2025 new_stmt = gimple_build_assign_with_ops (MINUS_EXPR, lhs, basis_name,
2026 c->stride);
2027 else
2028 gcc_unreachable ();
4502f5d0 2029 }
2030
1168caca 2031 insert_bb = single_succ_p (e->src) ? e->src : split_edge (e);
2032 gsi = gsi_last_bb (insert_bb);
2033
2034 if (!gsi_end_p (gsi) && is_ctrl_stmt (gsi_stmt (gsi)))
2035 gsi_insert_before (&gsi, new_stmt, GSI_NEW_STMT);
2036 else
2037 gsi_insert_after (&gsi, new_stmt, GSI_NEW_STMT);
2038
2039 gimple_set_location (new_stmt, loc);
4502f5d0 2040
2041 if (dump_file && (dump_flags & TDF_DETAILS))
2042 {
1168caca 2043 fprintf (dump_file, "Inserting in block %d: ", insert_bb->index);
2044 print_gimple_stmt (dump_file, new_stmt, 0, 0);
4502f5d0 2045 }
2046
1168caca 2047 return lhs;
2048}
2049
2050/* Given a candidate C with BASIS_NAME being the LHS of C's basis which
2051 is hidden by the phi node FROM_PHI, create a new phi node in the same
2052 block as FROM_PHI. The new phi is suitable for use as a basis by C,
2053 with its phi arguments representing conditional adjustments to the
2054 hidden basis along conditional incoming paths. Those adjustments are
2055 made by creating add statements (and sometimes recursively creating
2056 phis) along those incoming paths. LOC is the location to attach to
2057 the introduced statements. KNOWN_STRIDE is true iff C's stride is a
2058 constant. */
2059
2060static tree
2061create_phi_basis (slsr_cand_t c, gimple from_phi, tree basis_name,
2062 location_t loc, bool known_stride)
2063{
2064 int i;
2065 tree name, phi_arg;
2066 gimple phi;
2067 vec<tree> phi_args;
2068 slsr_cand_t basis = lookup_cand (c->basis);
2069 int nargs = gimple_phi_num_args (from_phi);
2070 basic_block phi_bb = gimple_bb (from_phi);
2071 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (from_phi));
2072 phi_args.create (nargs);
2073
2074 /* Process each argument of the existing phi that represents
2075 conditionally-executed add candidates. */
2076 for (i = 0; i < nargs; i++)
4502f5d0 2077 {
1168caca 2078 edge e = (*phi_bb->preds)[i];
2079 tree arg = gimple_phi_arg_def (from_phi, i);
2080 tree feeding_def;
2081
2082 /* If the phi argument is the base name of the CAND_PHI, then
2083 this incoming arc should use the hidden basis. */
2084 if (operand_equal_p (arg, phi_cand->base_expr, 0))
2085 if (basis->index.is_zero ())
2086 feeding_def = gimple_assign_lhs (basis->cand_stmt);
2087 else
2088 {
7090b697 2089 double_int incr = -basis->index;
1168caca 2090 feeding_def = create_add_on_incoming_edge (c, basis_name, incr,
2091 e, loc, known_stride);
2092 }
2093 else
4502f5d0 2094 {
1168caca 2095 gimple arg_def = SSA_NAME_DEF_STMT (arg);
2096
2097 /* If there is another phi along this incoming edge, we must
2098 process it in the same fashion to ensure that all basis
2099 adjustments are made along its incoming edges. */
2100 if (gimple_code (arg_def) == GIMPLE_PHI)
2101 feeding_def = create_phi_basis (c, arg_def, basis_name,
2102 loc, known_stride);
2103 else
4502f5d0 2104 {
1168caca 2105 slsr_cand_t arg_cand = base_cand_from_table (arg);
2106 double_int diff = arg_cand->index - basis->index;
2107 feeding_def = create_add_on_incoming_edge (c, basis_name, diff,
2108 e, loc, known_stride);
4502f5d0 2109 }
2110 }
1168caca 2111
2112 /* Because of recursion, we need to save the arguments in a vector
2113 so we can create the PHI statement all at once. Otherwise the
2114 storage for the half-created PHI can be reclaimed. */
2115 phi_args.safe_push (feeding_def);
4502f5d0 2116 }
1168caca 2117
2118 /* Create the new phi basis. */
2119 name = make_temp_ssa_name (TREE_TYPE (basis_name), NULL, "slsr");
2120 phi = create_phi_node (name, phi_bb);
2121 SSA_NAME_DEF_STMT (name) = phi;
2122
2123 FOR_EACH_VEC_ELT (phi_args, i, phi_arg)
2124 {
2125 edge e = (*phi_bb->preds)[i];
2126 add_phi_arg (phi, phi_arg, e, loc);
2127 }
2128
2129 update_stmt (phi);
2130
4502f5d0 2131 if (dump_file && (dump_flags & TDF_DETAILS))
2132 {
1168caca 2133 fputs ("Introducing new phi basis: ", dump_file);
2134 print_gimple_stmt (dump_file, phi, 0, 0);
4502f5d0 2135 }
1168caca 2136
2137 return name;
4502f5d0 2138}
2139
1168caca 2140/* Given a candidate C whose basis is hidden by at least one intervening
2141 phi, introduce a matching number of new phis to represent its basis
2142 adjusted by conditional increments along possible incoming paths. Then
2143 replace C as though it were an unconditional candidate, using the new
2144 basis. */
4502f5d0 2145
2146static void
1168caca 2147replace_conditional_candidate (slsr_cand_t c)
4502f5d0 2148{
d54ab372 2149 tree basis_name, name;
1168caca 2150 slsr_cand_t basis;
2151 location_t loc;
2152 double_int stride, bump;
4502f5d0 2153
1168caca 2154 /* Look up the LHS SSA name from C's basis. This will be the
2155 RHS1 of the adds we will introduce to create new phi arguments. */
2156 basis = lookup_cand (c->basis);
2157 basis_name = gimple_assign_lhs (basis->cand_stmt);
4502f5d0 2158
1168caca 2159 /* Create a new phi statement which will represent C's true basis
2160 after the transformation is complete. */
2161 loc = gimple_location (c->cand_stmt);
2162 name = create_phi_basis (c, lookup_cand (c->def_phi)->cand_stmt,
2163 basis_name, loc, KNOWN_STRIDE);
2164 /* Replace C with an add of the new basis phi and a constant. */
2165 stride = tree_to_double_int (c->stride);
2166 bump = c->index * stride;
4502f5d0 2167
d54ab372 2168 replace_mult_candidate (c, name, bump);
4502f5d0 2169}
9ce0359e 2170
1168caca 2171/* Compute the expected costs of inserting basis adjustments for
2172 candidate C with phi-definition PHI. The cost of inserting
2173 one adjustment is given by ONE_ADD_COST. If PHI has arguments
2174 which are themselves phi results, recursively calculate costs
2175 for those phis as well. */
2176
2177static int
2178phi_add_costs (gimple phi, slsr_cand_t c, int one_add_cost)
9ce0359e 2179{
2180 unsigned i;
1168caca 2181 int cost = 0;
2182 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (phi));
9ce0359e 2183
8f0676e4 2184 /* If we work our way back to a phi that isn't dominated by the hidden
2185 basis, this isn't a candidate for replacement. Indicate this by
2186 returning an unreasonably high cost. It's not easy to detect
2187 these situations when determining the basis, so we defer the
2188 decision until now. */
2189 basic_block phi_bb = gimple_bb (phi);
2190 slsr_cand_t basis = lookup_cand (c->basis);
2191 basic_block basis_bb = gimple_bb (basis->cand_stmt);
2192
2193 if (phi_bb == basis_bb || !dominated_by_p (CDI_DOMINATORS, phi_bb, basis_bb))
2194 return COST_INFINITE;
2195
1168caca 2196 for (i = 0; i < gimple_phi_num_args (phi); i++)
2197 {
2198 tree arg = gimple_phi_arg_def (phi, i);
2199
2200 if (arg != phi_cand->base_expr)
2201 {
2202 gimple arg_def = SSA_NAME_DEF_STMT (arg);
2203
2204 if (gimple_code (arg_def) == GIMPLE_PHI)
2205 cost += phi_add_costs (arg_def, c, one_add_cost);
2206 else
2207 {
2208 slsr_cand_t arg_cand = base_cand_from_table (arg);
2209
2210 if (arg_cand->index != c->index)
2211 cost += one_add_cost;
2212 }
2213 }
2214 }
2215
2216 return cost;
9ce0359e 2217}
2218
1168caca 2219/* For candidate C, each sibling of candidate C, and each dependent of
2220 candidate C, determine whether the candidate is dependent upon a
2221 phi that hides its basis. If not, replace the candidate unconditionally.
2222 Otherwise, determine whether the cost of introducing compensation code
2223 for the candidate is offset by the gains from strength reduction. If
2224 so, replace the candidate and introduce the compensation code. */
2225
2226static void
2227replace_uncond_cands_and_profitable_phis (slsr_cand_t c)
2228{
2229 if (phi_dependent_cand_p (c))
2230 {
2231 if (c->kind == CAND_MULT)
2232 {
2233 /* A candidate dependent upon a phi will replace a multiply by
2234 a constant with an add, and will insert at most one add for
2235 each phi argument. Add these costs with the potential dead-code
2236 savings to determine profitability. */
2237 bool speed = optimize_bb_for_speed_p (gimple_bb (c->cand_stmt));
2238 int mult_savings = stmt_cost (c->cand_stmt, speed);
2239 gimple phi = lookup_cand (c->def_phi)->cand_stmt;
2240 tree phi_result = gimple_phi_result (phi);
2241 int one_add_cost = add_cost (speed,
2242 TYPE_MODE (TREE_TYPE (phi_result)));
2243 int add_costs = one_add_cost + phi_add_costs (phi, c, one_add_cost);
2244 int cost = add_costs - mult_savings - c->dead_savings;
2245
2246 if (dump_file && (dump_flags & TDF_DETAILS))
2247 {
2248 fprintf (dump_file, " Conditional candidate %d:\n", c->cand_num);
2249 fprintf (dump_file, " add_costs = %d\n", add_costs);
2250 fprintf (dump_file, " mult_savings = %d\n", mult_savings);
2251 fprintf (dump_file, " dead_savings = %d\n", c->dead_savings);
2252 fprintf (dump_file, " cost = %d\n", cost);
2253 if (cost <= COST_NEUTRAL)
2254 fputs (" Replacing...\n", dump_file);
2255 else
2256 fputs (" Not replaced.\n", dump_file);
2257 }
2258
2259 if (cost <= COST_NEUTRAL)
2260 replace_conditional_candidate (c);
2261 }
2262 }
2263 else
2264 replace_unconditional_candidate (c);
2265
2266 if (c->sibling)
2267 replace_uncond_cands_and_profitable_phis (lookup_cand (c->sibling));
2268
2269 if (c->dependent)
2270 replace_uncond_cands_and_profitable_phis (lookup_cand (c->dependent));
2271}
2272\f
9ce0359e 2273/* Count the number of candidates in the tree rooted at C that have
2274 not already been replaced under other interpretations. */
2275
d873e825 2276static int
9ce0359e 2277count_candidates (slsr_cand_t c)
2278{
2279 unsigned count = cand_already_replaced (c) ? 0 : 1;
2280
2281 if (c->sibling)
2282 count += count_candidates (lookup_cand (c->sibling));
2283
2284 if (c->dependent)
2285 count += count_candidates (lookup_cand (c->dependent));
2286
2287 return count;
2288}
2289
2290/* Increase the count of INCREMENT by one in the increment vector.
1168caca 2291 INCREMENT is associated with candidate C. If INCREMENT is to be
2292 conditionally executed as part of a conditional candidate replacement,
2293 IS_PHI_ADJUST is true, otherwise false. If an initializer
9ce0359e 2294 T_0 = stride * I is provided by a candidate that dominates all
2295 candidates with the same increment, also record T_0 for subsequent use. */
2296
2297static void
1168caca 2298record_increment (slsr_cand_t c, double_int increment, bool is_phi_adjust)
9ce0359e 2299{
2300 bool found = false;
2301 unsigned i;
2302
2303 /* Treat increments that differ only in sign as identical so as to
2304 share initializers, unless we are generating pointer arithmetic. */
cf8f0e63 2305 if (!address_arithmetic_p && increment.is_negative ())
2306 increment = -increment;
9ce0359e 2307
2308 for (i = 0; i < incr_vec_len; i++)
2309 {
cf8f0e63 2310 if (incr_vec[i].incr == increment)
9ce0359e 2311 {
2312 incr_vec[i].count++;
2313 found = true;
2314
2315 /* If we previously recorded an initializer that doesn't
2316 dominate this candidate, it's not going to be useful to
2317 us after all. */
2318 if (incr_vec[i].initializer
2319 && !dominated_by_p (CDI_DOMINATORS,
2320 gimple_bb (c->cand_stmt),
2321 incr_vec[i].init_bb))
2322 {
2323 incr_vec[i].initializer = NULL_TREE;
2324 incr_vec[i].init_bb = NULL;
2325 }
2326
2327 break;
2328 }
2329 }
2330
d62a8480 2331 if (!found && incr_vec_len < MAX_INCR_VEC_LEN - 1)
9ce0359e 2332 {
2333 /* The first time we see an increment, create the entry for it.
2334 If this is the root candidate which doesn't have a basis, set
2335 the count to zero. We're only processing it so it can possibly
2336 provide an initializer for other candidates. */
2337 incr_vec[incr_vec_len].incr = increment;
1168caca 2338 incr_vec[incr_vec_len].count = c->basis || is_phi_adjust ? 1 : 0;
9ce0359e 2339 incr_vec[incr_vec_len].cost = COST_INFINITE;
2340
2341 /* Optimistically record the first occurrence of this increment
2342 as providing an initializer (if it does); we will revise this
2343 opinion later if it doesn't dominate all other occurrences.
1168caca 2344 Exception: increments of -1, 0, 1 never need initializers;
2345 and phi adjustments don't ever provide initializers. */
9ce0359e 2346 if (c->kind == CAND_ADD
1168caca 2347 && !is_phi_adjust
cf8f0e63 2348 && c->index == increment
2349 && (increment.sgt (double_int_one)
9de38bc3 2350 || increment.slt (double_int_minus_one))
2351 && (gimple_assign_rhs_code (c->cand_stmt) == PLUS_EXPR
2352 || gimple_assign_rhs_code (c->cand_stmt) == POINTER_PLUS_EXPR))
9ce0359e 2353 {
9de38bc3 2354 tree t0 = NULL_TREE;
9ce0359e 2355 tree rhs1 = gimple_assign_rhs1 (c->cand_stmt);
2356 tree rhs2 = gimple_assign_rhs2 (c->cand_stmt);
2357 if (operand_equal_p (rhs1, c->base_expr, 0))
2358 t0 = rhs2;
9de38bc3 2359 else if (operand_equal_p (rhs2, c->base_expr, 0))
9ce0359e 2360 t0 = rhs1;
9de38bc3 2361 if (t0
2362 && SSA_NAME_DEF_STMT (t0)
2363 && gimple_bb (SSA_NAME_DEF_STMT (t0)))
9ce0359e 2364 {
2365 incr_vec[incr_vec_len].initializer = t0;
2366 incr_vec[incr_vec_len++].init_bb
2367 = gimple_bb (SSA_NAME_DEF_STMT (t0));
2368 }
2369 else
2370 {
2371 incr_vec[incr_vec_len].initializer = NULL_TREE;
2372 incr_vec[incr_vec_len++].init_bb = NULL;
2373 }
2374 }
2375 else
2376 {
2377 incr_vec[incr_vec_len].initializer = NULL_TREE;
2378 incr_vec[incr_vec_len++].init_bb = NULL;
2379 }
2380 }
2381}
2382
1168caca 2383/* Given phi statement PHI that hides a candidate from its BASIS, find
2384 the increments along each incoming arc (recursively handling additional
2385 phis that may be present) and record them. These increments are the
2386 difference in index between the index-adjusting statements and the
2387 index of the basis. */
2388
2389static void
2390record_phi_increments (slsr_cand_t basis, gimple phi)
2391{
2392 unsigned i;
2393 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (phi));
2394
2395 for (i = 0; i < gimple_phi_num_args (phi); i++)
2396 {
2397 tree arg = gimple_phi_arg_def (phi, i);
2398
2399 if (!operand_equal_p (arg, phi_cand->base_expr, 0))
2400 {
2401 gimple arg_def = SSA_NAME_DEF_STMT (arg);
2402
2403 if (gimple_code (arg_def) == GIMPLE_PHI)
2404 record_phi_increments (basis, arg_def);
2405 else
2406 {
2407 slsr_cand_t arg_cand = base_cand_from_table (arg);
2408 double_int diff = arg_cand->index - basis->index;
2409 record_increment (arg_cand, diff, PHI_ADJUST);
2410 }
2411 }
2412 }
2413}
2414
9ce0359e 2415/* Determine how many times each unique increment occurs in the set
2416 of candidates rooted at C's parent, recording the data in the
2417 increment vector. For each unique increment I, if an initializer
2418 T_0 = stride * I is provided by a candidate that dominates all
2419 candidates with the same increment, also record T_0 for subsequent
2420 use. */
2421
2422static void
2423record_increments (slsr_cand_t c)
2424{
2425 if (!cand_already_replaced (c))
1168caca 2426 {
2427 if (!phi_dependent_cand_p (c))
2428 record_increment (c, cand_increment (c), NOT_PHI_ADJUST);
2429 else
2430 {
2431 /* A candidate with a basis hidden by a phi will have one
2432 increment for its relationship to the index represented by
2433 the phi, and potentially additional increments along each
2434 incoming edge. For the root of the dependency tree (which
2435 has no basis), process just the initial index in case it has
2436 an initializer that can be used by subsequent candidates. */
2437 record_increment (c, c->index, NOT_PHI_ADJUST);
2438
2439 if (c->basis)
2440 record_phi_increments (lookup_cand (c->basis),
2441 lookup_cand (c->def_phi)->cand_stmt);
2442 }
2443 }
9ce0359e 2444
2445 if (c->sibling)
2446 record_increments (lookup_cand (c->sibling));
2447
2448 if (c->dependent)
2449 record_increments (lookup_cand (c->dependent));
2450}
2451
1168caca 2452/* Add up and return the costs of introducing add statements that
2453 require the increment INCR on behalf of candidate C and phi
2454 statement PHI. Accumulate into *SAVINGS the potential savings
2455 from removing existing statements that feed PHI and have no other
2456 uses. */
2457
2458static int
2459phi_incr_cost (slsr_cand_t c, double_int incr, gimple phi, int *savings)
2460{
2461 unsigned i;
2462 int cost = 0;
2463 slsr_cand_t basis = lookup_cand (c->basis);
2464 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (phi));
2465
2466 for (i = 0; i < gimple_phi_num_args (phi); i++)
2467 {
2468 tree arg = gimple_phi_arg_def (phi, i);
2469
2470 if (!operand_equal_p (arg, phi_cand->base_expr, 0))
2471 {
2472 gimple arg_def = SSA_NAME_DEF_STMT (arg);
2473
2474 if (gimple_code (arg_def) == GIMPLE_PHI)
2475 {
2476 int feeding_savings = 0;
2477 cost += phi_incr_cost (c, incr, arg_def, &feeding_savings);
2478 if (has_single_use (gimple_phi_result (arg_def)))
2479 *savings += feeding_savings;
2480 }
2481 else
2482 {
2483 slsr_cand_t arg_cand = base_cand_from_table (arg);
2484 double_int diff = arg_cand->index - basis->index;
2485
2486 if (incr == diff)
2487 {
2488 tree basis_lhs = gimple_assign_lhs (basis->cand_stmt);
2489 tree lhs = gimple_assign_lhs (arg_cand->cand_stmt);
2490 cost += add_cost (true, TYPE_MODE (TREE_TYPE (basis_lhs)));
2491 if (has_single_use (lhs))
2492 *savings += stmt_cost (arg_cand->cand_stmt, true);
2493 }
2494 }
2495 }
2496 }
2497
2498 return cost;
2499}
2500
9ce0359e 2501/* Return the first candidate in the tree rooted at C that has not
2502 already been replaced, favoring siblings over dependents. */
2503
2504static slsr_cand_t
2505unreplaced_cand_in_tree (slsr_cand_t c)
2506{
2507 if (!cand_already_replaced (c))
2508 return c;
2509
2510 if (c->sibling)
2511 {
2512 slsr_cand_t sib = unreplaced_cand_in_tree (lookup_cand (c->sibling));
2513 if (sib)
2514 return sib;
2515 }
2516
2517 if (c->dependent)
2518 {
2519 slsr_cand_t dep = unreplaced_cand_in_tree (lookup_cand (c->dependent));
2520 if (dep)
2521 return dep;
2522 }
2523
2524 return NULL;
2525}
2526
2527/* Return TRUE if the candidates in the tree rooted at C should be
2528 optimized for speed, else FALSE. We estimate this based on the block
2529 containing the most dominant candidate in the tree that has not yet
2530 been replaced. */
2531
2532static bool
2533optimize_cands_for_speed_p (slsr_cand_t c)
2534{
2535 slsr_cand_t c2 = unreplaced_cand_in_tree (c);
2536 gcc_assert (c2);
2537 return optimize_bb_for_speed_p (gimple_bb (c2->cand_stmt));
2538}
2539
2540/* Add COST_IN to the lowest cost of any dependent path starting at
2541 candidate C or any of its siblings, counting only candidates along
2542 such paths with increment INCR. Assume that replacing a candidate
2543 reduces cost by REPL_SAVINGS. Also account for savings from any
1168caca 2544 statements that would go dead. If COUNT_PHIS is true, include
2545 costs of introducing feeding statements for conditional candidates. */
9ce0359e 2546
2547static int
1168caca 2548lowest_cost_path (int cost_in, int repl_savings, slsr_cand_t c,
2549 double_int incr, bool count_phis)
9ce0359e 2550{
1168caca 2551 int local_cost, sib_cost, savings = 0;
9ce0359e 2552 double_int cand_incr = cand_abs_increment (c);
2553
2554 if (cand_already_replaced (c))
2555 local_cost = cost_in;
cf8f0e63 2556 else if (incr == cand_incr)
9ce0359e 2557 local_cost = cost_in - repl_savings - c->dead_savings;
2558 else
2559 local_cost = cost_in - c->dead_savings;
2560
1168caca 2561 if (count_phis
2562 && phi_dependent_cand_p (c)
2563 && !cand_already_replaced (c))
2564 {
2565 gimple phi = lookup_cand (c->def_phi)->cand_stmt;
2566 local_cost += phi_incr_cost (c, incr, phi, &savings);
2567
2568 if (has_single_use (gimple_phi_result (phi)))
2569 local_cost -= savings;
2570 }
2571
9ce0359e 2572 if (c->dependent)
2573 local_cost = lowest_cost_path (local_cost, repl_savings,
1168caca 2574 lookup_cand (c->dependent), incr,
2575 count_phis);
9ce0359e 2576
2577 if (c->sibling)
2578 {
2579 sib_cost = lowest_cost_path (cost_in, repl_savings,
1168caca 2580 lookup_cand (c->sibling), incr,
2581 count_phis);
9ce0359e 2582 local_cost = MIN (local_cost, sib_cost);
2583 }
2584
2585 return local_cost;
2586}
2587
2588/* Compute the total savings that would accrue from all replacements
2589 in the candidate tree rooted at C, counting only candidates with
2590 increment INCR. Assume that replacing a candidate reduces cost
2591 by REPL_SAVINGS. Also account for savings from statements that
2592 would go dead. */
2593
2594static int
1168caca 2595total_savings (int repl_savings, slsr_cand_t c, double_int incr,
2596 bool count_phis)
9ce0359e 2597{
2598 int savings = 0;
2599 double_int cand_incr = cand_abs_increment (c);
2600
cf8f0e63 2601 if (incr == cand_incr && !cand_already_replaced (c))
9ce0359e 2602 savings += repl_savings + c->dead_savings;
2603
1168caca 2604 if (count_phis
2605 && phi_dependent_cand_p (c)
2606 && !cand_already_replaced (c))
2607 {
2608 int phi_savings = 0;
2609 gimple phi = lookup_cand (c->def_phi)->cand_stmt;
2610 savings -= phi_incr_cost (c, incr, phi, &phi_savings);
2611
2612 if (has_single_use (gimple_phi_result (phi)))
2613 savings += phi_savings;
2614 }
2615
9ce0359e 2616 if (c->dependent)
1168caca 2617 savings += total_savings (repl_savings, lookup_cand (c->dependent), incr,
2618 count_phis);
9ce0359e 2619
2620 if (c->sibling)
1168caca 2621 savings += total_savings (repl_savings, lookup_cand (c->sibling), incr,
2622 count_phis);
9ce0359e 2623
2624 return savings;
2625}
2626
2627/* Use target-specific costs to determine and record which increments
2628 in the current candidate tree are profitable to replace, assuming
2629 MODE and SPEED. FIRST_DEP is the first dependent of the root of
2630 the candidate tree.
2631
2632 One slight limitation here is that we don't account for the possible
2633 introduction of casts in some cases. See replace_one_candidate for
2634 the cases where these are introduced. This should probably be cleaned
2635 up sometime. */
2636
2637static void
2638analyze_increments (slsr_cand_t first_dep, enum machine_mode mode, bool speed)
2639{
2640 unsigned i;
2641
2642 for (i = 0; i < incr_vec_len; i++)
2643 {
cf8f0e63 2644 HOST_WIDE_INT incr = incr_vec[i].incr.to_shwi ();
9ce0359e 2645
2646 /* If somehow this increment is bigger than a HWI, we won't
2647 be optimizing candidates that use it. And if the increment
2648 has a count of zero, nothing will be done with it. */
cf8f0e63 2649 if (!incr_vec[i].incr.fits_shwi () || !incr_vec[i].count)
9ce0359e 2650 incr_vec[i].cost = COST_INFINITE;
2651
2652 /* Increments of 0, 1, and -1 are always profitable to replace,
2653 because they always replace a multiply or add with an add or
2654 copy, and may cause one or more existing instructions to go
2655 dead. Exception: -1 can't be assumed to be profitable for
2656 pointer addition. */
2657 else if (incr == 0
2658 || incr == 1
2659 || (incr == -1
2660 && (gimple_assign_rhs_code (first_dep->cand_stmt)
2661 != POINTER_PLUS_EXPR)))
2662 incr_vec[i].cost = COST_NEUTRAL;
2663
38304570 2664 /* FORNOW: If we need to add an initializer, give up if a cast from
2665 the candidate's type to its stride's type can lose precision.
2666 This could eventually be handled better by expressly retaining the
2667 result of a cast to a wider type in the stride. Example:
2668
2669 short int _1;
2670 _2 = (int) _1;
2671 _3 = _2 * 10;
2672 _4 = x + _3; ADD: x + (10 * _1) : int
2673 _5 = _2 * 15;
2674 _6 = x + _3; ADD: x + (15 * _1) : int
2675
2676 Right now replacing _6 would cause insertion of an initializer
2677 of the form "short int T = _1 * 5;" followed by a cast to
2678 int, which could overflow incorrectly. Had we recorded _2 or
2679 (int)_1 as the stride, this wouldn't happen. However, doing
2680 this breaks other opportunities, so this will require some
2681 care. */
2682 else if (!incr_vec[i].initializer
2683 && TREE_CODE (first_dep->stride) != INTEGER_CST
2684 && !legal_cast_p_1 (first_dep->stride,
2685 gimple_assign_lhs (first_dep->cand_stmt)))
2686
2687 incr_vec[i].cost = COST_INFINITE;
2688
781e2ff3 2689 /* If we need to add an initializer, make sure we don't introduce
2690 a multiply by a pointer type, which can happen in certain cast
2691 scenarios. FIXME: When cleaning up these cast issues, we can
2692 afford to introduce the multiply provided we cast out to an
2693 unsigned int of appropriate size. */
2694 else if (!incr_vec[i].initializer
2695 && TREE_CODE (first_dep->stride) != INTEGER_CST
2696 && POINTER_TYPE_P (TREE_TYPE (first_dep->stride)))
2697
2698 incr_vec[i].cost = COST_INFINITE;
2699
9ce0359e 2700 /* For any other increment, if this is a multiply candidate, we
2701 must introduce a temporary T and initialize it with
2702 T_0 = stride * increment. When optimizing for speed, walk the
2703 candidate tree to calculate the best cost reduction along any
2704 path; if it offsets the fixed cost of inserting the initializer,
2705 replacing the increment is profitable. When optimizing for
2706 size, instead calculate the total cost reduction from replacing
2707 all candidates with this increment. */
2708 else if (first_dep->kind == CAND_MULT)
2709 {
2710 int cost = mult_by_coeff_cost (incr, mode, speed);
2711 int repl_savings = mul_cost (speed, mode) - add_cost (speed, mode);
2712 if (speed)
2713 cost = lowest_cost_path (cost, repl_savings, first_dep,
1168caca 2714 incr_vec[i].incr, COUNT_PHIS);
9ce0359e 2715 else
1168caca 2716 cost -= total_savings (repl_savings, first_dep, incr_vec[i].incr,
2717 COUNT_PHIS);
9ce0359e 2718
2719 incr_vec[i].cost = cost;
2720 }
2721
2722 /* If this is an add candidate, the initializer may already
2723 exist, so only calculate the cost of the initializer if it
2724 doesn't. We are replacing one add with another here, so the
2725 known replacement savings is zero. We will account for removal
2726 of dead instructions in lowest_cost_path or total_savings. */
2727 else
2728 {
2729 int cost = 0;
2730 if (!incr_vec[i].initializer)
2731 cost = mult_by_coeff_cost (incr, mode, speed);
2732
2733 if (speed)
1168caca 2734 cost = lowest_cost_path (cost, 0, first_dep, incr_vec[i].incr,
2735 DONT_COUNT_PHIS);
9ce0359e 2736 else
1168caca 2737 cost -= total_savings (0, first_dep, incr_vec[i].incr,
2738 DONT_COUNT_PHIS);
9ce0359e 2739
2740 incr_vec[i].cost = cost;
2741 }
2742 }
2743}
2744
2745/* Return the nearest common dominator of BB1 and BB2. If the blocks
2746 are identical, return the earlier of C1 and C2 in *WHERE. Otherwise,
2747 if the NCD matches BB1, return C1 in *WHERE; if the NCD matches BB2,
2748 return C2 in *WHERE; and if the NCD matches neither, return NULL in
2749 *WHERE. Note: It is possible for one of C1 and C2 to be NULL. */
2750
2751static basic_block
2752ncd_for_two_cands (basic_block bb1, basic_block bb2,
2753 slsr_cand_t c1, slsr_cand_t c2, slsr_cand_t *where)
2754{
2755 basic_block ncd;
2756
2757 if (!bb1)
2758 {
2759 *where = c2;
2760 return bb2;
2761 }
2762
2763 if (!bb2)
2764 {
2765 *where = c1;
2766 return bb1;
2767 }
2768
2769 ncd = nearest_common_dominator (CDI_DOMINATORS, bb1, bb2);
2770
2771 /* If both candidates are in the same block, the earlier
2772 candidate wins. */
2773 if (bb1 == ncd && bb2 == ncd)
2774 {
2775 if (!c1 || (c2 && c2->cand_num < c1->cand_num))
2776 *where = c2;
2777 else
2778 *where = c1;
2779 }
2780
2781 /* Otherwise, if one of them produced a candidate in the
2782 dominator, that one wins. */
2783 else if (bb1 == ncd)
2784 *where = c1;
2785
2786 else if (bb2 == ncd)
2787 *where = c2;
2788
2789 /* If neither matches the dominator, neither wins. */
2790 else
2791 *where = NULL;
2792
2793 return ncd;
2794}
2795
1168caca 2796/* Consider all candidates that feed PHI. Find the nearest common
2797 dominator of those candidates requiring the given increment INCR.
2798 Further find and return the nearest common dominator of this result
2799 with block NCD. If the returned block contains one or more of the
2800 candidates, return the earliest candidate in the block in *WHERE. */
2801
2802static basic_block
2803ncd_with_phi (slsr_cand_t c, double_int incr, gimple phi,
2804 basic_block ncd, slsr_cand_t *where)
2805{
2806 unsigned i;
2807 slsr_cand_t basis = lookup_cand (c->basis);
2808 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (phi));
2809
2810 for (i = 0; i < gimple_phi_num_args (phi); i++)
2811 {
2812 tree arg = gimple_phi_arg_def (phi, i);
2813
2814 if (!operand_equal_p (arg, phi_cand->base_expr, 0))
2815 {
2816 gimple arg_def = SSA_NAME_DEF_STMT (arg);
2817
2818 if (gimple_code (arg_def) == GIMPLE_PHI)
2819 ncd = ncd_with_phi (c, incr, arg_def, ncd, where);
2820 else
2821 {
2822 slsr_cand_t arg_cand = base_cand_from_table (arg);
2823 double_int diff = arg_cand->index - basis->index;
2824
2825 if ((incr == diff) || (!address_arithmetic_p && incr == -diff))
2826 ncd = ncd_for_two_cands (ncd, gimple_bb (arg_cand->cand_stmt),
2827 *where, arg_cand, where);
2828 }
2829 }
2830 }
2831
2832 return ncd;
2833}
2834
2835/* Consider the candidate C together with any candidates that feed
2836 C's phi dependence (if any). Find and return the nearest common
2837 dominator of those candidates requiring the given increment INCR.
2838 If the returned block contains one or more of the candidates,
2839 return the earliest candidate in the block in *WHERE. */
2840
2841static basic_block
2842ncd_of_cand_and_phis (slsr_cand_t c, double_int incr, slsr_cand_t *where)
2843{
2844 basic_block ncd = NULL;
2845
2846 if (cand_abs_increment (c) == incr)
2847 {
2848 ncd = gimple_bb (c->cand_stmt);
2849 *where = c;
2850 }
2851
2852 if (phi_dependent_cand_p (c))
2853 ncd = ncd_with_phi (c, incr, lookup_cand (c->def_phi)->cand_stmt,
2854 ncd, where);
2855
2856 return ncd;
2857}
2858
9ce0359e 2859/* Consider all candidates in the tree rooted at C for which INCR
2860 represents the required increment of C relative to its basis.
2861 Find and return the basic block that most nearly dominates all
2862 such candidates. If the returned block contains one or more of
2863 the candidates, return the earliest candidate in the block in
2864 *WHERE. */
2865
2866static basic_block
2867nearest_common_dominator_for_cands (slsr_cand_t c, double_int incr,
2868 slsr_cand_t *where)
2869{
2870 basic_block sib_ncd = NULL, dep_ncd = NULL, this_ncd = NULL, ncd;
2871 slsr_cand_t sib_where = NULL, dep_where = NULL, this_where = NULL, new_where;
9ce0359e 2872
2873 /* First find the NCD of all siblings and dependents. */
2874 if (c->sibling)
2875 sib_ncd = nearest_common_dominator_for_cands (lookup_cand (c->sibling),
2876 incr, &sib_where);
2877 if (c->dependent)
2878 dep_ncd = nearest_common_dominator_for_cands (lookup_cand (c->dependent),
2879 incr, &dep_where);
2880 if (!sib_ncd && !dep_ncd)
2881 {
2882 new_where = NULL;
2883 ncd = NULL;
2884 }
2885 else if (sib_ncd && !dep_ncd)
2886 {
2887 new_where = sib_where;
2888 ncd = sib_ncd;
2889 }
2890 else if (dep_ncd && !sib_ncd)
2891 {
2892 new_where = dep_where;
2893 ncd = dep_ncd;
2894 }
2895 else
2896 ncd = ncd_for_two_cands (sib_ncd, dep_ncd, sib_where,
2897 dep_where, &new_where);
2898
2899 /* If the candidate's increment doesn't match the one we're interested
1168caca 2900 in (and nor do any increments for feeding defs of a phi-dependence),
2901 then the result depends only on siblings and dependents. */
2902 this_ncd = ncd_of_cand_and_phis (c, incr, &this_where);
9ce0359e 2903
1168caca 2904 if (!this_ncd || cand_already_replaced (c))
9ce0359e 2905 {
2906 *where = new_where;
2907 return ncd;
2908 }
2909
2910 /* Otherwise, compare this candidate with the result from all siblings
2911 and dependents. */
9ce0359e 2912 ncd = ncd_for_two_cands (ncd, this_ncd, new_where, this_where, where);
2913
2914 return ncd;
2915}
2916
2917/* Return TRUE if the increment indexed by INDEX is profitable to replace. */
2918
2919static inline bool
2920profitable_increment_p (unsigned index)
2921{
2922 return (incr_vec[index].cost <= COST_NEUTRAL);
2923}
2924
2925/* For each profitable increment in the increment vector not equal to
2926 0 or 1 (or -1, for non-pointer arithmetic), find the nearest common
2927 dominator of all statements in the candidate chain rooted at C
2928 that require that increment, and insert an initializer
2929 T_0 = stride * increment at that location. Record T_0 with the
2930 increment record. */
2931
2932static void
2933insert_initializers (slsr_cand_t c)
2934{
2935 unsigned i;
9ce0359e 2936
2937 for (i = 0; i < incr_vec_len; i++)
2938 {
2939 basic_block bb;
2940 slsr_cand_t where = NULL;
2941 gimple init_stmt;
2942 tree stride_type, new_name, incr_tree;
2943 double_int incr = incr_vec[i].incr;
2944
2945 if (!profitable_increment_p (i)
cf8f0e63 2946 || incr.is_one ()
2947 || (incr.is_minus_one ()
9ce0359e 2948 && gimple_assign_rhs_code (c->cand_stmt) != POINTER_PLUS_EXPR)
cf8f0e63 2949 || incr.is_zero ())
9ce0359e 2950 continue;
2951
2952 /* We may have already identified an existing initializer that
2953 will suffice. */
2954 if (incr_vec[i].initializer)
2955 {
2956 if (dump_file && (dump_flags & TDF_DETAILS))
2957 {
2958 fputs ("Using existing initializer: ", dump_file);
2959 print_gimple_stmt (dump_file,
2960 SSA_NAME_DEF_STMT (incr_vec[i].initializer),
2961 0, 0);
2962 }
2963 continue;
2964 }
2965
2966 /* Find the block that most closely dominates all candidates
2967 with this increment. If there is at least one candidate in
2968 that block, the earliest one will be returned in WHERE. */
2969 bb = nearest_common_dominator_for_cands (c, incr, &where);
2970
2971 /* Create a new SSA name to hold the initializer's value. */
2972 stride_type = TREE_TYPE (c->stride);
d54ab372 2973 new_name = make_temp_ssa_name (stride_type, NULL, "slsr");
9ce0359e 2974 incr_vec[i].initializer = new_name;
2975
2976 /* Create the initializer and insert it in the latest possible
2977 dominating position. */
2978 incr_tree = double_int_to_tree (stride_type, incr);
2979 init_stmt = gimple_build_assign_with_ops (MULT_EXPR, new_name,
2980 c->stride, incr_tree);
2981 if (where)
2982 {
2983 gimple_stmt_iterator gsi = gsi_for_stmt (where->cand_stmt);
2984 gsi_insert_before (&gsi, init_stmt, GSI_SAME_STMT);
2985 gimple_set_location (init_stmt, gimple_location (where->cand_stmt));
2986 }
2987 else
2988 {
2989 gimple_stmt_iterator gsi = gsi_last_bb (bb);
2990 gimple basis_stmt = lookup_cand (c->basis)->cand_stmt;
2991
2992 if (!gsi_end_p (gsi) && is_ctrl_stmt (gsi_stmt (gsi)))
2993 gsi_insert_before (&gsi, init_stmt, GSI_SAME_STMT);
2994 else
2995 gsi_insert_after (&gsi, init_stmt, GSI_SAME_STMT);
2996
2997 gimple_set_location (init_stmt, gimple_location (basis_stmt));
2998 }
2999
3000 if (dump_file && (dump_flags & TDF_DETAILS))
3001 {
3002 fputs ("Inserting initializer: ", dump_file);
3003 print_gimple_stmt (dump_file, init_stmt, 0, 0);
3004 }
3005 }
3006}
3007
1168caca 3008/* Return TRUE iff all required increments for candidates feeding PHI
3009 are profitable to replace on behalf of candidate C. */
3010
3011static bool
3012all_phi_incrs_profitable (slsr_cand_t c, gimple phi)
3013{
3014 unsigned i;
3015 slsr_cand_t basis = lookup_cand (c->basis);
3016 slsr_cand_t phi_cand = base_cand_from_table (gimple_phi_result (phi));
3017
3018 for (i = 0; i < gimple_phi_num_args (phi); i++)
3019 {
3020 tree arg = gimple_phi_arg_def (phi, i);
3021
3022 if (!operand_equal_p (arg, phi_cand->base_expr, 0))
3023 {
3024 gimple arg_def = SSA_NAME_DEF_STMT (arg);
3025
3026 if (gimple_code (arg_def) == GIMPLE_PHI)
3027 {
3028 if (!all_phi_incrs_profitable (c, arg_def))
3029 return false;
3030 }
3031 else
3032 {
d62a8480 3033 int j;
1168caca 3034 slsr_cand_t arg_cand = base_cand_from_table (arg);
3035 double_int increment = arg_cand->index - basis->index;
3036
3037 if (!address_arithmetic_p && increment.is_negative ())
3038 increment = -increment;
3039
3040 j = incr_vec_index (increment);
3041
3042 if (dump_file && (dump_flags & TDF_DETAILS))
3043 {
3044 fprintf (dump_file, " Conditional candidate %d, phi: ",
3045 c->cand_num);
3046 print_gimple_stmt (dump_file, phi, 0, 0);
3047 fputs (" increment: ", dump_file);
3048 dump_double_int (dump_file, increment, false);
d62a8480 3049 if (j < 0)
3050 fprintf (dump_file,
3051 "\n Not replaced; incr_vec overflow.\n");
3052 else {
3053 fprintf (dump_file, "\n cost: %d\n", incr_vec[j].cost);
3054 if (profitable_increment_p (j))
3055 fputs (" Replacing...\n", dump_file);
3056 else
3057 fputs (" Not replaced.\n", dump_file);
3058 }
1168caca 3059 }
3060
d62a8480 3061 if (j < 0 || !profitable_increment_p (j))
1168caca 3062 return false;
3063 }
3064 }
3065 }
3066
3067 return true;
3068}
3069
9ce0359e 3070/* Create a NOP_EXPR that copies FROM_EXPR into a new SSA name of
3071 type TO_TYPE, and insert it in front of the statement represented
3072 by candidate C. Use *NEW_VAR to create the new SSA name. Return
3073 the new SSA name. */
3074
3075static tree
d54ab372 3076introduce_cast_before_cand (slsr_cand_t c, tree to_type, tree from_expr)
9ce0359e 3077{
3078 tree cast_lhs;
3079 gimple cast_stmt;
3080 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
3081
d54ab372 3082 cast_lhs = make_temp_ssa_name (to_type, NULL, "slsr");
9ce0359e 3083 cast_stmt = gimple_build_assign_with_ops (NOP_EXPR, cast_lhs,
3084 from_expr, NULL_TREE);
3085 gimple_set_location (cast_stmt, gimple_location (c->cand_stmt));
3086 gsi_insert_before (&gsi, cast_stmt, GSI_SAME_STMT);
3087
3088 if (dump_file && (dump_flags & TDF_DETAILS))
3089 {
3090 fputs (" Inserting: ", dump_file);
3091 print_gimple_stmt (dump_file, cast_stmt, 0, 0);
3092 }
3093
3094 return cast_lhs;
3095}
3096
3097/* Replace the RHS of the statement represented by candidate C with
3098 NEW_CODE, NEW_RHS1, and NEW_RHS2, provided that to do so doesn't
3099 leave C unchanged or just interchange its operands. The original
3100 operation and operands are in OLD_CODE, OLD_RHS1, and OLD_RHS2.
3101 If the replacement was made and we are doing a details dump,
3102 return the revised statement, else NULL. */
3103
3104static gimple
3105replace_rhs_if_not_dup (enum tree_code new_code, tree new_rhs1, tree new_rhs2,
3106 enum tree_code old_code, tree old_rhs1, tree old_rhs2,
3107 slsr_cand_t c)
3108{
3109 if (new_code != old_code
3110 || ((!operand_equal_p (new_rhs1, old_rhs1, 0)
3111 || !operand_equal_p (new_rhs2, old_rhs2, 0))
3112 && (!operand_equal_p (new_rhs1, old_rhs2, 0)
3113 || !operand_equal_p (new_rhs2, old_rhs1, 0))))
3114 {
3115 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
3116 gimple_assign_set_rhs_with_ops (&gsi, new_code, new_rhs1, new_rhs2);
3117 update_stmt (gsi_stmt (gsi));
dc77dea1 3118 c->cand_stmt = gsi_stmt (gsi);
9ce0359e 3119
3120 if (dump_file && (dump_flags & TDF_DETAILS))
3121 return gsi_stmt (gsi);
3122 }
3123
3124 else if (dump_file && (dump_flags & TDF_DETAILS))
3125 fputs (" (duplicate, not actually replacing)\n", dump_file);
3126
3127 return NULL;
3128}
3129
3130/* Strength-reduce the statement represented by candidate C by replacing
3131 it with an equivalent addition or subtraction. I is the index into
3132 the increment vector identifying C's increment. NEW_VAR is used to
3133 create a new SSA name if a cast needs to be introduced. BASIS_NAME
3134 is the rhs1 to use in creating the add/subtract. */
3135
3136static void
d54ab372 3137replace_one_candidate (slsr_cand_t c, unsigned i, tree basis_name)
9ce0359e 3138{
3139 gimple stmt_to_print = NULL;
3140 tree orig_rhs1, orig_rhs2;
3141 tree rhs2;
3142 enum tree_code orig_code, repl_code;
3143 double_int cand_incr;
3144
3145 orig_code = gimple_assign_rhs_code (c->cand_stmt);
3146 orig_rhs1 = gimple_assign_rhs1 (c->cand_stmt);
3147 orig_rhs2 = gimple_assign_rhs2 (c->cand_stmt);
3148 cand_incr = cand_increment (c);
3149
3150 if (dump_file && (dump_flags & TDF_DETAILS))
3151 {
3152 fputs ("Replacing: ", dump_file);
3153 print_gimple_stmt (dump_file, c->cand_stmt, 0, 0);
3154 stmt_to_print = c->cand_stmt;
3155 }
3156
3157 if (address_arithmetic_p)
3158 repl_code = POINTER_PLUS_EXPR;
3159 else
3160 repl_code = PLUS_EXPR;
3161
3162 /* If the increment has an initializer T_0, replace the candidate
3163 statement with an add of the basis name and the initializer. */
3164 if (incr_vec[i].initializer)
3165 {
3166 tree init_type = TREE_TYPE (incr_vec[i].initializer);
3167 tree orig_type = TREE_TYPE (orig_rhs2);
3168
3169 if (types_compatible_p (orig_type, init_type))
3170 rhs2 = incr_vec[i].initializer;
3171 else
3172 rhs2 = introduce_cast_before_cand (c, orig_type,
d54ab372 3173 incr_vec[i].initializer);
9ce0359e 3174
cf8f0e63 3175 if (incr_vec[i].incr != cand_incr)
9ce0359e 3176 {
3177 gcc_assert (repl_code == PLUS_EXPR);
3178 repl_code = MINUS_EXPR;
3179 }
3180
3181 stmt_to_print = replace_rhs_if_not_dup (repl_code, basis_name, rhs2,
3182 orig_code, orig_rhs1, orig_rhs2,
3183 c);
3184 }
3185
3186 /* Otherwise, the increment is one of -1, 0, and 1. Replace
3187 with a subtract of the stride from the basis name, a copy
3188 from the basis name, or an add of the stride to the basis
3189 name, respectively. It may be necessary to introduce a
3190 cast (or reuse an existing cast). */
cf8f0e63 3191 else if (cand_incr.is_one ())
9ce0359e 3192 {
3193 tree stride_type = TREE_TYPE (c->stride);
3194 tree orig_type = TREE_TYPE (orig_rhs2);
3195
3196 if (types_compatible_p (orig_type, stride_type))
3197 rhs2 = c->stride;
3198 else
d54ab372 3199 rhs2 = introduce_cast_before_cand (c, orig_type, c->stride);
9ce0359e 3200
3201 stmt_to_print = replace_rhs_if_not_dup (repl_code, basis_name, rhs2,
3202 orig_code, orig_rhs1, orig_rhs2,
3203 c);
3204 }
3205
cf8f0e63 3206 else if (cand_incr.is_minus_one ())
9ce0359e 3207 {
3208 tree stride_type = TREE_TYPE (c->stride);
3209 tree orig_type = TREE_TYPE (orig_rhs2);
3210 gcc_assert (repl_code != POINTER_PLUS_EXPR);
3211
3212 if (types_compatible_p (orig_type, stride_type))
3213 rhs2 = c->stride;
3214 else
d54ab372 3215 rhs2 = introduce_cast_before_cand (c, orig_type, c->stride);
9ce0359e 3216
3217 if (orig_code != MINUS_EXPR
3218 || !operand_equal_p (basis_name, orig_rhs1, 0)
3219 || !operand_equal_p (rhs2, orig_rhs2, 0))
3220 {
3221 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
3222 gimple_assign_set_rhs_with_ops (&gsi, MINUS_EXPR, basis_name, rhs2);
3223 update_stmt (gsi_stmt (gsi));
dc77dea1 3224 c->cand_stmt = gsi_stmt (gsi);
9ce0359e 3225
3226 if (dump_file && (dump_flags & TDF_DETAILS))
3227 stmt_to_print = gsi_stmt (gsi);
3228 }
3229 else if (dump_file && (dump_flags & TDF_DETAILS))
3230 fputs (" (duplicate, not actually replacing)\n", dump_file);
3231 }
3232
cf8f0e63 3233 else if (cand_incr.is_zero ())
9ce0359e 3234 {
3235 tree lhs = gimple_assign_lhs (c->cand_stmt);
3236 tree lhs_type = TREE_TYPE (lhs);
3237 tree basis_type = TREE_TYPE (basis_name);
3238
3239 if (types_compatible_p (lhs_type, basis_type))
3240 {
3241 gimple copy_stmt = gimple_build_assign (lhs, basis_name);
3242 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
3243 gimple_set_location (copy_stmt, gimple_location (c->cand_stmt));
3244 gsi_replace (&gsi, copy_stmt, false);
8f0676e4 3245 c->cand_stmt = copy_stmt;
9ce0359e 3246
3247 if (dump_file && (dump_flags & TDF_DETAILS))
3248 stmt_to_print = copy_stmt;
3249 }
3250 else
3251 {
3252 gimple_stmt_iterator gsi = gsi_for_stmt (c->cand_stmt);
3253 gimple cast_stmt = gimple_build_assign_with_ops (NOP_EXPR, lhs,
3254 basis_name,
3255 NULL_TREE);
3256 gimple_set_location (cast_stmt, gimple_location (c->cand_stmt));
3257 gsi_replace (&gsi, cast_stmt, false);
8f0676e4 3258 c->cand_stmt = cast_stmt;
9ce0359e 3259
3260 if (dump_file && (dump_flags & TDF_DETAILS))
3261 stmt_to_print = cast_stmt;
3262 }
3263 }
3264 else
3265 gcc_unreachable ();
3266
3267 if (dump_file && (dump_flags & TDF_DETAILS) && stmt_to_print)
3268 {
3269 fputs ("With: ", dump_file);
3270 print_gimple_stmt (dump_file, stmt_to_print, 0, 0);
3271 fputs ("\n", dump_file);
3272 }
3273}
3274
3275/* For each candidate in the tree rooted at C, replace it with
3276 an increment if such has been shown to be profitable. */
3277
3278static void
3279replace_profitable_candidates (slsr_cand_t c)
3280{
3281 if (!cand_already_replaced (c))
3282 {
3283 double_int increment = cand_abs_increment (c);
9ce0359e 3284 enum tree_code orig_code = gimple_assign_rhs_code (c->cand_stmt);
d62a8480 3285 int i;
9ce0359e 3286
3287 i = incr_vec_index (increment);
3288
3289 /* Only process profitable increments. Nothing useful can be done
3290 to a cast or copy. */
d62a8480 3291 if (i >= 0
3292 && profitable_increment_p (i)
9ce0359e 3293 && orig_code != MODIFY_EXPR
3294 && orig_code != NOP_EXPR)
3295 {
1168caca 3296 if (phi_dependent_cand_p (c))
3297 {
3298 gimple phi = lookup_cand (c->def_phi)->cand_stmt;
3299
3300 if (all_phi_incrs_profitable (c, phi))
3301 {
3302 /* Look up the LHS SSA name from C's basis. This will be
3303 the RHS1 of the adds we will introduce to create new
3304 phi arguments. */
3305 slsr_cand_t basis = lookup_cand (c->basis);
3306 tree basis_name = gimple_assign_lhs (basis->cand_stmt);
3307
3308 /* Create a new phi statement that will represent C's true
3309 basis after the transformation is complete. */
3310 location_t loc = gimple_location (c->cand_stmt);
3311 tree name = create_phi_basis (c, phi, basis_name,
3312 loc, UNKNOWN_STRIDE);
3313
3314 /* Replace C with an add of the new basis phi and the
3315 increment. */
d54ab372 3316 replace_one_candidate (c, i, name);
1168caca 3317 }
3318 }
3319 else
3320 {
3321 slsr_cand_t basis = lookup_cand (c->basis);
3322 tree basis_name = gimple_assign_lhs (basis->cand_stmt);
d54ab372 3323 replace_one_candidate (c, i, basis_name);
1168caca 3324 }
9ce0359e 3325 }
3326 }
3327
3328 if (c->sibling)
3329 replace_profitable_candidates (lookup_cand (c->sibling));
3330
3331 if (c->dependent)
3332 replace_profitable_candidates (lookup_cand (c->dependent));
3333}
3334\f
4502f5d0 3335/* Analyze costs of related candidates in the candidate vector,
3336 and make beneficial replacements. */
3337
3338static void
3339analyze_candidates_and_replace (void)
3340{
3341 unsigned i;
3342 slsr_cand_t c;
3343
3344 /* Each candidate that has a null basis and a non-null
3345 dependent is the root of a tree of related statements.
3346 Analyze each tree to determine a subset of those
3347 statements that can be replaced with maximum benefit. */
f1f41a6c 3348 FOR_EACH_VEC_ELT (cand_vec, i, c)
4502f5d0 3349 {
3350 slsr_cand_t first_dep;
3351
3352 if (c->basis != 0 || c->dependent == 0)
3353 continue;
3354
3355 if (dump_file && (dump_flags & TDF_DETAILS))
3356 fprintf (dump_file, "\nProcessing dependency tree rooted at %d.\n",
3357 c->cand_num);
3358
3359 first_dep = lookup_cand (c->dependent);
3360
070bf980 3361 /* If this is a chain of CAND_REFs, unconditionally replace
3362 each of them with a strength-reduced data reference. */
3363 if (c->kind == CAND_REF)
3364 replace_refs (c);
3365
1168caca 3366 /* If the common stride of all related candidates is a known
3367 constant, each candidate without a phi-dependence can be
3368 profitably replaced. Each replaces a multiply by a single
3369 add, with the possibility that a feeding add also goes dead.
3370 A candidate with a phi-dependence is replaced only if the
3371 compensation code it requires is offset by the strength
3372 reduction savings. */
3373 else if (TREE_CODE (c->stride) == INTEGER_CST)
3374 replace_uncond_cands_and_profitable_phis (first_dep);
4502f5d0 3375
9ce0359e 3376 /* When the stride is an SSA name, it may still be profitable
3377 to replace some or all of the dependent candidates, depending
3378 on whether the introduced increments can be reused, or are
3379 less expensive to calculate than the replaced statements. */
3380 else
3381 {
9ce0359e 3382 enum machine_mode mode;
3383 bool speed;
3384
3385 /* Determine whether we'll be generating pointer arithmetic
3386 when replacing candidates. */
3387 address_arithmetic_p = (c->kind == CAND_ADD
fd291195 3388 && POINTER_TYPE_P (c->cand_type));
9ce0359e 3389
3390 /* If all candidates have already been replaced under other
3391 interpretations, nothing remains to be done. */
259c15e6 3392 if (!count_candidates (c))
9ce0359e 3393 continue;
3394
3395 /* Construct an array of increments for this candidate chain. */
259c15e6 3396 incr_vec = XNEWVEC (incr_info, MAX_INCR_VEC_LEN);
9ce0359e 3397 incr_vec_len = 0;
3398 record_increments (c);
3399
3400 /* Determine which increments are profitable to replace. */
3401 mode = TYPE_MODE (TREE_TYPE (gimple_assign_lhs (c->cand_stmt)));
3402 speed = optimize_cands_for_speed_p (c);
3403 analyze_increments (first_dep, mode, speed);
3404
3405 /* Insert initializers of the form T_0 = stride * increment
3406 for use in profitable replacements. */
3407 insert_initializers (first_dep);
3408 dump_incr_vec ();
3409
3410 /* Perform the replacements. */
3411 replace_profitable_candidates (first_dep);
3412 free (incr_vec);
3413 }
4502f5d0 3414 }
3415}
3416
3417static unsigned
3418execute_strength_reduction (void)
3419{
3420 struct dom_walk_data walk_data;
3421
3422 /* Create the obstack where candidates will reside. */
3423 gcc_obstack_init (&cand_obstack);
3424
3425 /* Allocate the candidate vector. */
f1f41a6c 3426 cand_vec.create (128);
4502f5d0 3427
3428 /* Allocate the mapping from statements to candidate indices. */
3429 stmt_cand_map = pointer_map_create ();
3430
3431 /* Create the obstack where candidate chains will reside. */
3432 gcc_obstack_init (&chain_obstack);
3433
c99e471e 3434 /* Allocate the mapping from base expressions to candidate chains. */
d9dd21a8 3435 base_cand_map.create (500);
4502f5d0 3436
3437 /* Initialize the loop optimizer. We need to detect flow across
3438 back edges, and this gives us dominator information as well. */
3439 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
3440
4502f5d0 3441 /* Set up callbacks for the generic dominator tree walker. */
3442 walk_data.dom_direction = CDI_DOMINATORS;
3443 walk_data.initialize_block_local_data = NULL;
3444 walk_data.before_dom_children = find_candidates_in_block;
3445 walk_data.after_dom_children = NULL;
3446 walk_data.global_data = NULL;
3447 walk_data.block_local_data_size = 0;
3448 init_walk_dominator_tree (&walk_data);
3449
3450 /* Walk the CFG in predominator order looking for strength reduction
3451 candidates. */
3452 walk_dominator_tree (&walk_data, ENTRY_BLOCK_PTR);
3453
3454 if (dump_file && (dump_flags & TDF_DETAILS))
3455 {
3456 dump_cand_vec ();
3457 dump_cand_chains ();
3458 }
3459
3460 /* Analyze costs and make appropriate replacements. */
3461 analyze_candidates_and_replace ();
3462
3463 /* Free resources. */
3464 fini_walk_dominator_tree (&walk_data);
3465 loop_optimizer_finalize ();
d9dd21a8 3466 base_cand_map.dispose ();
4502f5d0 3467 obstack_free (&chain_obstack, NULL);
3468 pointer_map_destroy (stmt_cand_map);
f1f41a6c 3469 cand_vec.release ();
4502f5d0 3470 obstack_free (&cand_obstack, NULL);
4502f5d0 3471
3472 return 0;
3473}
3474
3475static bool
3476gate_strength_reduction (void)
3477{
6de100ef 3478 return flag_tree_slsr;
4502f5d0 3479}
3480
cbe8bda8 3481namespace {
3482
3483const pass_data pass_data_strength_reduction =
3484{
3485 GIMPLE_PASS, /* type */
3486 "slsr", /* name */
3487 OPTGROUP_NONE, /* optinfo_flags */
3488 true, /* has_gate */
3489 true, /* has_execute */
3490 TV_GIMPLE_SLSR, /* tv_id */
3491 ( PROP_cfg | PROP_ssa ), /* properties_required */
3492 0, /* properties_provided */
3493 0, /* properties_destroyed */
3494 0, /* todo_flags_start */
3495 TODO_verify_ssa, /* todo_flags_finish */
4502f5d0 3496};
cbe8bda8 3497
3498class pass_strength_reduction : public gimple_opt_pass
3499{
3500public:
3501 pass_strength_reduction(gcc::context *ctxt)
3502 : gimple_opt_pass(pass_data_strength_reduction, ctxt)
3503 {}
3504
3505 /* opt_pass methods: */
3506 bool gate () { return gate_strength_reduction (); }
3507 unsigned int execute () { return execute_strength_reduction (); }
3508
3509}; // class pass_strength_reduction
3510
3511} // anon namespace
3512
3513gimple_opt_pass *
3514make_pass_strength_reduction (gcc::context *ctxt)
3515{
3516 return new pass_strength_reduction (ctxt);
3517}