]> git.ipfire.org Git - thirdparty/gcc.git/blob - gcc/lra-remat.c
Move MEMMODEL_* from coretypes.h to memmodel.h
[thirdparty/gcc.git] / gcc / lra-remat.c
1 /* Rematerialize pseudos values.
2 Copyright (C) 2014-2016 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 /* This code objective is to rematerialize spilled pseudo values. To
22 do this we calculate available insn candidates. The candidate is
23 available at some point if there is dominated set of insns with the
24 same pattern, the insn inputs are not dying or modified on any path
25 from the set, the outputs are not modified.
26
27 The insns containing memory or spilled pseudos (except for the
28 rematerialized pseudo) are not considered as such insns are not
29 profitable in comparison with regular loads of spilled pseudo
30 values. That simplifies the implementation as we don't need to
31 deal with memory aliasing.
32
33 To speed up available candidate calculation, we calculate partially
34 available candidates first and use them for initialization of the
35 availability. That is because (partial) availability sets are
36 sparse.
37
38 The rematerialization sub-pass could be improved further in the
39 following ways:
40
41 o We could make longer live ranges of inputs in the
42 rematerialization candidates if their hard registers are not used
43 for other purposes. This could be complicated if we need to
44 update BB live info information as LRA does not use
45 DF-infrastructure for compile-time reasons. This problem could
46 be overcome if constrain making live ranges longer only in BB/EBB
47 scope.
48 o We could use cost-based decision to choose rematerialization insn
49 (currently all insns without memory is can be used).
50 o We could use other free hard regs for unused output pseudos in
51 rematerialization candidates although such cases probably will
52 be very rare. */
53
54
55 #include "config.h"
56 #include "system.h"
57 #include "coretypes.h"
58 #include "backend.h"
59 #include "rtl.h"
60 #include "df.h"
61 #include "insn-config.h"
62 #include "regs.h"
63 #include "memmodel.h"
64 #include "ira.h"
65 #include "recog.h"
66 #include "lra.h"
67 #include "lra-int.h"
68
69 /* Number of candidates for rematerialization. */
70 static unsigned int cands_num;
71
72 /* The following is used for representation of call_used_reg_set in
73 form array whose elements are hard register numbers with nonzero bit
74 in CALL_USED_REG_SET. */
75 static int call_used_regs_arr_len;
76 static int call_used_regs_arr[FIRST_PSEUDO_REGISTER];
77
78 /* Bitmap used for different calculations. */
79 static bitmap_head temp_bitmap;
80
81 /* Registers accessed via subreg_p. */
82 static bitmap_head subreg_regs;
83
84 typedef struct cand *cand_t;
85 typedef const struct cand *const_cand_t;
86
87 /* Insn candidates for rematerialization. The candidate insn should
88 have the following properies:
89 o no any memory (as access to memory is non-profitable)
90 o no INOUT regs (it means no non-paradoxical subreg of output reg)
91 o one output spilled pseudo (or reload pseudo of a spilled pseudo)
92 o all other pseudos are with assigned hard regs. */
93 struct cand
94 {
95 /* Index of the candidates in all_cands. */
96 int index;
97 /* The candidate insn. */
98 rtx_insn *insn;
99 /* Insn pseudo regno for rematerialization. */
100 int regno;
101 /* Non-negative if a reload pseudo is in the insn instead of the
102 pseudo for rematerialization. */
103 int reload_regno;
104 /* Number of the operand containing the regno or its reload
105 regno. */
106 int nop;
107 /* Next candidate for the same regno. */
108 cand_t next_regno_cand;
109 };
110
111 /* Vector containing all candidates. */
112 static vec<cand_t> all_cands;
113 /* Map: insn -> candidate representing it. It is null if the insn can
114 not be used for rematerialization. */
115 static cand_t *insn_to_cand;
116 /* A secondary map, for candidates that involve two insns, where the
117 second one makes the equivalence. The candidate must not be used
118 before seeing this activation insn. */
119 static cand_t *insn_to_cand_activation;
120
121 /* Map regno -> candidates can be used for the regno
122 rematerialization. */
123 static cand_t *regno_cands;
124
125 /* Data about basic blocks used for the rematerialization
126 sub-pass. */
127 struct remat_bb_data
128 {
129 /* Basic block about which the below data are. */
130 basic_block bb;
131 /* Registers changed in the basic block: */
132 bitmap_head changed_regs;
133 /* Registers becoming dead in the BB. */
134 bitmap_head dead_regs;
135 /* Cands present in the BB whose in/out regs are not changed after
136 the cands occurence and are not dead (except the reload
137 regno). */
138 bitmap_head gen_cands;
139 bitmap_head livein_cands; /* cands whose inputs live at the BB start. */
140 bitmap_head pavin_cands; /* cands partially available at BB entry. */
141 bitmap_head pavout_cands; /* cands partially available at BB exit. */
142 bitmap_head avin_cands; /* cands available at the entry of the BB. */
143 bitmap_head avout_cands; /* cands available at the exit of the BB. */
144 };
145
146 /* Array for all BB data. Indexed by the corresponding BB index. */
147 typedef struct remat_bb_data *remat_bb_data_t;
148
149 /* Basic blocks for data flow problems -- all bocks except the special
150 ones. */
151 static bitmap_head all_blocks;
152
153 /* All basic block data are referred through the following array. */
154 static remat_bb_data_t remat_bb_data;
155
156 /* Two small functions for access to the bb data. */
157 static inline remat_bb_data_t
158 get_remat_bb_data (basic_block bb)
159 {
160 return &remat_bb_data[(bb)->index];
161 }
162
163 static inline remat_bb_data_t
164 get_remat_bb_data_by_index (int index)
165 {
166 return &remat_bb_data[index];
167 }
168
169 \f
170
171 /* Hash table for the candidates. Different insns (e.g. structurally
172 the same insns or even insns with different unused output regs) can
173 be represented by the same candidate in the table. */
174 static htab_t cand_table;
175
176 /* Hash function for candidate CAND. */
177 static hashval_t
178 cand_hash (const void *cand)
179 {
180 const_cand_t c = (const_cand_t) cand;
181 lra_insn_recog_data_t id = lra_get_insn_recog_data (c->insn);
182 struct lra_static_insn_data *static_id = id->insn_static_data;
183 int nops = static_id->n_operands;
184 hashval_t hash = 0;
185
186 for (int i = 0; i < nops; i++)
187 if (i == c->nop)
188 hash = iterative_hash_object (c->regno, hash);
189 else if (static_id->operand[i].type == OP_IN)
190 hash = iterative_hash_object (*id->operand_loc[i], hash);
191 return hash;
192 }
193
194 /* Equal function for candidates CAND1 and CAND2. They are equal if
195 the corresponding candidate insns have the same code, the same
196 regno for rematerialization, the same input operands. */
197 static int
198 cand_eq_p (const void *cand1, const void *cand2)
199 {
200 const_cand_t c1 = (const_cand_t) cand1;
201 const_cand_t c2 = (const_cand_t) cand2;
202 lra_insn_recog_data_t id1 = lra_get_insn_recog_data (c1->insn);
203 lra_insn_recog_data_t id2 = lra_get_insn_recog_data (c2->insn);
204 struct lra_static_insn_data *static_id1 = id1->insn_static_data;
205 int nops = static_id1->n_operands;
206
207 if (c1->regno != c2->regno
208 || INSN_CODE (c1->insn) < 0
209 || INSN_CODE (c1->insn) != INSN_CODE (c2->insn))
210 return false;
211 gcc_assert (c1->nop == c2->nop);
212 for (int i = 0; i < nops; i++)
213 if (i != c1->nop && static_id1->operand[i].type == OP_IN
214 && *id1->operand_loc[i] != *id2->operand_loc[i])
215 return false;
216 return true;
217 }
218
219 /* Insert candidate CAND into the table if it is not there yet.
220 Return candidate which is in the table. */
221 static cand_t
222 insert_cand (cand_t cand)
223 {
224 void **entry_ptr;
225
226 entry_ptr = htab_find_slot (cand_table, cand, INSERT);
227 if (*entry_ptr == NULL)
228 *entry_ptr = (void *) cand;
229 return (cand_t) *entry_ptr;
230 }
231
232 /* Free candidate CAND memory. */
233 static void
234 free_cand (void *cand)
235 {
236 free (cand);
237 }
238
239 /* Initiate the candidate table. */
240 static void
241 initiate_cand_table (void)
242 {
243 cand_table = htab_create (8000, cand_hash, cand_eq_p,
244 (htab_del) free_cand);
245 }
246
247 /* Finish the candidate table. */
248 static void
249 finish_cand_table (void)
250 {
251 htab_delete (cand_table);
252 }
253
254 \f
255
256 /* Return true if X contains memory or some UNSPEC. We can not just
257 check insn operands as memory or unspec might be not an operand
258 itself but contain an operand. Insn with memory access is not
259 profitable for rematerialization. Rematerialization of UNSPEC
260 might result in wrong code generation as the UNPEC effect is
261 unknown (e.g. generating a label). */
262 static bool
263 bad_for_rematerialization_p (rtx x)
264 {
265 int i, j;
266 const char *fmt;
267 enum rtx_code code;
268
269 if (MEM_P (x) || GET_CODE (x) == UNSPEC || GET_CODE (x) == UNSPEC_VOLATILE)
270 return true;
271 code = GET_CODE (x);
272 fmt = GET_RTX_FORMAT (code);
273 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
274 {
275 if (fmt[i] == 'e')
276 {
277 if (bad_for_rematerialization_p (XEXP (x, i)))
278 return true;
279 }
280 else if (fmt[i] == 'E')
281 {
282 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
283 if (bad_for_rematerialization_p (XVECEXP (x, i, j)))
284 return true;
285 }
286 }
287 return false;
288 }
289
290 /* If INSN can not be used for rematerialization, return negative
291 value. If INSN can be considered as a candidate for
292 rematerialization, return value which is the operand number of the
293 pseudo for which the insn can be used for rematerialization. Here
294 we consider the insns without any memory, spilled pseudo (except
295 for the rematerialization pseudo), or dying or unused regs. */
296 static int
297 operand_to_remat (rtx_insn *insn)
298 {
299 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
300 struct lra_static_insn_data *static_id = id->insn_static_data;
301 struct lra_insn_reg *reg, *found_reg = NULL;
302
303 /* Don't rematerialize insns which can change PC. */
304 if (JUMP_P (insn) || CALL_P (insn))
305 return -1;
306 /* First find a pseudo which can be rematerialized. */
307 for (reg = id->regs; reg != NULL; reg = reg->next)
308 {
309 /* True FRAME_POINTER_NEEDED might be because we can not follow
310 changing sp offsets, e.g. alloca is used. If the insn contains
311 stack pointer in such case, we can not rematerialize it as we
312 can not know sp offset at a rematerialization place. */
313 if (reg->regno == STACK_POINTER_REGNUM && frame_pointer_needed)
314 return -1;
315 else if (reg->type == OP_OUT && ! reg->subreg_p
316 && find_regno_note (insn, REG_UNUSED, reg->regno) == NULL)
317 {
318 /* We permits only one spilled reg. */
319 if (found_reg != NULL)
320 return -1;
321 found_reg = reg;
322 }
323 /* IRA calculates conflicts separately for subregs of two words
324 pseudo. Even if the pseudo lives, e.g. one its subreg can be
325 used lately, another subreg hard register can be already used
326 for something else. In such case, it is not safe to
327 rematerialize the insn. */
328 if (reg->regno >= FIRST_PSEUDO_REGISTER
329 && bitmap_bit_p (&subreg_regs, reg->regno))
330 return -1;
331
332 /* Don't allow hard registers to be rematerialized. */
333 if (reg->regno < FIRST_PSEUDO_REGISTER)
334 return -1;
335 }
336 if (found_reg == NULL)
337 return -1;
338 if (found_reg->regno < FIRST_PSEUDO_REGISTER)
339 return -1;
340 if (bad_for_rematerialization_p (PATTERN (insn)))
341 return -1;
342 /* Check the other regs are not spilled. */
343 for (reg = id->regs; reg != NULL; reg = reg->next)
344 if (found_reg == reg)
345 continue;
346 else if (reg->type == OP_INOUT)
347 return -1;
348 else if (reg->regno >= FIRST_PSEUDO_REGISTER
349 && reg_renumber[reg->regno] < 0)
350 /* Another spilled reg. */
351 return -1;
352 else if (reg->type == OP_IN)
353 {
354 if (find_regno_note (insn, REG_DEAD, reg->regno) != NULL)
355 /* We don't want to make live ranges longer. */
356 return -1;
357 /* Check that there is no output reg as the input one. */
358 for (struct lra_insn_reg *reg2 = id->regs;
359 reg2 != NULL;
360 reg2 = reg2->next)
361 if (reg2->type == OP_OUT && reg->regno == reg2->regno)
362 return -1;
363 if (reg->regno < FIRST_PSEUDO_REGISTER)
364 for (struct lra_insn_reg *reg2 = static_id->hard_regs;
365 reg2 != NULL;
366 reg2 = reg2->next)
367 if (reg2->type == OP_OUT
368 && reg->regno <= reg2->regno
369 && (reg2->regno
370 < (reg->regno
371 + hard_regno_nregs[reg->regno][reg->biggest_mode])))
372 return -1;
373 }
374 /* Check hard coded insn registers. */
375 for (struct lra_insn_reg *reg = static_id->hard_regs;
376 reg != NULL;
377 reg = reg->next)
378 if (reg->type == OP_INOUT)
379 return -1;
380 else if (reg->type == OP_IN)
381 {
382 /* Check that there is no output hard reg as the input
383 one. */
384 for (struct lra_insn_reg *reg2 = static_id->hard_regs;
385 reg2 != NULL;
386 reg2 = reg2->next)
387 if (reg2->type == OP_OUT && reg->regno == reg2->regno)
388 return -1;
389 }
390 /* Find the rematerialization operand. */
391 int nop = static_id->n_operands;
392 for (int i = 0; i < nop; i++)
393 if (REG_P (*id->operand_loc[i])
394 && (int) REGNO (*id->operand_loc[i]) == found_reg->regno)
395 return i;
396 return -1;
397 }
398
399 /* Create candidate for INSN with rematerialization operand NOP and
400 REGNO. Insert the candidate into the table and set up the
401 corresponding INSN_TO_CAND element. */
402 static void
403 create_cand (rtx_insn *insn, int nop, int regno, rtx_insn *activation = NULL)
404 {
405 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
406 rtx reg = *id->operand_loc[nop];
407 gcc_assert (REG_P (reg));
408 int op_regno = REGNO (reg);
409 gcc_assert (op_regno >= FIRST_PSEUDO_REGISTER);
410 cand_t cand = XNEW (struct cand);
411 cand->insn = insn;
412 cand->nop = nop;
413 cand->regno = regno;
414 cand->reload_regno = op_regno == regno ? -1 : op_regno;
415 gcc_assert (cand->regno >= 0);
416 cand_t cand_in_table = insert_cand (cand);
417 insn_to_cand[INSN_UID (insn)] = cand_in_table;
418 if (cand != cand_in_table)
419 free (cand);
420 else
421 {
422 /* A new cand. */
423 cand->index = all_cands.length ();
424 all_cands.safe_push (cand);
425 cand->next_regno_cand = regno_cands[cand->regno];
426 regno_cands[cand->regno] = cand;
427 }
428 if (activation)
429 insn_to_cand_activation[INSN_UID (activation)] = cand_in_table;
430 }
431
432 /* Create rematerialization candidates (inserting them into the
433 table). */
434 static void
435 create_cands (void)
436 {
437 rtx_insn *insn;
438 struct potential_cand
439 {
440 rtx_insn *insn;
441 int nop;
442 };
443 struct potential_cand *regno_potential_cand;
444
445 /* Create candidates. */
446 regno_potential_cand = XCNEWVEC (struct potential_cand, max_reg_num ());
447 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
448 if (NONDEBUG_INSN_P (insn))
449 {
450 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
451 int keep_regno = -1;
452 rtx set = single_set (insn);
453 int nop;
454
455 /* See if this is an output reload for a previous insn. */
456 if (set != NULL
457 && REG_P (SET_SRC (set)) && REG_P (SET_DEST (set)))
458 {
459 rtx dstreg = SET_DEST (set);
460 int src_regno = REGNO (SET_SRC (set));
461 int dst_regno = REGNO (dstreg);
462 rtx_insn *insn2 = regno_potential_cand[src_regno].insn;
463
464 if (insn2 != NULL
465 && dst_regno >= FIRST_PSEUDO_REGISTER
466 && reg_renumber[dst_regno] < 0
467 && BLOCK_FOR_INSN (insn2) == BLOCK_FOR_INSN (insn))
468 {
469 create_cand (insn2, regno_potential_cand[src_regno].nop,
470 dst_regno, insn);
471 goto done;
472 }
473 }
474
475 nop = operand_to_remat (insn);
476 if (nop >= 0)
477 {
478 gcc_assert (REG_P (*id->operand_loc[nop]));
479 int regno = REGNO (*id->operand_loc[nop]);
480 gcc_assert (regno >= FIRST_PSEUDO_REGISTER);
481 /* If we're setting an unrenumbered pseudo, make a candidate immediately.
482 If it's an output reload register, save it for later; the code above
483 looks for output reload insns later on. */
484 if (reg_renumber[regno] < 0)
485 create_cand (insn, nop, regno);
486 else if (regno >= lra_constraint_new_regno_start)
487 {
488 regno_potential_cand[regno].insn = insn;
489 regno_potential_cand[regno].nop = nop;
490 keep_regno = regno;
491 }
492 }
493
494 done:
495 for (struct lra_insn_reg *reg = id->regs; reg != NULL; reg = reg->next)
496 if (reg->type != OP_IN && reg->regno != keep_regno
497 && reg->regno >= FIRST_PSEUDO_REGISTER)
498 regno_potential_cand[reg->regno].insn = NULL;
499 }
500 cands_num = all_cands.length ();
501 free (regno_potential_cand);
502 }
503
504 \f
505
506 /* Create and initialize BB data. */
507 static void
508 create_remat_bb_data (void)
509 {
510 basic_block bb;
511 remat_bb_data_t bb_info;
512
513 remat_bb_data = XNEWVEC (struct remat_bb_data,
514 last_basic_block_for_fn (cfun));
515 FOR_ALL_BB_FN (bb, cfun)
516 {
517 gcc_checking_assert (bb->index >= 0
518 && bb->index < last_basic_block_for_fn (cfun));
519 bb_info = get_remat_bb_data (bb);
520 bb_info->bb = bb;
521 bitmap_initialize (&bb_info->changed_regs, &reg_obstack);
522 bitmap_initialize (&bb_info->dead_regs, &reg_obstack);
523 bitmap_initialize (&bb_info->gen_cands, &reg_obstack);
524 bitmap_initialize (&bb_info->livein_cands, &reg_obstack);
525 bitmap_initialize (&bb_info->pavin_cands, &reg_obstack);
526 bitmap_initialize (&bb_info->pavout_cands, &reg_obstack);
527 bitmap_initialize (&bb_info->avin_cands, &reg_obstack);
528 bitmap_initialize (&bb_info->avout_cands, &reg_obstack);
529 }
530 }
531
532 /* Dump all candidates to DUMP_FILE. */
533 static void
534 dump_cands (FILE *dump_file)
535 {
536 int i;
537 cand_t cand;
538
539 fprintf (dump_file, "\nCands:\n");
540 for (i = 0; i < (int) cands_num; i++)
541 {
542 cand = all_cands[i];
543 fprintf (dump_file, "%d (nop=%d, remat_regno=%d, reload_regno=%d):\n",
544 i, cand->nop, cand->regno, cand->reload_regno);
545 print_inline_rtx (dump_file, cand->insn, 6);
546 fprintf (dump_file, "\n");
547 }
548 }
549
550 /* Dump all candidates and BB data. */
551 static void
552 dump_candidates_and_remat_bb_data (void)
553 {
554 basic_block bb;
555
556 if (lra_dump_file == NULL)
557 return;
558 dump_cands (lra_dump_file);
559 FOR_EACH_BB_FN (bb, cfun)
560 {
561 fprintf (lra_dump_file, "\nBB %d:\n", bb->index);
562 /* Livein */
563 fprintf (lra_dump_file, " register live in:");
564 dump_regset (df_get_live_in (bb), lra_dump_file);
565 putc ('\n', lra_dump_file);
566 /* Liveout */
567 fprintf (lra_dump_file, " register live out:");
568 dump_regset (df_get_live_out (bb), lra_dump_file);
569 putc ('\n', lra_dump_file);
570 /* Changed/dead regs: */
571 fprintf (lra_dump_file, " changed regs:");
572 dump_regset (&get_remat_bb_data (bb)->changed_regs, lra_dump_file);
573 putc ('\n', lra_dump_file);
574 fprintf (lra_dump_file, " dead regs:");
575 dump_regset (&get_remat_bb_data (bb)->dead_regs, lra_dump_file);
576 putc ('\n', lra_dump_file);
577 lra_dump_bitmap_with_title ("cands generated in BB",
578 &get_remat_bb_data (bb)->gen_cands, bb->index);
579 lra_dump_bitmap_with_title ("livein cands in BB",
580 &get_remat_bb_data (bb)->livein_cands, bb->index);
581 lra_dump_bitmap_with_title ("pavin cands in BB",
582 &get_remat_bb_data (bb)->pavin_cands, bb->index);
583 lra_dump_bitmap_with_title ("pavout cands in BB",
584 &get_remat_bb_data (bb)->pavout_cands, bb->index);
585 lra_dump_bitmap_with_title ("avin cands in BB",
586 &get_remat_bb_data (bb)->avin_cands, bb->index);
587 lra_dump_bitmap_with_title ("avout cands in BB",
588 &get_remat_bb_data (bb)->avout_cands, bb->index);
589 }
590 fprintf (lra_dump_file, "subreg regs:");
591 dump_regset (&subreg_regs, lra_dump_file);
592 putc ('\n', lra_dump_file);
593 }
594
595 /* Free all BB data. */
596 static void
597 finish_remat_bb_data (void)
598 {
599 basic_block bb;
600
601 FOR_EACH_BB_FN (bb, cfun)
602 {
603 bitmap_clear (&get_remat_bb_data (bb)->avout_cands);
604 bitmap_clear (&get_remat_bb_data (bb)->avin_cands);
605 bitmap_clear (&get_remat_bb_data (bb)->pavout_cands);
606 bitmap_clear (&get_remat_bb_data (bb)->pavin_cands);
607 bitmap_clear (&get_remat_bb_data (bb)->livein_cands);
608 bitmap_clear (&get_remat_bb_data (bb)->gen_cands);
609 bitmap_clear (&get_remat_bb_data (bb)->dead_regs);
610 bitmap_clear (&get_remat_bb_data (bb)->changed_regs);
611 }
612 free (remat_bb_data);
613 }
614
615 \f
616
617 /* Update changed_regs, dead_regs, subreg_regs of BB from INSN. */
618 static void
619 set_bb_regs (basic_block bb, rtx_insn *insn)
620 {
621 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
622 remat_bb_data_t bb_info = get_remat_bb_data (bb);
623 struct lra_insn_reg *reg;
624
625 for (reg = id->regs; reg != NULL; reg = reg->next)
626 {
627 unsigned regno = reg->regno;
628 if (reg->type != OP_IN)
629 bitmap_set_bit (&bb_info->changed_regs, regno);
630 else if (find_regno_note (insn, REG_DEAD, regno) != NULL)
631 bitmap_set_bit (&bb_info->dead_regs, regno);
632 if (regno >= FIRST_PSEUDO_REGISTER && reg->subreg_p)
633 bitmap_set_bit (&subreg_regs, regno);
634 }
635 if (CALL_P (insn))
636 for (int i = 0; i < call_used_regs_arr_len; i++)
637 bitmap_set_bit (&get_remat_bb_data (bb)->dead_regs,
638 call_used_regs_arr[i]);
639 }
640
641 /* Calculate changed_regs and dead_regs for each BB. */
642 static void
643 calculate_local_reg_remat_bb_data (void)
644 {
645 basic_block bb;
646 rtx_insn *insn;
647
648 FOR_EACH_BB_FN (bb, cfun)
649 FOR_BB_INSNS (bb, insn)
650 if (NONDEBUG_INSN_P (insn))
651 set_bb_regs (bb, insn);
652 }
653
654 \f
655
656 /* Return true if REG overlaps an input operand of INSN. */
657 static bool
658 reg_overlap_for_remat_p (lra_insn_reg *reg, rtx_insn *insn)
659 {
660 int iter;
661 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
662 struct lra_static_insn_data *static_id = id->insn_static_data;
663 unsigned regno = reg->regno;
664 int nregs;
665
666 if (regno >= FIRST_PSEUDO_REGISTER && reg_renumber[regno] >= 0)
667 regno = reg_renumber[regno];
668 if (regno >= FIRST_PSEUDO_REGISTER)
669 nregs = 1;
670 else
671 nregs = hard_regno_nregs[regno][reg->biggest_mode];
672
673 struct lra_insn_reg *reg2;
674
675 for (iter = 0; iter < 2; iter++)
676 for (reg2 = (iter == 0 ? id->regs : static_id->hard_regs);
677 reg2 != NULL;
678 reg2 = reg2->next)
679 {
680 if (reg2->type != OP_IN)
681 continue;
682 unsigned regno2 = reg2->regno;
683 int nregs2;
684
685 if (regno2 >= FIRST_PSEUDO_REGISTER && reg_renumber[regno2] >= 0)
686 regno2 = reg_renumber[regno2];
687 if (regno >= FIRST_PSEUDO_REGISTER)
688 nregs2 = 1;
689 else
690 nregs2 = hard_regno_nregs[regno2][reg->biggest_mode];
691
692 if ((regno2 + nregs2 - 1 >= regno && regno2 < regno + nregs)
693 || (regno + nregs - 1 >= regno2 && regno < regno2 + nregs2))
694 return true;
695 }
696 return false;
697 }
698
699 /* Return true if a call used register is an input operand of INSN. */
700 static bool
701 call_used_input_regno_present_p (rtx_insn *insn)
702 {
703 int iter;
704 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
705 struct lra_static_insn_data *static_id = id->insn_static_data;
706 struct lra_insn_reg *reg;
707
708 for (iter = 0; iter < 2; iter++)
709 for (reg = (iter == 0 ? id->regs : static_id->hard_regs);
710 reg != NULL;
711 reg = reg->next)
712 if (reg->type == OP_IN && reg->regno <= FIRST_PSEUDO_REGISTER
713 && TEST_HARD_REG_BIT (call_used_reg_set, reg->regno))
714 return true;
715 return false;
716 }
717
718 /* Calculate livein_cands for each BB. */
719 static void
720 calculate_livein_cands (void)
721 {
722 basic_block bb;
723
724 FOR_EACH_BB_FN (bb, cfun)
725 {
726 bitmap livein_regs = df_get_live_in (bb);
727 bitmap livein_cands = &get_remat_bb_data (bb)->livein_cands;
728 for (unsigned int i = 0; i < cands_num; i++)
729 {
730 cand_t cand = all_cands[i];
731 lra_insn_recog_data_t id = lra_get_insn_recog_data (cand->insn);
732 struct lra_insn_reg *reg;
733
734 for (reg = id->regs; reg != NULL; reg = reg->next)
735 if (reg->type == OP_IN && ! bitmap_bit_p (livein_regs, reg->regno))
736 break;
737 if (reg == NULL)
738 bitmap_set_bit (livein_cands, i);
739 }
740 }
741 }
742
743 /* Calculate gen_cands for each BB. */
744 static void
745 calculate_gen_cands (void)
746 {
747 basic_block bb;
748 bitmap gen_cands;
749 bitmap_head gen_insns;
750 rtx_insn *insn;
751
752 bitmap_initialize (&gen_insns, &reg_obstack);
753 FOR_EACH_BB_FN (bb, cfun)
754 {
755 gen_cands = &get_remat_bb_data (bb)->gen_cands;
756 bitmap_clear (&gen_insns);
757 FOR_BB_INSNS (bb, insn)
758 if (INSN_P (insn))
759 {
760 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
761 struct lra_static_insn_data *static_id = id->insn_static_data;
762 struct lra_insn_reg *reg;
763 unsigned int uid;
764 bitmap_iterator bi;
765 cand_t cand;
766 rtx set;
767 int iter;
768 int src_regno = -1, dst_regno = -1;
769
770 if ((set = single_set (insn)) != NULL
771 && REG_P (SET_SRC (set)) && REG_P (SET_DEST (set)))
772 {
773 src_regno = REGNO (SET_SRC (set));
774 dst_regno = REGNO (SET_DEST (set));
775 }
776
777 /* Update gen_cands: */
778 bitmap_clear (&temp_bitmap);
779 for (iter = 0; iter < 2; iter++)
780 for (reg = (iter == 0 ? id->regs : static_id->hard_regs);
781 reg != NULL;
782 reg = reg->next)
783 if (reg->type != OP_IN
784 || find_regno_note (insn, REG_DEAD, reg->regno) != NULL)
785 EXECUTE_IF_SET_IN_BITMAP (&gen_insns, 0, uid, bi)
786 {
787 rtx_insn *insn2 = lra_insn_recog_data[uid]->insn;
788
789 cand = insn_to_cand[INSN_UID (insn2)];
790 gcc_assert (cand != NULL);
791 /* Ignore the reload insn. */
792 if (src_regno == cand->reload_regno
793 && dst_regno == cand->regno)
794 continue;
795 if (cand->regno == reg->regno
796 || reg_overlap_for_remat_p (reg, insn2))
797 {
798 bitmap_clear_bit (gen_cands, cand->index);
799 bitmap_set_bit (&temp_bitmap, uid);
800 }
801 }
802
803 if (CALL_P (insn))
804 EXECUTE_IF_SET_IN_BITMAP (&gen_insns, 0, uid, bi)
805 {
806 rtx_insn *insn2 = lra_insn_recog_data[uid]->insn;
807
808 cand = insn_to_cand[INSN_UID (insn2)];
809 gcc_assert (cand != NULL);
810 if (call_used_input_regno_present_p (insn2))
811 {
812 bitmap_clear_bit (gen_cands, cand->index);
813 bitmap_set_bit (&temp_bitmap, uid);
814 }
815 }
816 bitmap_and_compl_into (&gen_insns, &temp_bitmap);
817
818 cand = insn_to_cand[INSN_UID (insn)];
819 if (cand != NULL)
820 {
821 bitmap_set_bit (gen_cands, cand->index);
822 bitmap_set_bit (&gen_insns, INSN_UID (insn));
823 }
824 }
825 }
826 bitmap_clear (&gen_insns);
827 }
828
829 \f
830
831 /* The common transfer function used by the DF equation solver to
832 propagate (partial) availability info BB_IN to BB_OUT through block
833 with BB_INDEX according to the following equation:
834
835 bb.out = ((bb.in & bb.livein) - bb.killed) OR bb.gen
836 */
837 static bool
838 cand_trans_fun (int bb_index, bitmap bb_in, bitmap bb_out)
839 {
840 remat_bb_data_t bb_info;
841 bitmap bb_livein, bb_changed_regs, bb_dead_regs;
842 unsigned int cid;
843 bitmap_iterator bi;
844
845 bb_info = get_remat_bb_data_by_index (bb_index);
846 bb_livein = &bb_info->livein_cands;
847 bb_changed_regs = &bb_info->changed_regs;
848 bb_dead_regs = &bb_info->dead_regs;
849 /* Calculate killed avin cands -- cands whose regs are changed or
850 becoming dead in the BB. We calculate it here as we hope that
851 repeated calculations are compensated by smaller size of BB_IN in
852 comparison with all candidates number. */
853 bitmap_clear (&temp_bitmap);
854 EXECUTE_IF_SET_IN_BITMAP (bb_in, 0, cid, bi)
855 {
856 cand_t cand = all_cands[cid];
857 lra_insn_recog_data_t id = lra_get_insn_recog_data (cand->insn);
858 struct lra_insn_reg *reg;
859
860 if (! bitmap_bit_p (bb_livein, cid))
861 {
862 bitmap_set_bit (&temp_bitmap, cid);
863 continue;
864 }
865 for (reg = id->regs; reg != NULL; reg = reg->next)
866 /* Ignore all outputs which are not the regno for
867 rematerialization. */
868 if (reg->type == OP_OUT && reg->regno != cand->regno)
869 continue;
870 else if (bitmap_bit_p (bb_changed_regs, reg->regno)
871 || bitmap_bit_p (bb_dead_regs, reg->regno))
872 {
873 bitmap_set_bit (&temp_bitmap, cid);
874 break;
875 }
876 /* Check regno for rematerialization. */
877 if (bitmap_bit_p (bb_changed_regs, cand->regno)
878 || bitmap_bit_p (bb_dead_regs, cand->regno))
879 bitmap_set_bit (&temp_bitmap, cid);
880 }
881 return bitmap_ior_and_compl (bb_out,
882 &bb_info->gen_cands, bb_in, &temp_bitmap);
883 }
884
885 \f
886
887 /* The transfer function used by the DF equation solver to propagate
888 partial candidate availability info through block with BB_INDEX
889 according to the following equation:
890
891 bb.pavout = ((bb.pavin & bb.livein) - bb.killed) OR bb.gen
892 */
893 static bool
894 cand_pav_trans_fun (int bb_index)
895 {
896 remat_bb_data_t bb_info;
897
898 bb_info = get_remat_bb_data_by_index (bb_index);
899 return cand_trans_fun (bb_index, &bb_info->pavin_cands,
900 &bb_info->pavout_cands);
901 }
902
903 /* The confluence function used by the DF equation solver to set up
904 cand_pav info for a block BB without predecessor. */
905 static void
906 cand_pav_con_fun_0 (basic_block bb)
907 {
908 bitmap_clear (&get_remat_bb_data (bb)->pavin_cands);
909 }
910
911 /* The confluence function used by the DF equation solver to propagate
912 partial candidate availability info from predecessor to successor
913 on edge E (pred->bb) according to the following equation:
914
915 bb.pavin_cands = 0 for entry block | OR (pavout_cands of predecessors)
916 */
917 static bool
918 cand_pav_con_fun_n (edge e)
919 {
920 basic_block pred = e->src;
921 basic_block bb = e->dest;
922 remat_bb_data_t bb_info;
923 bitmap bb_pavin, pred_pavout;
924
925 bb_info = get_remat_bb_data (bb);
926 bb_pavin = &bb_info->pavin_cands;
927 pred_pavout = &get_remat_bb_data (pred)->pavout_cands;
928 return bitmap_ior_into (bb_pavin, pred_pavout);
929 }
930
931 \f
932
933 /* The transfer function used by the DF equation solver to propagate
934 candidate availability info through block with BB_INDEX according
935 to the following equation:
936
937 bb.avout = ((bb.avin & bb.livein) - bb.killed) OR bb.gen
938 */
939 static bool
940 cand_av_trans_fun (int bb_index)
941 {
942 remat_bb_data_t bb_info;
943
944 bb_info = get_remat_bb_data_by_index (bb_index);
945 return cand_trans_fun (bb_index, &bb_info->avin_cands,
946 &bb_info->avout_cands);
947 }
948
949 /* The confluence function used by the DF equation solver to set up
950 cand_av info for a block BB without predecessor. */
951 static void
952 cand_av_con_fun_0 (basic_block bb)
953 {
954 bitmap_clear (&get_remat_bb_data (bb)->avin_cands);
955 }
956
957 /* The confluence function used by the DF equation solver to propagate
958 cand_av info from predecessor to successor on edge E (pred->bb)
959 according to the following equation:
960
961 bb.avin_cands = 0 for entry block | AND (avout_cands of predecessors)
962 */
963 static bool
964 cand_av_con_fun_n (edge e)
965 {
966 basic_block pred = e->src;
967 basic_block bb = e->dest;
968 remat_bb_data_t bb_info;
969 bitmap bb_avin, pred_avout;
970
971 bb_info = get_remat_bb_data (bb);
972 bb_avin = &bb_info->avin_cands;
973 pred_avout = &get_remat_bb_data (pred)->avout_cands;
974 return bitmap_and_into (bb_avin, pred_avout);
975 }
976
977 /* Calculate available candidates for each BB. */
978 static void
979 calculate_global_remat_bb_data (void)
980 {
981 basic_block bb;
982
983 df_simple_dataflow
984 (DF_FORWARD, NULL, cand_pav_con_fun_0, cand_pav_con_fun_n,
985 cand_pav_trans_fun, &all_blocks,
986 df_get_postorder (DF_FORWARD), df_get_n_blocks (DF_FORWARD));
987 /* Initialize avin by pavin. */
988 FOR_EACH_BB_FN (bb, cfun)
989 bitmap_copy (&get_remat_bb_data (bb)->avin_cands,
990 &get_remat_bb_data (bb)->pavin_cands);
991 df_simple_dataflow
992 (DF_FORWARD, NULL, cand_av_con_fun_0, cand_av_con_fun_n,
993 cand_av_trans_fun, &all_blocks,
994 df_get_postorder (DF_FORWARD), df_get_n_blocks (DF_FORWARD));
995 }
996
997 \f
998
999 /* Setup sp offset attribute to SP_OFFSET for all INSNS. */
1000 static void
1001 change_sp_offset (rtx_insn *insns, HOST_WIDE_INT sp_offset)
1002 {
1003 for (rtx_insn *insn = insns; insn != NULL; insn = NEXT_INSN (insn))
1004 eliminate_regs_in_insn (insn, false, false, sp_offset);
1005 }
1006
1007 /* Return start hard register of REG (can be a hard or a pseudo reg)
1008 or -1 (if it is a spilled pseudo). Return number of hard registers
1009 occupied by REG through parameter NREGS if the start hard reg is
1010 not negative. */
1011 static int
1012 get_hard_regs (struct lra_insn_reg *reg, int &nregs)
1013 {
1014 int regno = reg->regno;
1015 int hard_regno = regno < FIRST_PSEUDO_REGISTER ? regno : reg_renumber[regno];
1016
1017 if (hard_regno >= 0)
1018 nregs = hard_regno_nregs[hard_regno][reg->biggest_mode];
1019 return hard_regno;
1020 }
1021
1022 /* Make copy of and register scratch pseudos in rematerialized insn
1023 REMAT_INSN. */
1024 static void
1025 update_scratch_ops (rtx_insn *remat_insn)
1026 {
1027 lra_insn_recog_data_t id = lra_get_insn_recog_data (remat_insn);
1028 struct lra_static_insn_data *static_id = id->insn_static_data;
1029 for (int i = 0; i < static_id->n_operands; i++)
1030 {
1031 rtx *loc = id->operand_loc[i];
1032 if (! REG_P (*loc))
1033 continue;
1034 int regno = REGNO (*loc);
1035 if (! lra_former_scratch_p (regno))
1036 continue;
1037 *loc = lra_create_new_reg (GET_MODE (*loc), *loc,
1038 lra_get_allocno_class (regno),
1039 "scratch pseudo copy");
1040 lra_register_new_scratch_op (remat_insn, i);
1041 }
1042
1043 }
1044
1045 /* Insert rematerialization insns using the data-flow data calculated
1046 earlier. */
1047 static bool
1048 do_remat (void)
1049 {
1050 rtx_insn *insn;
1051 basic_block bb;
1052 bitmap_head avail_cands;
1053 bitmap_head active_cands;
1054 bool changed_p = false;
1055 /* Living hard regs and hard registers of living pseudos. */
1056 HARD_REG_SET live_hard_regs;
1057
1058 bitmap_initialize (&avail_cands, &reg_obstack);
1059 bitmap_initialize (&active_cands, &reg_obstack);
1060 FOR_EACH_BB_FN (bb, cfun)
1061 {
1062 REG_SET_TO_HARD_REG_SET (live_hard_regs, df_get_live_out (bb));
1063 bitmap_and (&avail_cands, &get_remat_bb_data (bb)->avin_cands,
1064 &get_remat_bb_data (bb)->livein_cands);
1065 /* Activating insns are always in the same block as their corresponding
1066 remat insn, so at the start of a block the two bitsets are equal. */
1067 bitmap_copy (&active_cands, &avail_cands);
1068 FOR_BB_INSNS (bb, insn)
1069 {
1070 if (!NONDEBUG_INSN_P (insn))
1071 continue;
1072
1073 lra_insn_recog_data_t id = lra_get_insn_recog_data (insn);
1074 struct lra_static_insn_data *static_id = id->insn_static_data;
1075 struct lra_insn_reg *reg;
1076 cand_t cand;
1077 unsigned int cid;
1078 bitmap_iterator bi;
1079 rtx set;
1080 int iter;
1081 int src_regno = -1, dst_regno = -1;
1082
1083 if ((set = single_set (insn)) != NULL
1084 && REG_P (SET_SRC (set)) && REG_P (SET_DEST (set)))
1085 {
1086 src_regno = REGNO (SET_SRC (set));
1087 dst_regno = REGNO (SET_DEST (set));
1088 }
1089
1090 cand = NULL;
1091 /* Check possibility of rematerialization (hard reg or
1092 unpsilled pseudo <- spilled pseudo): */
1093 if (dst_regno >= 0 && src_regno >= FIRST_PSEUDO_REGISTER
1094 && reg_renumber[src_regno] < 0
1095 && (dst_regno < FIRST_PSEUDO_REGISTER
1096 || reg_renumber[dst_regno] >= 0))
1097 {
1098 for (cand = regno_cands[src_regno];
1099 cand != NULL;
1100 cand = cand->next_regno_cand)
1101 if (bitmap_bit_p (&avail_cands, cand->index)
1102 && bitmap_bit_p (&active_cands, cand->index))
1103 break;
1104 }
1105 int i, hard_regno, nregs;
1106 rtx_insn *remat_insn = NULL;
1107 HOST_WIDE_INT cand_sp_offset = 0;
1108 if (cand != NULL)
1109 {
1110 lra_insn_recog_data_t cand_id
1111 = lra_get_insn_recog_data (cand->insn);
1112 struct lra_static_insn_data *static_cand_id
1113 = cand_id->insn_static_data;
1114 rtx saved_op = *cand_id->operand_loc[cand->nop];
1115
1116 /* Check clobbers do not kill something living. */
1117 gcc_assert (REG_P (saved_op));
1118 int ignore_regno = REGNO (saved_op);
1119
1120 for (reg = cand_id->regs; reg != NULL; reg = reg->next)
1121 if (reg->type != OP_IN && reg->regno != ignore_regno)
1122 {
1123 hard_regno = get_hard_regs (reg, nregs);
1124 gcc_assert (hard_regno >= 0);
1125 for (i = 0; i < nregs; i++)
1126 if (TEST_HARD_REG_BIT (live_hard_regs, hard_regno + i))
1127 break;
1128 if (i < nregs)
1129 break;
1130 }
1131
1132 if (reg == NULL)
1133 {
1134 for (reg = static_cand_id->hard_regs;
1135 reg != NULL;
1136 reg = reg->next)
1137 if (reg->type != OP_IN
1138 && TEST_HARD_REG_BIT (live_hard_regs, reg->regno))
1139 break;
1140 }
1141
1142 if (reg == NULL)
1143 {
1144 *cand_id->operand_loc[cand->nop] = SET_DEST (set);
1145 lra_update_insn_regno_info (cand->insn);
1146 bool ok_p = lra_constrain_insn (cand->insn);
1147 if (ok_p)
1148 {
1149 rtx remat_pat = copy_insn (PATTERN (cand->insn));
1150
1151 start_sequence ();
1152 emit_insn (remat_pat);
1153 remat_insn = get_insns ();
1154 end_sequence ();
1155 if (recog_memoized (remat_insn) < 0)
1156 remat_insn = NULL;
1157 cand_sp_offset = cand_id->sp_offset;
1158 }
1159 *cand_id->operand_loc[cand->nop] = saved_op;
1160 lra_update_insn_regno_info (cand->insn);
1161 }
1162 }
1163
1164 bitmap_clear (&temp_bitmap);
1165 /* Update avail_cands (see analogous code for
1166 calculate_gen_cands). */
1167 for (iter = 0; iter < 2; iter++)
1168 for (reg = (iter == 0 ? id->regs : static_id->hard_regs);
1169 reg != NULL;
1170 reg = reg->next)
1171 if (reg->type != OP_IN
1172 || find_regno_note (insn, REG_DEAD, reg->regno) != NULL)
1173 EXECUTE_IF_SET_IN_BITMAP (&avail_cands, 0, cid, bi)
1174 {
1175 cand = all_cands[cid];
1176
1177 /* Ignore the reload insn. */
1178 if (src_regno == cand->reload_regno
1179 && dst_regno == cand->regno)
1180 continue;
1181 if (cand->regno == reg->regno
1182 || reg_overlap_for_remat_p (reg, cand->insn))
1183 bitmap_set_bit (&temp_bitmap, cand->index);
1184 }
1185
1186 if (CALL_P (insn))
1187 EXECUTE_IF_SET_IN_BITMAP (&avail_cands, 0, cid, bi)
1188 {
1189 cand = all_cands[cid];
1190
1191 if (call_used_input_regno_present_p (cand->insn))
1192 bitmap_set_bit (&temp_bitmap, cand->index);
1193 }
1194
1195 bitmap_and_compl_into (&avail_cands, &temp_bitmap);
1196
1197 /* Now see whether a candidate is made active or available
1198 by this insn. */
1199 cand = insn_to_cand_activation[INSN_UID (insn)];
1200 if (cand)
1201 bitmap_set_bit (&active_cands, cand->index);
1202
1203 cand = insn_to_cand[INSN_UID (insn)];
1204 if (cand != NULL)
1205 {
1206 bitmap_set_bit (&avail_cands, cand->index);
1207 if (cand->reload_regno == -1)
1208 bitmap_set_bit (&active_cands, cand->index);
1209 else
1210 bitmap_clear_bit (&active_cands, cand->index);
1211 }
1212
1213 if (remat_insn != NULL)
1214 {
1215 HOST_WIDE_INT sp_offset_change = cand_sp_offset - id->sp_offset;
1216 if (sp_offset_change != 0)
1217 change_sp_offset (remat_insn, sp_offset_change);
1218 update_scratch_ops (remat_insn);
1219 lra_process_new_insns (insn, remat_insn, NULL,
1220 "Inserting rematerialization insn");
1221 lra_set_insn_deleted (insn);
1222 changed_p = true;
1223 continue;
1224 }
1225
1226 /* Update live hard regs: */
1227 for (reg = id->regs; reg != NULL; reg = reg->next)
1228 if (reg->type == OP_IN
1229 && find_regno_note (insn, REG_DEAD, reg->regno) != NULL)
1230 {
1231 if ((hard_regno = get_hard_regs (reg, nregs)) < 0)
1232 continue;
1233 for (i = 0; i < nregs; i++)
1234 CLEAR_HARD_REG_BIT (live_hard_regs, hard_regno + i);
1235 }
1236 /* Process also hard regs (e.g. CC register) which are part
1237 of insn definition. */
1238 for (reg = static_id->hard_regs; reg != NULL; reg = reg->next)
1239 if (reg->type == OP_IN
1240 && find_regno_note (insn, REG_DEAD, reg->regno) != NULL)
1241 CLEAR_HARD_REG_BIT (live_hard_regs, reg->regno);
1242 /* Inputs have been processed, now process outputs. */
1243 for (reg = id->regs; reg != NULL; reg = reg->next)
1244 if (reg->type != OP_IN
1245 && find_regno_note (insn, REG_UNUSED, reg->regno) == NULL)
1246 {
1247 if ((hard_regno = get_hard_regs (reg, nregs)) < 0)
1248 continue;
1249 for (i = 0; i < nregs; i++)
1250 SET_HARD_REG_BIT (live_hard_regs, hard_regno + i);
1251 }
1252 for (reg = static_id->hard_regs; reg != NULL; reg = reg->next)
1253 if (reg->type != OP_IN
1254 && find_regno_note (insn, REG_UNUSED, reg->regno) == NULL)
1255 SET_HARD_REG_BIT (live_hard_regs, reg->regno);
1256 }
1257 }
1258 bitmap_clear (&avail_cands);
1259 bitmap_clear (&active_cands);
1260 return changed_p;
1261 }
1262
1263 \f
1264
1265 /* Current number of rematerialization iteration. */
1266 int lra_rematerialization_iter;
1267
1268 /* Entry point of the rematerialization sub-pass. Return true if we
1269 did any rematerialization. */
1270 bool
1271 lra_remat (void)
1272 {
1273 basic_block bb;
1274 bool result;
1275 int max_regno = max_reg_num ();
1276
1277 if (! flag_lra_remat)
1278 return false;
1279 lra_rematerialization_iter++;
1280 if (lra_rematerialization_iter > LRA_MAX_REMATERIALIZATION_PASSES)
1281 return false;
1282 if (lra_dump_file != NULL)
1283 fprintf (lra_dump_file,
1284 "\n******** Rematerialization #%d: ********\n\n",
1285 lra_rematerialization_iter);
1286 timevar_push (TV_LRA_REMAT);
1287 insn_to_cand = XCNEWVEC (cand_t, get_max_uid ());
1288 insn_to_cand_activation = XCNEWVEC (cand_t, get_max_uid ());
1289 regno_cands = XCNEWVEC (cand_t, max_regno);
1290 all_cands.create (8000);
1291 call_used_regs_arr_len = 0;
1292 for (int i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1293 if (call_used_regs[i])
1294 call_used_regs_arr[call_used_regs_arr_len++] = i;
1295 initiate_cand_table ();
1296 create_remat_bb_data ();
1297 bitmap_initialize (&temp_bitmap, &reg_obstack);
1298 bitmap_initialize (&subreg_regs, &reg_obstack);
1299 calculate_local_reg_remat_bb_data ();
1300 create_cands ();
1301 calculate_livein_cands ();
1302 calculate_gen_cands ();
1303 bitmap_initialize (&all_blocks, &reg_obstack);
1304 FOR_ALL_BB_FN (bb, cfun)
1305 bitmap_set_bit (&all_blocks, bb->index);
1306 calculate_global_remat_bb_data ();
1307 dump_candidates_and_remat_bb_data ();
1308 result = do_remat ();
1309 all_cands.release ();
1310 bitmap_clear (&temp_bitmap);
1311 bitmap_clear (&subreg_regs);
1312 finish_remat_bb_data ();
1313 finish_cand_table ();
1314 bitmap_clear (&all_blocks);
1315 free (regno_cands);
1316 free (insn_to_cand);
1317 free (insn_to_cand_activation);
1318 timevar_pop (TV_LRA_REMAT);
1319 return result;
1320 }