]> git.ipfire.org Git - thirdparty/gcc.git/blame - gcc/lra-assigns.c
Remove AND_COMPL_HARD_REG_SET
[thirdparty/gcc.git] / gcc / lra-assigns.c
CommitLineData
55a2c322 1/* Assign reload pseudos.
a5544970 2 Copyright (C) 2010-2019 Free Software Foundation, Inc.
55a2c322
VM
3 Contributed by Vladimir Makarov <vmakarov@redhat.com>.
4
5This file is part of GCC.
6
7GCC is free software; you can redistribute it and/or modify it under
8the terms of the GNU General Public License as published by the Free
9Software Foundation; either version 3, or (at your option) any later
10version.
11
12GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13WARRANTY; without even the implied warranty of MERCHANTABILITY or
14FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15for more details.
16
17You should have received a copy of the GNU General Public License
18along with GCC; see the file COPYING3. If not see
19<http://www.gnu.org/licenses/>. */
20
21
22/* This file's main objective is to assign hard registers to reload
23 pseudos. It also tries to allocate hard registers to other
24 pseudos, but at a lower priority than the reload pseudos. The pass
25 does not transform the RTL.
26
27 We must allocate a hard register to every reload pseudo. We try to
28 increase the chances of finding a viable allocation by assigning
29 the pseudos in order of fewest available hard registers first. If
30 we still fail to find a hard register, we spill other (non-reload)
31 pseudos in order to make room.
32
33 find_hard_regno_for finds hard registers for allocation without
34 spilling. spill_for does the same with spilling. Both functions
35 use a cost model to determine the most profitable choice of hard
36 and spill registers.
37
38 Once we have finished allocating reload pseudos, we also try to
39 assign registers to other (non-reload) pseudos. This is useful if
40 hard registers were freed up by the spilling just described.
41
42 We try to assign hard registers by collecting pseudos into threads.
43 These threads contain reload and inheritance pseudos that are
44 connected by copies (move insns). Doing this improves the chances
45 of pseudos in the thread getting the same hard register and, as a
46 result, of allowing some move insns to be deleted.
47
48 When we assign a hard register to a pseudo, we decrease the cost of
49 using the same hard register for pseudos that are connected by
50 copies.
51
52 If two hard registers have the same frequency-derived cost, we
53 prefer hard registers with higher priorities. The mapping of
54 registers to priorities is controlled by the register_priority
55 target hook. For example, x86-64 has a few register priorities:
56 hard registers with and without REX prefixes have different
57 priorities. This permits us to generate smaller code as insns
58 without REX prefixes are shorter.
59
60 If a few hard registers are still equally good for the assignment,
61 we choose the least used hard register. It is called leveling and
62 may be profitable for some targets.
63
64 Only insns with changed allocation pseudos are processed on the
65 next constraint pass.
66
67 The pseudo live-ranges are used to find conflicting pseudos.
68
69 For understanding the code, it is important to keep in mind that
70 inheritance, split, and reload pseudos created since last
71 constraint pass have regno >= lra_constraint_new_regno_start.
72 Inheritance and split pseudos created on any pass are in the
73 corresponding bitmaps. Inheritance and split pseudos since the
74 last constraint pass have also the corresponding non-negative
75 restore_regno. */
76
77#include "config.h"
78#include "system.h"
79#include "coretypes.h"
c7131fb2 80#include "backend.h"
957060b5 81#include "target.h"
55a2c322 82#include "rtl.h"
957060b5
AM
83#include "tree.h"
84#include "predict.h"
c7131fb2 85#include "df.h"
4d0cdd0c 86#include "memmodel.h"
55a2c322 87#include "tm_p.h"
55a2c322 88#include "insn-config.h"
957060b5
AM
89#include "regs.h"
90#include "ira.h"
55a2c322 91#include "recog.h"
957060b5 92#include "rtl-error.h"
55a2c322 93#include "sparseset.h"
88def637 94#include "params.h"
c7131fb2 95#include "lra.h"
55a2c322
VM
96#include "lra-int.h"
97
f54437d5
VM
98/* Current iteration number of the pass and current iteration number
99 of the pass after the latest spill pass when any former reload
100 pseudo was spilled. */
101int lra_assignment_iter;
102int lra_assignment_iter_after_spill;
103
104/* Flag of spilling former reload pseudos on this pass. */
105static bool former_reload_pseudo_spill_p;
106
55a2c322
VM
107/* Array containing corresponding values of function
108 lra_get_allocno_class. It is used to speed up the code. */
109static enum reg_class *regno_allocno_class_array;
110
8a8330b7
VM
111/* Array containing lengths of pseudo live ranges. It is used to
112 speed up the code. */
113static int *regno_live_length;
114
55a2c322
VM
115/* Information about the thread to which a pseudo belongs. Threads are
116 a set of connected reload and inheritance pseudos with the same set of
117 available hard registers. Lone registers belong to their own threads. */
118struct regno_assign_info
119{
120 /* First/next pseudo of the same thread. */
121 int first, next;
122 /* Frequency of the thread (execution frequency of only reload
123 pseudos in the thread when the thread contains a reload pseudo).
124 Defined only for the first thread pseudo. */
125 int freq;
126};
127
128/* Map regno to the corresponding regno assignment info. */
129static struct regno_assign_info *regno_assign_info;
130
bc404e1b
VM
131/* All inherited, subreg or optional pseudos created before last spill
132 sub-pass. Such pseudos are permitted to get memory instead of hard
133 regs. */
134static bitmap_head non_reload_pseudos;
135
55a2c322
VM
136/* Process a pseudo copy with execution frequency COPY_FREQ connecting
137 REGNO1 and REGNO2 to form threads. */
138static void
139process_copy_to_form_thread (int regno1, int regno2, int copy_freq)
140{
141 int last, regno1_first, regno2_first;
142
143 lra_assert (regno1 >= lra_constraint_new_regno_start
144 && regno2 >= lra_constraint_new_regno_start);
145 regno1_first = regno_assign_info[regno1].first;
146 regno2_first = regno_assign_info[regno2].first;
147 if (regno1_first != regno2_first)
148 {
149 for (last = regno2_first;
150 regno_assign_info[last].next >= 0;
151 last = regno_assign_info[last].next)
152 regno_assign_info[last].first = regno1_first;
153 regno_assign_info[last].first = regno1_first;
154 regno_assign_info[last].next = regno_assign_info[regno1_first].next;
155 regno_assign_info[regno1_first].next = regno2_first;
156 regno_assign_info[regno1_first].freq
157 += regno_assign_info[regno2_first].freq;
158 }
159 regno_assign_info[regno1_first].freq -= 2 * copy_freq;
160 lra_assert (regno_assign_info[regno1_first].freq >= 0);
161}
162
163/* Initialize REGNO_ASSIGN_INFO and form threads. */
164static void
165init_regno_assign_info (void)
166{
167 int i, regno1, regno2, max_regno = max_reg_num ();
168 lra_copy_t cp;
f4eafc30 169
55a2c322
VM
170 regno_assign_info = XNEWVEC (struct regno_assign_info, max_regno);
171 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
172 {
173 regno_assign_info[i].first = i;
174 regno_assign_info[i].next = -1;
175 regno_assign_info[i].freq = lra_reg_info[i].freq;
176 }
177 /* Form the threads. */
178 for (i = 0; (cp = lra_get_copy (i)) != NULL; i++)
179 if ((regno1 = cp->regno1) >= lra_constraint_new_regno_start
180 && (regno2 = cp->regno2) >= lra_constraint_new_regno_start
181 && reg_renumber[regno1] < 0 && lra_reg_info[regno1].nrefs != 0
182 && reg_renumber[regno2] < 0 && lra_reg_info[regno2].nrefs != 0
183 && (ira_class_hard_regs_num[regno_allocno_class_array[regno1]]
184 == ira_class_hard_regs_num[regno_allocno_class_array[regno2]]))
185 process_copy_to_form_thread (regno1, regno2, cp->freq);
186}
187
188/* Free REGNO_ASSIGN_INFO. */
189static void
190finish_regno_assign_info (void)
191{
192 free (regno_assign_info);
193}
194
195/* The function is used to sort *reload* and *inheritance* pseudos to
196 try to assign them hard registers. We put pseudos from the same
197 thread always nearby. */
198static int
199reload_pseudo_compare_func (const void *v1p, const void *v2p)
200{
201 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
202 enum reg_class cl1 = regno_allocno_class_array[r1];
203 enum reg_class cl2 = regno_allocno_class_array[r2];
204 int diff;
f4eafc30 205
55a2c322
VM
206 lra_assert (r1 >= lra_constraint_new_regno_start
207 && r2 >= lra_constraint_new_regno_start);
f4eafc30 208
55a2c322
VM
209 /* Prefer to assign reload registers with smaller classes first to
210 guarantee assignment to all reload registers. */
211 if ((diff = (ira_class_hard_regs_num[cl1]
212 - ira_class_hard_regs_num[cl2])) != 0)
213 return diff;
47918951
VM
214 /* Allocate bigger pseudos first to avoid register file
215 fragmentation. */
216 if ((diff
217 = (ira_reg_class_max_nregs[cl2][lra_reg_info[r2].biggest_mode]
218 - ira_reg_class_max_nregs[cl1][lra_reg_info[r1].biggest_mode])) != 0)
219 return diff;
ffaea117
AM
220 if ((diff = (regno_assign_info[regno_assign_info[r2].first].freq
221 - regno_assign_info[regno_assign_info[r1].first].freq)) != 0)
222 return diff;
55a2c322
VM
223 /* Put pseudos from the thread nearby. */
224 if ((diff = regno_assign_info[r1].first - regno_assign_info[r2].first) != 0)
225 return diff;
8a8330b7
VM
226 /* Prefer pseudos with longer live ranges. It sets up better
227 prefered hard registers for the thread pseudos and decreases
228 register-register moves between the thread pseudos. */
229 if ((diff = regno_live_length[r2] - regno_live_length[r1]) != 0)
230 return diff;
55a2c322
VM
231 /* If regs are equally good, sort by their numbers, so that the
232 results of qsort leave nothing to chance. */
233 return r1 - r2;
234}
235
236/* The function is used to sort *non-reload* pseudos to try to assign
237 them hard registers. The order calculation is simpler than in the
238 previous function and based on the pseudo frequency usage. */
239static int
240pseudo_compare_func (const void *v1p, const void *v2p)
241{
242 int r1 = *(const int *) v1p, r2 = *(const int *) v2p;
243 int diff;
244
b81a2f0d
VM
245 /* Assign hard reg to static chain pointer first pseudo when
246 non-local goto is used. */
f0a40456
AM
247 if ((diff = (non_spilled_static_chain_regno_p (r2)
248 - non_spilled_static_chain_regno_p (r1))) != 0)
249 return diff;
b81a2f0d 250
55a2c322
VM
251 /* Prefer to assign more frequently used registers first. */
252 if ((diff = lra_reg_info[r2].freq - lra_reg_info[r1].freq) != 0)
253 return diff;
f4eafc30 254
55a2c322
VM
255 /* If regs are equally good, sort by their numbers, so that the
256 results of qsort leave nothing to chance. */
257 return r1 - r2;
258}
259
260/* Arrays of size LRA_LIVE_MAX_POINT mapping a program point to the
261 pseudo live ranges with given start point. We insert only live
262 ranges of pseudos interesting for assignment purposes. They are
263 reload pseudos and pseudos assigned to hard registers. */
264static lra_live_range_t *start_point_ranges;
265
266/* Used as a flag that a live range is not inserted in the start point
267 chain. */
268static struct lra_live_range not_in_chain_mark;
269
270/* Create and set up START_POINT_RANGES. */
271static void
272create_live_range_start_chains (void)
273{
274 int i, max_regno;
275 lra_live_range_t r;
276
277 start_point_ranges = XCNEWVEC (lra_live_range_t, lra_live_max_point);
278 max_regno = max_reg_num ();
279 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
280 if (i >= lra_constraint_new_regno_start || reg_renumber[i] >= 0)
281 {
282 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
283 {
284 r->start_next = start_point_ranges[r->start];
285 start_point_ranges[r->start] = r;
286 }
287 }
288 else
289 {
290 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
291 r->start_next = &not_in_chain_mark;
292 }
293}
294
295/* Insert live ranges of pseudo REGNO into start chains if they are
296 not there yet. */
297static void
298insert_in_live_range_start_chain (int regno)
299{
300 lra_live_range_t r = lra_reg_info[regno].live_ranges;
301
302 if (r->start_next != &not_in_chain_mark)
303 return;
304 for (; r != NULL; r = r->next)
305 {
306 r->start_next = start_point_ranges[r->start];
307 start_point_ranges[r->start] = r;
308 }
309}
310
311/* Free START_POINT_RANGES. */
312static void
313finish_live_range_start_chains (void)
314{
315 gcc_assert (start_point_ranges != NULL);
316 free (start_point_ranges);
317 start_point_ranges = NULL;
318}
319
320/* Map: program point -> bitmap of all pseudos living at the point and
321 assigned to hard registers. */
322static bitmap_head *live_hard_reg_pseudos;
323static bitmap_obstack live_hard_reg_pseudos_bitmap_obstack;
324
325/* reg_renumber corresponding to pseudos marked in
326 live_hard_reg_pseudos. reg_renumber might be not matched to
327 live_hard_reg_pseudos but live_pseudos_reg_renumber always reflects
328 live_hard_reg_pseudos. */
329static int *live_pseudos_reg_renumber;
330
331/* Sparseset used to calculate living hard reg pseudos for some program
332 point range. */
333static sparseset live_range_hard_reg_pseudos;
334
335/* Sparseset used to calculate living reload/inheritance pseudos for
336 some program point range. */
337static sparseset live_range_reload_inheritance_pseudos;
338
339/* Allocate and initialize the data about living pseudos at program
340 points. */
341static void
342init_lives (void)
343{
344 int i, max_regno = max_reg_num ();
345
346 live_range_hard_reg_pseudos = sparseset_alloc (max_regno);
347 live_range_reload_inheritance_pseudos = sparseset_alloc (max_regno);
348 live_hard_reg_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
349 bitmap_obstack_initialize (&live_hard_reg_pseudos_bitmap_obstack);
350 for (i = 0; i < lra_live_max_point; i++)
351 bitmap_initialize (&live_hard_reg_pseudos[i],
352 &live_hard_reg_pseudos_bitmap_obstack);
353 live_pseudos_reg_renumber = XNEWVEC (int, max_regno);
354 for (i = 0; i < max_regno; i++)
355 live_pseudos_reg_renumber[i] = -1;
356}
357
358/* Free the data about living pseudos at program points. */
359static void
360finish_lives (void)
361{
362 sparseset_free (live_range_hard_reg_pseudos);
363 sparseset_free (live_range_reload_inheritance_pseudos);
364 free (live_hard_reg_pseudos);
365 bitmap_obstack_release (&live_hard_reg_pseudos_bitmap_obstack);
366 free (live_pseudos_reg_renumber);
367}
368
369/* Update the LIVE_HARD_REG_PSEUDOS and LIVE_PSEUDOS_REG_RENUMBER
370 entries for pseudo REGNO. Assume that the register has been
371 spilled if FREE_P, otherwise assume that it has been assigned
372 reg_renumber[REGNO] (if >= 0). We also insert the pseudo live
373 ranges in the start chains when it is assumed to be assigned to a
374 hard register because we use the chains of pseudos assigned to hard
375 registers during allocation. */
376static void
377update_lives (int regno, bool free_p)
378{
379 int p;
380 lra_live_range_t r;
381
382 if (reg_renumber[regno] < 0)
383 return;
384 live_pseudos_reg_renumber[regno] = free_p ? -1 : reg_renumber[regno];
385 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
386 {
387 for (p = r->start; p <= r->finish; p++)
388 if (free_p)
389 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
390 else
391 {
392 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
393 insert_in_live_range_start_chain (regno);
394 }
395 }
396}
397
398/* Sparseset used to calculate reload pseudos conflicting with a given
399 pseudo when we are trying to find a hard register for the given
400 pseudo. */
401static sparseset conflict_reload_and_inheritance_pseudos;
402
403/* Map: program point -> bitmap of all reload and inheritance pseudos
404 living at the point. */
405static bitmap_head *live_reload_and_inheritance_pseudos;
406static bitmap_obstack live_reload_and_inheritance_pseudos_bitmap_obstack;
407
408/* Allocate and initialize data about living reload pseudos at any
409 given program point. */
410static void
411init_live_reload_and_inheritance_pseudos (void)
412{
413 int i, p, max_regno = max_reg_num ();
414 lra_live_range_t r;
f4eafc30 415
55a2c322
VM
416 conflict_reload_and_inheritance_pseudos = sparseset_alloc (max_regno);
417 live_reload_and_inheritance_pseudos = XNEWVEC (bitmap_head, lra_live_max_point);
418 bitmap_obstack_initialize (&live_reload_and_inheritance_pseudos_bitmap_obstack);
419 for (p = 0; p < lra_live_max_point; p++)
420 bitmap_initialize (&live_reload_and_inheritance_pseudos[p],
421 &live_reload_and_inheritance_pseudos_bitmap_obstack);
422 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
423 {
424 for (r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
425 for (p = r->start; p <= r->finish; p++)
426 bitmap_set_bit (&live_reload_and_inheritance_pseudos[p], i);
427 }
428}
429
430/* Finalize data about living reload pseudos at any given program
431 point. */
432static void
433finish_live_reload_and_inheritance_pseudos (void)
434{
435 sparseset_free (conflict_reload_and_inheritance_pseudos);
436 free (live_reload_and_inheritance_pseudos);
437 bitmap_obstack_release (&live_reload_and_inheritance_pseudos_bitmap_obstack);
438}
439
440/* The value used to check that cost of given hard reg is really
441 defined currently. */
442static int curr_hard_regno_costs_check = 0;
443/* Array used to check that cost of the corresponding hard reg (the
444 array element index) is really defined currently. */
445static int hard_regno_costs_check[FIRST_PSEUDO_REGISTER];
446/* The current costs of allocation of hard regs. Defined only if the
447 value of the corresponding element of the previous array is equal to
448 CURR_HARD_REGNO_COSTS_CHECK. */
449static int hard_regno_costs[FIRST_PSEUDO_REGISTER];
450
451/* Adjust cost of HARD_REGNO by INCR. Reset the cost first if it is
452 not defined yet. */
453static inline void
454adjust_hard_regno_cost (int hard_regno, int incr)
455{
456 if (hard_regno_costs_check[hard_regno] != curr_hard_regno_costs_check)
457 hard_regno_costs[hard_regno] = 0;
458 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
459 hard_regno_costs[hard_regno] += incr;
460}
461
462/* Try to find a free hard register for pseudo REGNO. Return the
463 hard register on success and set *COST to the cost of using
464 that register. (If several registers have equal cost, the one with
465 the highest priority wins.) Return -1 on failure.
466
9e038952
VM
467 If FIRST_P, return the first available hard reg ignoring other
468 criteria, e.g. allocation cost. This approach results in less hard
469 reg pool fragmentation and permit to allocate hard regs to reload
470 pseudos in complicated situations where pseudo sizes are different.
471
55a2c322 472 If TRY_ONLY_HARD_REGNO >= 0, consider only that hard register,
34349d55
VM
473 otherwise consider all hard registers in REGNO's class.
474
475 If REGNO_SET is not empty, only hard registers from the set are
476 considered. */
55a2c322 477static int
34349d55
VM
478find_hard_regno_for_1 (int regno, int *cost, int try_only_hard_regno,
479 bool first_p, HARD_REG_SET regno_set)
55a2c322
VM
480{
481 HARD_REG_SET conflict_set;
482 int best_cost = INT_MAX, best_priority = INT_MIN, best_usage = INT_MAX;
483 lra_live_range_t r;
484 int p, i, j, rclass_size, best_hard_regno, priority, hard_regno;
485 int hr, conflict_hr, nregs;
ef4bddc2 486 machine_mode biggest_mode;
55a2c322 487 unsigned int k, conflict_regno;
73ca989c
RS
488 poly_int64 offset;
489 int val, biggest_nregs, nregs_diff;
55a2c322
VM
490 enum reg_class rclass;
491 bitmap_iterator bi;
492 bool *rclass_intersect_p;
a4971e68 493 HARD_REG_SET impossible_start_hard_regs, available_regs;
55a2c322 494
34349d55 495 if (hard_reg_set_empty_p (regno_set))
6576d245 496 conflict_set = lra_no_alloc_regs;
34349d55 497 else
44942965 498 conflict_set = ~regno_set | lra_no_alloc_regs;
55a2c322
VM
499 rclass = regno_allocno_class_array[regno];
500 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
501 curr_hard_regno_costs_check++;
502 sparseset_clear (conflict_reload_and_inheritance_pseudos);
503 sparseset_clear (live_range_hard_reg_pseudos);
44942965 504 conflict_set |= lra_reg_info[regno].conflict_hard_regs;
55a2c322
VM
505 biggest_mode = lra_reg_info[regno].biggest_mode;
506 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
507 {
508 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
509 if (rclass_intersect_p[regno_allocno_class_array[k]])
510 sparseset_set_bit (live_range_hard_reg_pseudos, k);
511 EXECUTE_IF_SET_IN_BITMAP (&live_reload_and_inheritance_pseudos[r->start],
512 0, k, bi)
513 if (lra_reg_info[k].preferred_hard_regno1 >= 0
514 && live_pseudos_reg_renumber[k] < 0
515 && rclass_intersect_p[regno_allocno_class_array[k]])
516 sparseset_set_bit (conflict_reload_and_inheritance_pseudos, k);
517 for (p = r->start + 1; p <= r->finish; p++)
518 {
519 lra_live_range_t r2;
f4eafc30 520
55a2c322
VM
521 for (r2 = start_point_ranges[p];
522 r2 != NULL;
523 r2 = r2->start_next)
524 {
525 if (r2->regno >= lra_constraint_new_regno_start
526 && lra_reg_info[r2->regno].preferred_hard_regno1 >= 0
527 && live_pseudos_reg_renumber[r2->regno] < 0
528 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
529 sparseset_set_bit (conflict_reload_and_inheritance_pseudos,
530 r2->regno);
531 if (live_pseudos_reg_renumber[r2->regno] >= 0
532 && rclass_intersect_p[regno_allocno_class_array[r2->regno]])
533 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
534 }
535 }
536 }
537 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno1) >= 0)
538 {
539 adjust_hard_regno_cost
540 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit1);
541 if ((hard_regno = lra_reg_info[regno].preferred_hard_regno2) >= 0)
542 adjust_hard_regno_cost
543 (hard_regno, -lra_reg_info[regno].preferred_hard_regno_profit2);
544 }
545#ifdef STACK_REGS
546 if (lra_reg_info[regno].no_stack_p)
547 for (i = FIRST_STACK_REG; i <= LAST_STACK_REG; i++)
548 SET_HARD_REG_BIT (conflict_set, i);
549#endif
550 sparseset_clear_bit (conflict_reload_and_inheritance_pseudos, regno);
551 val = lra_reg_info[regno].val;
d70a81dd 552 offset = lra_reg_info[regno].offset;
55a2c322
VM
553 CLEAR_HARD_REG_SET (impossible_start_hard_regs);
554 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
9eb7045b
VM
555 {
556 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
557 if (lra_reg_val_equal_p (conflict_regno, val, offset))
558 {
559 conflict_hr = live_pseudos_reg_renumber[conflict_regno];
ad474626
RS
560 nregs = hard_regno_nregs (conflict_hr,
561 lra_reg_info[conflict_regno].biggest_mode);
9eb7045b
VM
562 /* Remember about multi-register pseudos. For example, 2
563 hard register pseudos can start on the same hard register
67914693 564 but cannot start on HR and HR+1/HR-1. */
9eb7045b
VM
565 for (hr = conflict_hr + 1;
566 hr < FIRST_PSEUDO_REGISTER && hr < conflict_hr + nregs;
567 hr++)
568 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
569 for (hr = conflict_hr - 1;
4edd6298 570 hr >= 0 && (int) end_hard_regno (biggest_mode, hr) > conflict_hr;
9eb7045b
VM
571 hr--)
572 SET_HARD_REG_BIT (impossible_start_hard_regs, hr);
573 }
574 else
575 {
b8506a8a 576 machine_mode biggest_conflict_mode
9eb7045b
VM
577 = lra_reg_info[conflict_regno].biggest_mode;
578 int biggest_conflict_nregs
ad474626 579 = hard_regno_nregs (conflict_hr, biggest_conflict_mode);
9eb7045b 580
ad474626
RS
581 nregs_diff
582 = (biggest_conflict_nregs
583 - hard_regno_nregs (conflict_hr,
584 PSEUDO_REGNO_MODE (conflict_regno)));
9eb7045b
VM
585 add_to_hard_reg_set (&conflict_set,
586 biggest_conflict_mode,
587 conflict_hr
588 - (WORDS_BIG_ENDIAN ? nregs_diff : 0));
589 if (hard_reg_set_subset_p (reg_class_contents[rclass],
590 conflict_set))
591 return -1;
592 }
593 }
55a2c322
VM
594 EXECUTE_IF_SET_IN_SPARSESET (conflict_reload_and_inheritance_pseudos,
595 conflict_regno)
d70a81dd 596 if (!lra_reg_val_equal_p (conflict_regno, val, offset))
55a2c322
VM
597 {
598 lra_assert (live_pseudos_reg_renumber[conflict_regno] < 0);
599 if ((hard_regno
600 = lra_reg_info[conflict_regno].preferred_hard_regno1) >= 0)
601 {
602 adjust_hard_regno_cost
603 (hard_regno,
604 lra_reg_info[conflict_regno].preferred_hard_regno_profit1);
605 if ((hard_regno
606 = lra_reg_info[conflict_regno].preferred_hard_regno2) >= 0)
607 adjust_hard_regno_cost
608 (hard_regno,
609 lra_reg_info[conflict_regno].preferred_hard_regno_profit2);
610 }
611 }
612 /* Make sure that all registers in a multi-word pseudo belong to the
613 required class. */
614 IOR_COMPL_HARD_REG_SET (conflict_set, reg_class_contents[rclass]);
615 lra_assert (rclass != NO_REGS);
616 rclass_size = ira_class_hard_regs_num[rclass];
617 best_hard_regno = -1;
618 hard_regno = ira_class_hard_regs[rclass][0];
ad474626 619 biggest_nregs = hard_regno_nregs (hard_regno, biggest_mode);
55a2c322 620 nregs_diff = (biggest_nregs
ad474626 621 - hard_regno_nregs (hard_regno, PSEUDO_REGNO_MODE (regno)));
d15e5131 622 available_regs = reg_class_contents[rclass] & ~lra_no_alloc_regs;
55a2c322
VM
623 for (i = 0; i < rclass_size; i++)
624 {
625 if (try_only_hard_regno >= 0)
626 hard_regno = try_only_hard_regno;
627 else
628 hard_regno = ira_class_hard_regs[rclass][i];
629 if (! overlaps_hard_reg_set_p (conflict_set,
630 PSEUDO_REGNO_MODE (regno), hard_regno)
f939c3e6
RS
631 && targetm.hard_regno_mode_ok (hard_regno,
632 PSEUDO_REGNO_MODE (regno))
67914693 633 /* We cannot use prohibited_class_mode_regs for all classes
7e964f49
VM
634 because it is not defined for all classes. */
635 && (ira_allocno_class_translate[rclass] != rclass
636 || ! TEST_HARD_REG_BIT (ira_prohibited_class_mode_regs
637 [rclass][PSEUDO_REGNO_MODE (regno)],
638 hard_regno))
55a2c322
VM
639 && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
640 && (nregs_diff == 0
a1b46e46
JR
641 || (WORDS_BIG_ENDIAN
642 ? (hard_regno - nregs_diff >= 0
a4971e68 643 && TEST_HARD_REG_BIT (available_regs,
a1b46e46 644 hard_regno - nregs_diff))
a4971e68 645 : TEST_HARD_REG_BIT (available_regs,
a1b46e46 646 hard_regno + nregs_diff))))
55a2c322
VM
647 {
648 if (hard_regno_costs_check[hard_regno]
649 != curr_hard_regno_costs_check)
650 {
651 hard_regno_costs_check[hard_regno] = curr_hard_regno_costs_check;
652 hard_regno_costs[hard_regno] = 0;
653 }
654 for (j = 0;
ad474626 655 j < hard_regno_nregs (hard_regno, PSEUDO_REGNO_MODE (regno));
55a2c322
VM
656 j++)
657 if (! TEST_HARD_REG_BIT (call_used_reg_set, hard_regno + j)
658 && ! df_regs_ever_live_p (hard_regno + j))
659 /* It needs save restore. */
660 hard_regno_costs[hard_regno]
fef37404
VM
661 += (2
662 * REG_FREQ_FROM_BB (ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
663 + 1);
55a2c322
VM
664 priority = targetm.register_priority (hard_regno);
665 if (best_hard_regno < 0 || hard_regno_costs[hard_regno] < best_cost
666 || (hard_regno_costs[hard_regno] == best_cost
667 && (priority > best_priority
3b9ceb4b 668 || (targetm.register_usage_leveling_p ()
55a2c322
VM
669 && priority == best_priority
670 && best_usage > lra_hard_reg_usage[hard_regno]))))
671 {
672 best_hard_regno = hard_regno;
673 best_cost = hard_regno_costs[hard_regno];
674 best_priority = priority;
675 best_usage = lra_hard_reg_usage[hard_regno];
676 }
677 }
9e038952 678 if (try_only_hard_regno >= 0 || (first_p && best_hard_regno >= 0))
55a2c322
VM
679 break;
680 }
681 if (best_hard_regno >= 0)
682 *cost = best_cost - lra_reg_info[regno].freq;
683 return best_hard_regno;
684}
685
34349d55
VM
686/* A wrapper for find_hard_regno_for_1 (see comments for that function
687 description). This function tries to find a hard register for
688 preferred class first if it is worth. */
689static int
690find_hard_regno_for (int regno, int *cost, int try_only_hard_regno, bool first_p)
691{
692 int hard_regno;
693 HARD_REG_SET regno_set;
694
695 /* Only original pseudos can have a different preferred class. */
696 if (try_only_hard_regno < 0 && regno < lra_new_regno_start)
697 {
698 enum reg_class pref_class = reg_preferred_class (regno);
699
700 if (regno_allocno_class_array[regno] != pref_class)
701 {
702 hard_regno = find_hard_regno_for_1 (regno, cost, -1, first_p,
703 reg_class_contents[pref_class]);
704 if (hard_regno >= 0)
705 return hard_regno;
706 }
707 }
708 CLEAR_HARD_REG_SET (regno_set);
709 return find_hard_regno_for_1 (regno, cost, try_only_hard_regno, first_p,
710 regno_set);
711}
712
55a2c322
VM
713/* Current value used for checking elements in
714 update_hard_regno_preference_check. */
715static int curr_update_hard_regno_preference_check;
716/* If an element value is equal to the above variable value, then the
717 corresponding regno has been processed for preference
718 propagation. */
719static int *update_hard_regno_preference_check;
720
721/* Update the preference for using HARD_REGNO for pseudos that are
722 connected directly or indirectly with REGNO. Apply divisor DIV
723 to any preference adjustments.
724
725 The more indirectly a pseudo is connected, the smaller its effect
726 should be. We therefore increase DIV on each "hop". */
727static void
728update_hard_regno_preference (int regno, int hard_regno, int div)
729{
730 int another_regno, cost;
731 lra_copy_t cp, next_cp;
732
733 /* Search depth 5 seems to be enough. */
734 if (div > (1 << 5))
735 return;
736 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
737 {
738 if (cp->regno1 == regno)
739 {
740 next_cp = cp->regno1_next;
741 another_regno = cp->regno2;
742 }
743 else if (cp->regno2 == regno)
744 {
745 next_cp = cp->regno2_next;
746 another_regno = cp->regno1;
747 }
748 else
749 gcc_unreachable ();
750 if (reg_renumber[another_regno] < 0
751 && (update_hard_regno_preference_check[another_regno]
752 != curr_update_hard_regno_preference_check))
753 {
754 update_hard_regno_preference_check[another_regno]
755 = curr_update_hard_regno_preference_check;
756 cost = cp->freq < div ? 1 : cp->freq / div;
757 lra_setup_reload_pseudo_preferenced_hard_reg
758 (another_regno, hard_regno, cost);
759 update_hard_regno_preference (another_regno, hard_regno, div * 2);
760 }
761 }
762}
763
2b778c9d
VM
764/* Return prefix title for pseudo REGNO. */
765static const char *
766pseudo_prefix_title (int regno)
767{
768 return
769 (regno < lra_constraint_new_regno_start ? ""
770 : bitmap_bit_p (&lra_inheritance_pseudos, regno) ? "inheritance "
771 : bitmap_bit_p (&lra_split_regs, regno) ? "split "
772 : bitmap_bit_p (&lra_optional_reload_pseudos, regno) ? "optional reload "
773 : bitmap_bit_p (&lra_subreg_reload_pseudos, regno) ? "subreg reload "
774 : "reload ");
775}
776
55a2c322
VM
777/* Update REG_RENUMBER and other pseudo preferences by assignment of
778 HARD_REGNO to pseudo REGNO and print about it if PRINT_P. */
779void
780lra_setup_reg_renumber (int regno, int hard_regno, bool print_p)
781{
782 int i, hr;
783
67914693 784 /* We cannot just reassign hard register. */
55a2c322
VM
785 lra_assert (hard_regno < 0 || reg_renumber[regno] < 0);
786 if ((hr = hard_regno) < 0)
787 hr = reg_renumber[regno];
788 reg_renumber[regno] = hard_regno;
789 lra_assert (hr >= 0);
ad474626 790 for (i = 0; i < hard_regno_nregs (hr, PSEUDO_REGNO_MODE (regno)); i++)
55a2c322
VM
791 if (hard_regno < 0)
792 lra_hard_reg_usage[hr + i] -= lra_reg_info[regno].freq;
793 else
794 lra_hard_reg_usage[hr + i] += lra_reg_info[regno].freq;
795 if (print_p && lra_dump_file != NULL)
796 fprintf (lra_dump_file, " Assign %d to %sr%d (freq=%d)\n",
2b778c9d 797 reg_renumber[regno], pseudo_prefix_title (regno),
55a2c322
VM
798 regno, lra_reg_info[regno].freq);
799 if (hard_regno >= 0)
800 {
801 curr_update_hard_regno_preference_check++;
802 update_hard_regno_preference (regno, hard_regno, 1);
803 }
804}
805
806/* Pseudos which occur in insns containing a particular pseudo. */
807static bitmap_head insn_conflict_pseudos;
808
809/* Bitmaps used to contain spill pseudos for given pseudo hard regno
810 and best spill pseudos for given pseudo (and best hard regno). */
811static bitmap_head spill_pseudos_bitmap, best_spill_pseudos_bitmap;
812
813/* Current pseudo check for validity of elements in
814 TRY_HARD_REG_PSEUDOS. */
815static int curr_pseudo_check;
816/* Array used for validity of elements in TRY_HARD_REG_PSEUDOS. */
817static int try_hard_reg_pseudos_check[FIRST_PSEUDO_REGISTER];
818/* Pseudos who hold given hard register at the considered points. */
819static bitmap_head try_hard_reg_pseudos[FIRST_PSEUDO_REGISTER];
820
821/* Set up try_hard_reg_pseudos for given program point P and class
822 RCLASS. Those are pseudos living at P and assigned to a hard
823 register of RCLASS. In other words, those are pseudos which can be
824 spilled to assign a hard register of RCLASS to a pseudo living at
825 P. */
826static void
827setup_try_hard_regno_pseudos (int p, enum reg_class rclass)
828{
829 int i, hard_regno;
ef4bddc2 830 machine_mode mode;
55a2c322
VM
831 unsigned int spill_regno;
832 bitmap_iterator bi;
833
834 /* Find what pseudos could be spilled. */
835 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[p], 0, spill_regno, bi)
836 {
837 mode = PSEUDO_REGNO_MODE (spill_regno);
838 hard_regno = live_pseudos_reg_renumber[spill_regno];
839 if (overlaps_hard_reg_set_p (reg_class_contents[rclass],
840 mode, hard_regno))
841 {
ad474626 842 for (i = hard_regno_nregs (hard_regno, mode) - 1; i >= 0; i--)
55a2c322
VM
843 {
844 if (try_hard_reg_pseudos_check[hard_regno + i]
845 != curr_pseudo_check)
846 {
847 try_hard_reg_pseudos_check[hard_regno + i]
848 = curr_pseudo_check;
849 bitmap_clear (&try_hard_reg_pseudos[hard_regno + i]);
850 }
851 bitmap_set_bit (&try_hard_reg_pseudos[hard_regno + i],
852 spill_regno);
853 }
854 }
855 }
856}
857
858/* Assign temporarily HARD_REGNO to pseudo REGNO. Temporary
859 assignment means that we might undo the data change. */
860static void
861assign_temporarily (int regno, int hard_regno)
862{
863 int p;
864 lra_live_range_t r;
865
866 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
867 {
868 for (p = r->start; p <= r->finish; p++)
869 if (hard_regno < 0)
870 bitmap_clear_bit (&live_hard_reg_pseudos[p], regno);
871 else
872 {
873 bitmap_set_bit (&live_hard_reg_pseudos[p], regno);
874 insert_in_live_range_start_chain (regno);
875 }
876 }
877 live_pseudos_reg_renumber[regno] = hard_regno;
878}
879
8f2f6381
BS
880/* Return true iff there is a reason why pseudo SPILL_REGNO should not
881 be spilled. */
882static bool
883must_not_spill_p (unsigned spill_regno)
884{
885 if ((pic_offset_table_rtx != NULL
886 && spill_regno == REGNO (pic_offset_table_rtx))
887 || ((int) spill_regno >= lra_constraint_new_regno_start
888 && ! bitmap_bit_p (&lra_inheritance_pseudos, spill_regno)
889 && ! bitmap_bit_p (&lra_split_regs, spill_regno)
890 && ! bitmap_bit_p (&lra_subreg_reload_pseudos, spill_regno)
891 && ! bitmap_bit_p (&lra_optional_reload_pseudos, spill_regno)))
892 return true;
893 /* A reload pseudo that requires a singleton register class should
894 not be spilled.
895 FIXME: this mitigates the issue on certain i386 patterns, but
896 does not solve the general case where existing reloads fully
897 cover a limited register class. */
898 if (!bitmap_bit_p (&non_reload_pseudos, spill_regno)
5da906ca
BS
899 && reg_class_size [reg_preferred_class (spill_regno)] == 1
900 && reg_alternate_class (spill_regno) == NO_REGS)
8f2f6381
BS
901 return true;
902 return false;
903}
904
55a2c322
VM
905/* Array used for sorting reload pseudos for subsequent allocation
906 after spilling some pseudo. */
907static int *sorted_reload_pseudos;
908
909/* Spill some pseudos for a reload pseudo REGNO and return hard
910 register which should be used for pseudo after spilling. The
911 function adds spilled pseudos to SPILLED_PSEUDO_BITMAP. When we
912 choose hard register (and pseudos occupying the hard registers and
913 to be spilled), we take into account not only how REGNO will
914 benefit from the spills but also how other reload pseudos not yet
915 assigned to hard registers benefit from the spills too. In very
9e038952
VM
916 rare cases, the function can fail and return -1.
917
918 If FIRST_P, return the first available hard reg ignoring other
919 criteria, e.g. allocation cost and cost of spilling non-reload
920 pseudos. This approach results in less hard reg pool fragmentation
921 and permit to allocate hard regs to reload pseudos in complicated
922 situations where pseudo sizes are different. */
55a2c322 923static int
9e038952 924spill_for (int regno, bitmap spilled_pseudo_bitmap, bool first_p)
55a2c322
VM
925{
926 int i, j, n, p, hard_regno, best_hard_regno, cost, best_cost, rclass_size;
927 int reload_hard_regno, reload_cost;
b81a2f0d 928 bool static_p, best_static_p;
ef4bddc2 929 machine_mode mode;
55a2c322 930 enum reg_class rclass;
55a2c322
VM
931 unsigned int spill_regno, reload_regno, uid;
932 int insn_pseudos_num, best_insn_pseudos_num;
8fd827b8 933 int bad_spills_num, smallest_bad_spills_num;
55a2c322
VM
934 lra_live_range_t r;
935 bitmap_iterator bi;
936
937 rclass = regno_allocno_class_array[regno];
938 lra_assert (reg_renumber[regno] < 0 && rclass != NO_REGS);
939 bitmap_clear (&insn_conflict_pseudos);
940 bitmap_clear (&best_spill_pseudos_bitmap);
941 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
942 {
943 struct lra_insn_reg *ir;
f4eafc30 944
55a2c322
VM
945 for (ir = lra_get_insn_regs (uid); ir != NULL; ir = ir->next)
946 if (ir->regno >= FIRST_PSEUDO_REGISTER)
947 bitmap_set_bit (&insn_conflict_pseudos, ir->regno);
948 }
949 best_hard_regno = -1;
950 best_cost = INT_MAX;
b81a2f0d 951 best_static_p = TRUE;
55a2c322 952 best_insn_pseudos_num = INT_MAX;
8fd827b8 953 smallest_bad_spills_num = INT_MAX;
55a2c322
VM
954 rclass_size = ira_class_hard_regs_num[rclass];
955 mode = PSEUDO_REGNO_MODE (regno);
956 /* Invalidate try_hard_reg_pseudos elements. */
957 curr_pseudo_check++;
958 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
959 for (p = r->start; p <= r->finish; p++)
960 setup_try_hard_regno_pseudos (p, rclass);
961 for (i = 0; i < rclass_size; i++)
962 {
963 hard_regno = ira_class_hard_regs[rclass][i];
964 bitmap_clear (&spill_pseudos_bitmap);
ad474626 965 for (j = hard_regno_nregs (hard_regno, mode) - 1; j >= 0; j--)
55a2c322
VM
966 {
967 if (try_hard_reg_pseudos_check[hard_regno + j] != curr_pseudo_check)
968 continue;
969 lra_assert (!bitmap_empty_p (&try_hard_reg_pseudos[hard_regno + j]));
970 bitmap_ior_into (&spill_pseudos_bitmap,
971 &try_hard_reg_pseudos[hard_regno + j]);
972 }
973 /* Spill pseudos. */
b81a2f0d 974 static_p = false;
55a2c322 975 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
8f2f6381 976 if (must_not_spill_p (spill_regno))
55a2c322 977 goto fail;
b81a2f0d
VM
978 else if (non_spilled_static_chain_regno_p (spill_regno))
979 static_p = true;
55a2c322 980 insn_pseudos_num = 0;
8fd827b8 981 bad_spills_num = 0;
55a2c322
VM
982 if (lra_dump_file != NULL)
983 fprintf (lra_dump_file, " Trying %d:", hard_regno);
984 sparseset_clear (live_range_reload_inheritance_pseudos);
985 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
986 {
987 if (bitmap_bit_p (&insn_conflict_pseudos, spill_regno))
988 insn_pseudos_num++;
8fd827b8
VM
989 if (spill_regno >= (unsigned int) lra_bad_spill_regno_start)
990 bad_spills_num++;
55a2c322
VM
991 for (r = lra_reg_info[spill_regno].live_ranges;
992 r != NULL;
993 r = r->next)
994 {
995 for (p = r->start; p <= r->finish; p++)
996 {
997 lra_live_range_t r2;
f4eafc30 998
55a2c322
VM
999 for (r2 = start_point_ranges[p];
1000 r2 != NULL;
1001 r2 = r2->start_next)
1002 if (r2->regno >= lra_constraint_new_regno_start)
1003 sparseset_set_bit (live_range_reload_inheritance_pseudos,
1004 r2->regno);
1005 }
1006 }
1007 }
295d875c 1008 n = 0;
88def637 1009 if (sparseset_cardinality (live_range_reload_inheritance_pseudos)
bb750f4f 1010 <= (unsigned)LRA_MAX_CONSIDERED_RELOAD_PSEUDOS)
88def637
VM
1011 EXECUTE_IF_SET_IN_SPARSESET (live_range_reload_inheritance_pseudos,
1012 reload_regno)
1013 if ((int) reload_regno != regno
1014 && (ira_reg_classes_intersect_p
1015 [rclass][regno_allocno_class_array[reload_regno]])
1016 && live_pseudos_reg_renumber[reload_regno] < 0
9e038952 1017 && find_hard_regno_for (reload_regno, &cost, -1, first_p) < 0)
88def637 1018 sorted_reload_pseudos[n++] = reload_regno;
295d875c
VM
1019 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1020 {
1021 update_lives (spill_regno, true);
1022 if (lra_dump_file != NULL)
1023 fprintf (lra_dump_file, " spill %d(freq=%d)",
1024 spill_regno, lra_reg_info[spill_regno].freq);
1025 }
9e038952 1026 hard_regno = find_hard_regno_for (regno, &cost, -1, first_p);
55a2c322
VM
1027 if (hard_regno >= 0)
1028 {
1029 assign_temporarily (regno, hard_regno);
55a2c322
VM
1030 qsort (sorted_reload_pseudos, n, sizeof (int),
1031 reload_pseudo_compare_func);
1032 for (j = 0; j < n; j++)
1033 {
1034 reload_regno = sorted_reload_pseudos[j];
1035 lra_assert (live_pseudos_reg_renumber[reload_regno] < 0);
1036 if ((reload_hard_regno
1037 = find_hard_regno_for (reload_regno,
9e038952 1038 &reload_cost, -1, first_p)) >= 0)
55a2c322
VM
1039 {
1040 if (lra_dump_file != NULL)
1041 fprintf (lra_dump_file, " assign %d(cost=%d)",
1042 reload_regno, reload_cost);
1043 assign_temporarily (reload_regno, reload_hard_regno);
1044 cost += reload_cost;
1045 }
1046 }
1047 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1048 {
0cc97fc5 1049 rtx_insn_list *x;
f4eafc30 1050
55a2c322
VM
1051 cost += lra_reg_info[spill_regno].freq;
1052 if (ira_reg_equiv[spill_regno].memory != NULL
1053 || ira_reg_equiv[spill_regno].constant != NULL)
1054 for (x = ira_reg_equiv[spill_regno].init_insns;
1055 x != NULL;
0cc97fc5
DM
1056 x = x->next ())
1057 cost -= REG_FREQ_FROM_BB (BLOCK_FOR_INSN (x->insn ()));
55a2c322 1058 }
b81a2f0d
VM
1059 /* Avoid spilling static chain pointer pseudo when non-local
1060 goto is used. */
1061 if ((! static_p && best_static_p)
1062 || (static_p == best_static_p
1063 && (best_insn_pseudos_num > insn_pseudos_num
1064 || (best_insn_pseudos_num == insn_pseudos_num
1065 && (bad_spills_num < smallest_bad_spills_num
1066 || (bad_spills_num == smallest_bad_spills_num
1067 && best_cost > cost))))))
55a2c322
VM
1068 {
1069 best_insn_pseudos_num = insn_pseudos_num;
54e915b3 1070 smallest_bad_spills_num = bad_spills_num;
b81a2f0d 1071 best_static_p = static_p;
55a2c322
VM
1072 best_cost = cost;
1073 best_hard_regno = hard_regno;
1074 bitmap_copy (&best_spill_pseudos_bitmap, &spill_pseudos_bitmap);
1075 if (lra_dump_file != NULL)
54e915b3
VM
1076 fprintf (lra_dump_file,
1077 " Now best %d(cost=%d, bad_spills=%d, insn_pseudos=%d)\n",
1078 hard_regno, cost, bad_spills_num, insn_pseudos_num);
55a2c322
VM
1079 }
1080 assign_temporarily (regno, -1);
1081 for (j = 0; j < n; j++)
1082 {
1083 reload_regno = sorted_reload_pseudos[j];
1084 if (live_pseudos_reg_renumber[reload_regno] >= 0)
1085 assign_temporarily (reload_regno, -1);
1086 }
1087 }
1088 if (lra_dump_file != NULL)
1089 fprintf (lra_dump_file, "\n");
1090 /* Restore the live hard reg pseudo info for spilled pseudos. */
1091 EXECUTE_IF_SET_IN_BITMAP (&spill_pseudos_bitmap, 0, spill_regno, bi)
1092 update_lives (spill_regno, false);
1093 fail:
1094 ;
1095 }
1096 /* Spill: */
1097 EXECUTE_IF_SET_IN_BITMAP (&best_spill_pseudos_bitmap, 0, spill_regno, bi)
1098 {
f54437d5
VM
1099 if ((int) spill_regno >= lra_constraint_new_regno_start)
1100 former_reload_pseudo_spill_p = true;
55a2c322
VM
1101 if (lra_dump_file != NULL)
1102 fprintf (lra_dump_file, " Spill %sr%d(hr=%d, freq=%d) for r%d\n",
2b778c9d 1103 pseudo_prefix_title (spill_regno),
55a2c322
VM
1104 spill_regno, reg_renumber[spill_regno],
1105 lra_reg_info[spill_regno].freq, regno);
1106 update_lives (spill_regno, true);
1107 lra_setup_reg_renumber (spill_regno, -1, false);
1108 }
1109 bitmap_ior_into (spilled_pseudo_bitmap, &best_spill_pseudos_bitmap);
1110 return best_hard_regno;
1111}
1112
1113/* Assign HARD_REGNO to REGNO. */
1114static void
1115assign_hard_regno (int hard_regno, int regno)
1116{
1117 int i;
1118
1119 lra_assert (hard_regno >= 0);
1120 lra_setup_reg_renumber (regno, hard_regno, true);
1121 update_lives (regno, false);
1122 for (i = 0;
ad474626 1123 i < hard_regno_nregs (hard_regno, lra_reg_info[regno].biggest_mode);
55a2c322
VM
1124 i++)
1125 df_set_regs_ever_live (hard_regno + i, true);
1126}
1127
1128/* Array used for sorting different pseudos. */
1129static int *sorted_pseudos;
1130
1131/* The constraints pass is allowed to create equivalences between
1132 pseudos that make the current allocation "incorrect" (in the sense
1133 that pseudos are assigned to hard registers from their own conflict
1134 sets). The global variable lra_risky_transformations_p says
1135 whether this might have happened.
1136
1137 Process pseudos assigned to hard registers (less frequently used
1138 first), spill if a conflict is found, and mark the spilled pseudos
1139 in SPILLED_PSEUDO_BITMAP. Set up LIVE_HARD_REG_PSEUDOS from
1140 pseudos, assigned to hard registers. */
1141static void
1142setup_live_pseudos_and_spill_after_risky_transforms (bitmap
1143 spilled_pseudo_bitmap)
1144{
7e4d17a8 1145 int p, i, j, n, regno, hard_regno, biggest_nregs, nregs_diff;
55a2c322 1146 unsigned int k, conflict_regno;
73ca989c
RS
1147 poly_int64 offset;
1148 int val;
55a2c322 1149 HARD_REG_SET conflict_set;
7e4d17a8 1150 machine_mode mode, biggest_mode;
55a2c322
VM
1151 lra_live_range_t r;
1152 bitmap_iterator bi;
1153 int max_regno = max_reg_num ();
1154
1155 if (! lra_risky_transformations_p)
1156 {
1157 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1158 if (reg_renumber[i] >= 0 && lra_reg_info[i].nrefs > 0)
1159 update_lives (i, false);
1160 return;
1161 }
1162 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
bcb21886
KY
1163 if ((pic_offset_table_rtx == NULL_RTX
1164 || i != (int) REGNO (pic_offset_table_rtx))
7e4d17a8
VM
1165 && (hard_regno = reg_renumber[i]) >= 0 && lra_reg_info[i].nrefs > 0)
1166 {
1167 biggest_mode = lra_reg_info[i].biggest_mode;
1168 biggest_nregs = hard_regno_nregs (hard_regno, biggest_mode);
1169 nregs_diff = (biggest_nregs
1170 - hard_regno_nregs (hard_regno, PSEUDO_REGNO_MODE (i)));
1171 enum reg_class rclass = lra_get_allocno_class (i);
1172
4321da7b
VM
1173 if ((WORDS_BIG_ENDIAN
1174 && (hard_regno - nregs_diff < 0
1175 || !TEST_HARD_REG_BIT (reg_class_contents[rclass],
1176 hard_regno - nregs_diff)))
1177 || (!WORDS_BIG_ENDIAN
1178 && (hard_regno + nregs_diff >= FIRST_PSEUDO_REGISTER
1179 || !TEST_HARD_REG_BIT (reg_class_contents[rclass],
1180 hard_regno + nregs_diff))))
7e4d17a8
VM
1181 {
1182 /* Hard registers of paradoxical sub-registers are out of
1183 range of pseudo register class. Spill the pseudo. */
1184 reg_renumber[i] = -1;
1185 continue;
1186 }
1187 sorted_pseudos[n++] = i;
1188 }
55a2c322 1189 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
bcb21886
KY
1190 if (pic_offset_table_rtx != NULL_RTX
1191 && (regno = REGNO (pic_offset_table_rtx)) >= FIRST_PSEUDO_REGISTER
1192 && reg_renumber[regno] >= 0 && lra_reg_info[regno].nrefs > 0)
1193 sorted_pseudos[n++] = regno;
55a2c322
VM
1194 for (i = n - 1; i >= 0; i--)
1195 {
1196 regno = sorted_pseudos[i];
1197 hard_regno = reg_renumber[regno];
1198 lra_assert (hard_regno >= 0);
1199 mode = lra_reg_info[regno].biggest_mode;
1200 sparseset_clear (live_range_hard_reg_pseudos);
1201 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1202 {
1203 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1204 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1205 for (p = r->start + 1; p <= r->finish; p++)
1206 {
1207 lra_live_range_t r2;
f4eafc30 1208
55a2c322
VM
1209 for (r2 = start_point_ranges[p];
1210 r2 != NULL;
1211 r2 = r2->start_next)
1212 if (live_pseudos_reg_renumber[r2->regno] >= 0)
1213 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1214 }
1215 }
6576d245 1216 conflict_set = lra_no_alloc_regs;
44942965 1217 conflict_set |= lra_reg_info[regno].conflict_hard_regs;
55a2c322 1218 val = lra_reg_info[regno].val;
d70a81dd 1219 offset = lra_reg_info[regno].offset;
55a2c322 1220 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
d70a81dd 1221 if (!lra_reg_val_equal_p (conflict_regno, val, offset)
55a2c322
VM
1222 /* If it is multi-register pseudos they should start on
1223 the same hard register. */
1224 || hard_regno != reg_renumber[conflict_regno])
15961e4a
VM
1225 {
1226 int conflict_hard_regno = reg_renumber[conflict_regno];
7e4d17a8
VM
1227
1228 biggest_mode = lra_reg_info[conflict_regno].biggest_mode;
1229 biggest_nregs = hard_regno_nregs (conflict_hard_regno,
1230 biggest_mode);
1231 nregs_diff
ad474626
RS
1232 = (biggest_nregs
1233 - hard_regno_nregs (conflict_hard_regno,
1234 PSEUDO_REGNO_MODE (conflict_regno)));
15961e4a
VM
1235 add_to_hard_reg_set (&conflict_set,
1236 biggest_mode,
1237 conflict_hard_regno
1238 - (WORDS_BIG_ENDIAN ? nregs_diff : 0));
1239 }
55a2c322
VM
1240 if (! overlaps_hard_reg_set_p (conflict_set, mode, hard_regno))
1241 {
1242 update_lives (regno, false);
1243 continue;
1244 }
1245 bitmap_set_bit (spilled_pseudo_bitmap, regno);
1246 for (j = 0;
ad474626 1247 j < hard_regno_nregs (hard_regno, PSEUDO_REGNO_MODE (regno));
55a2c322
VM
1248 j++)
1249 lra_hard_reg_usage[hard_regno + j] -= lra_reg_info[regno].freq;
1250 reg_renumber[regno] = -1;
f54437d5
VM
1251 if (regno >= lra_constraint_new_regno_start)
1252 former_reload_pseudo_spill_p = true;
55a2c322
VM
1253 if (lra_dump_file != NULL)
1254 fprintf (lra_dump_file, " Spill r%d after risky transformations\n",
1255 regno);
1256 }
1257}
1258
1259/* Improve allocation by assigning the same hard regno of inheritance
1260 pseudos to the connected pseudos. We need this because inheritance
1261 pseudos are allocated after reload pseudos in the thread and when
1262 we assign a hard register to a reload pseudo we don't know yet that
1263 the connected inheritance pseudos can get the same hard register.
1264 Add pseudos with changed allocation to bitmap CHANGED_PSEUDOS. */
1265static void
1266improve_inheritance (bitmap changed_pseudos)
1267{
1268 unsigned int k;
1269 int regno, another_regno, hard_regno, another_hard_regno, cost, i, n;
1270 lra_copy_t cp, next_cp;
1271 bitmap_iterator bi;
1272
8e3a4869
VM
1273 if (lra_inheritance_iter > LRA_MAX_INHERITANCE_PASSES)
1274 return;
55a2c322
VM
1275 n = 0;
1276 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, k, bi)
1277 if (reg_renumber[k] >= 0 && lra_reg_info[k].nrefs != 0)
1278 sorted_pseudos[n++] = k;
1279 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1280 for (i = 0; i < n; i++)
1281 {
1282 regno = sorted_pseudos[i];
1283 hard_regno = reg_renumber[regno];
1284 lra_assert (hard_regno >= 0);
1285 for (cp = lra_reg_info[regno].copies; cp != NULL; cp = next_cp)
1286 {
1287 if (cp->regno1 == regno)
1288 {
1289 next_cp = cp->regno1_next;
1290 another_regno = cp->regno2;
1291 }
1292 else if (cp->regno2 == regno)
1293 {
1294 next_cp = cp->regno2_next;
1295 another_regno = cp->regno1;
1296 }
1297 else
1298 gcc_unreachable ();
1299 /* Don't change reload pseudo allocation. It might have
1300 this allocation for a purpose and changing it can result
1301 in LRA cycling. */
1302 if ((another_regno < lra_constraint_new_regno_start
1303 || bitmap_bit_p (&lra_inheritance_pseudos, another_regno))
1304 && (another_hard_regno = reg_renumber[another_regno]) >= 0
1305 && another_hard_regno != hard_regno)
1306 {
1307 if (lra_dump_file != NULL)
1308 fprintf
1309 (lra_dump_file,
1310 " Improving inheritance for %d(%d) and %d(%d)...\n",
1311 regno, hard_regno, another_regno, another_hard_regno);
1312 update_lives (another_regno, true);
1313 lra_setup_reg_renumber (another_regno, -1, false);
9e038952
VM
1314 if (hard_regno == find_hard_regno_for (another_regno, &cost,
1315 hard_regno, false))
55a2c322
VM
1316 assign_hard_regno (hard_regno, another_regno);
1317 else
1318 assign_hard_regno (another_hard_regno, another_regno);
1319 bitmap_set_bit (changed_pseudos, another_regno);
1320 }
1321 }
1322 }
1323}
1324
1325
1326/* Bitmap finally containing all pseudos spilled on this assignment
1327 pass. */
1328static bitmap_head all_spilled_pseudos;
1329/* All pseudos whose allocation was changed. */
1330static bitmap_head changed_pseudo_bitmap;
1331
9e038952
VM
1332
1333/* Add to LIVE_RANGE_HARD_REG_PSEUDOS all pseudos conflicting with
1334 REGNO and whose hard regs can be assigned to REGNO. */
1335static void
1336find_all_spills_for (int regno)
1337{
1338 int p;
1339 lra_live_range_t r;
1340 unsigned int k;
1341 bitmap_iterator bi;
1342 enum reg_class rclass;
1343 bool *rclass_intersect_p;
1344
1345 rclass = regno_allocno_class_array[regno];
1346 rclass_intersect_p = ira_reg_classes_intersect_p[rclass];
1347 for (r = lra_reg_info[regno].live_ranges; r != NULL; r = r->next)
1348 {
1349 EXECUTE_IF_SET_IN_BITMAP (&live_hard_reg_pseudos[r->start], 0, k, bi)
1350 if (rclass_intersect_p[regno_allocno_class_array[k]])
1351 sparseset_set_bit (live_range_hard_reg_pseudos, k);
1352 for (p = r->start + 1; p <= r->finish; p++)
1353 {
1354 lra_live_range_t r2;
1355
1356 for (r2 = start_point_ranges[p];
1357 r2 != NULL;
1358 r2 = r2->start_next)
1359 {
1360 if (live_pseudos_reg_renumber[r2->regno] >= 0
6027ea4c
VM
1361 && ! sparseset_bit_p (live_range_hard_reg_pseudos, r2->regno)
1362 && rclass_intersect_p[regno_allocno_class_array[r2->regno]]
1363 && ((int) r2->regno < lra_constraint_new_regno_start
1364 || bitmap_bit_p (&lra_inheritance_pseudos, r2->regno)
1365 || bitmap_bit_p (&lra_split_regs, r2->regno)
1366 || bitmap_bit_p (&lra_optional_reload_pseudos, r2->regno)
1367 /* There is no sense to consider another reload
1368 pseudo if it has the same class. */
1369 || regno_allocno_class_array[r2->regno] != rclass))
9e038952
VM
1370 sparseset_set_bit (live_range_hard_reg_pseudos, r2->regno);
1371 }
1372 }
1373 }
1374}
1375
6027ea4c
VM
1376/* Assign hard registers to reload pseudos and other pseudos. Return
1377 true if we was not able to assign hard registers to all reload
1378 pseudos. */
1379static bool
55a2c322
VM
1380assign_by_spills (void)
1381{
6027ea4c 1382 int i, n, nfails, iter, regno, regno2, hard_regno, cost;
8a8330b7 1383 rtx restore_rtx;
55a2c322 1384 bitmap_head changed_insns, do_not_assign_nonreload_pseudos;
9e038952 1385 unsigned int u, conflict_regno;
55a2c322 1386 bitmap_iterator bi;
6027ea4c 1387 bool reload_p, fails_p = false;
55a2c322
VM
1388 int max_regno = max_reg_num ();
1389
1390 for (n = 0, i = lra_constraint_new_regno_start; i < max_regno; i++)
1391 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1392 && regno_allocno_class_array[i] != NO_REGS)
1393 sorted_pseudos[n++] = i;
1394 bitmap_initialize (&insn_conflict_pseudos, &reg_obstack);
1395 bitmap_initialize (&spill_pseudos_bitmap, &reg_obstack);
1396 bitmap_initialize (&best_spill_pseudos_bitmap, &reg_obstack);
1397 update_hard_regno_preference_check = XCNEWVEC (int, max_regno);
1398 curr_update_hard_regno_preference_check = 0;
1399 memset (try_hard_reg_pseudos_check, 0, sizeof (try_hard_reg_pseudos_check));
1400 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1401 bitmap_initialize (&try_hard_reg_pseudos[i], &reg_obstack);
1402 curr_pseudo_check = 0;
1403 bitmap_initialize (&changed_insns, &reg_obstack);
1404 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1405 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
2b778c9d 1406 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
55a2c322
VM
1407 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
1408 for (iter = 0; iter <= 1; iter++)
1409 {
1410 qsort (sorted_pseudos, n, sizeof (int), reload_pseudo_compare_func);
1411 nfails = 0;
1412 for (i = 0; i < n; i++)
1413 {
1414 regno = sorted_pseudos[i];
8a8330b7
VM
1415 if (reg_renumber[regno] >= 0)
1416 continue;
55a2c322
VM
1417 if (lra_dump_file != NULL)
1418 fprintf (lra_dump_file, " Assigning to %d "
1419 "(cl=%s, orig=%d, freq=%d, tfirst=%d, tfreq=%d)...\n",
1420 regno, reg_class_names[regno_allocno_class_array[regno]],
1421 ORIGINAL_REGNO (regno_reg_rtx[regno]),
1422 lra_reg_info[regno].freq, regno_assign_info[regno].first,
1423 regno_assign_info[regno_assign_info[regno].first].freq);
9e038952 1424 hard_regno = find_hard_regno_for (regno, &cost, -1, iter == 1);
992ca0f0
VM
1425 reload_p = ! bitmap_bit_p (&non_reload_pseudos, regno);
1426 if (hard_regno < 0 && reload_p)
9e038952 1427 hard_regno = spill_for (regno, &all_spilled_pseudos, iter == 1);
55a2c322
VM
1428 if (hard_regno < 0)
1429 {
6027ea4c
VM
1430 if (reload_p) {
1431 /* Put unassigned reload pseudo first in the
1432 array. */
1433 regno2 = sorted_pseudos[nfails];
55a2c322 1434 sorted_pseudos[nfails++] = regno;
6027ea4c
VM
1435 sorted_pseudos[i] = regno2;
1436 }
55a2c322
VM
1437 }
1438 else
1439 {
1440 /* This register might have been spilled by the previous
1441 pass. Indicate that it is no longer spilled. */
1442 bitmap_clear_bit (&all_spilled_pseudos, regno);
1443 assign_hard_regno (hard_regno, regno);
992ca0f0
VM
1444 if (! reload_p)
1445 /* As non-reload pseudo assignment is changed we
1446 should reconsider insns referring for the
1447 pseudo. */
1448 bitmap_set_bit (&changed_pseudo_bitmap, regno);
55a2c322
VM
1449 }
1450 }
6027ea4c 1451 if (nfails == 0 || iter > 0)
ce940020 1452 {
6027ea4c 1453 fails_p = nfails != 0;
ce940020
VM
1454 break;
1455 }
67914693 1456 /* This is a very rare event. We cannot assign a hard register
9e038952
VM
1457 to reload pseudo because the hard register was assigned to
1458 another reload pseudo on a previous assignment pass. For x86
1459 example, on the 1st pass we assigned CX (although another
1460 hard register could be used for this) to reload pseudo in an
1461 insn, on the 2nd pass we need CX (and only this) hard
1462 register for a new reload pseudo in the same insn. Another
1463 possible situation may occur in assigning to multi-regs
1464 reload pseudos when hard regs pool is too fragmented even
1465 after spilling non-reload pseudos.
1466
1467 We should do something radical here to succeed. Here we
1468 spill *all* conflicting pseudos and reassign them. */
55a2c322
VM
1469 if (lra_dump_file != NULL)
1470 fprintf (lra_dump_file, " 2nd iter for reload pseudo assignments:\n");
9e038952 1471 sparseset_clear (live_range_hard_reg_pseudos);
55a2c322
VM
1472 for (i = 0; i < nfails; i++)
1473 {
1474 if (lra_dump_file != NULL)
1475 fprintf (lra_dump_file, " Reload r%d assignment failure\n",
1476 sorted_pseudos[i]);
9e038952
VM
1477 find_all_spills_for (sorted_pseudos[i]);
1478 }
1479 EXECUTE_IF_SET_IN_SPARSESET (live_range_hard_reg_pseudos, conflict_regno)
1480 {
1481 if ((int) conflict_regno >= lra_constraint_new_regno_start)
f54437d5
VM
1482 {
1483 sorted_pseudos[nfails++] = conflict_regno;
1484 former_reload_pseudo_spill_p = true;
1485 }
fdcfea63
VM
1486 else
1487 /* It is better to do reloads before spilling as after the
1488 spill-subpass we will reload memory instead of pseudos
1489 and this will make reusing reload pseudos more
1490 complicated. Going directly to the spill pass in such
1491 case might result in worse code performance or even LRA
1492 cycling if we have few registers. */
1493 bitmap_set_bit (&all_spilled_pseudos, conflict_regno);
9e038952
VM
1494 if (lra_dump_file != NULL)
1495 fprintf (lra_dump_file, " Spill %s r%d(hr=%d, freq=%d)\n",
1496 pseudo_prefix_title (conflict_regno), conflict_regno,
1497 reg_renumber[conflict_regno],
1498 lra_reg_info[conflict_regno].freq);
1499 update_lives (conflict_regno, true);
1500 lra_setup_reg_renumber (conflict_regno, -1, false);
55a2c322 1501 }
6027ea4c
VM
1502 if (n < nfails)
1503 n = nfails;
55a2c322
VM
1504 }
1505 improve_inheritance (&changed_pseudo_bitmap);
1506 bitmap_clear (&non_reload_pseudos);
1507 bitmap_clear (&changed_insns);
1508 if (! lra_simple_p)
1509 {
1510 /* We should not assign to original pseudos of inheritance
1511 pseudos or split pseudos if any its inheritance pseudo did
1512 not get hard register or any its split pseudo was not split
1513 because undo inheritance/split pass will extend live range of
1514 such inheritance or split pseudos. */
1515 bitmap_initialize (&do_not_assign_nonreload_pseudos, &reg_obstack);
1516 EXECUTE_IF_SET_IN_BITMAP (&lra_inheritance_pseudos, 0, u, bi)
8a8330b7
VM
1517 if ((restore_rtx = lra_reg_info[u].restore_rtx) != NULL_RTX
1518 && REG_P (restore_rtx)
55a2c322
VM
1519 && reg_renumber[u] < 0
1520 && bitmap_bit_p (&lra_inheritance_pseudos, u))
8a8330b7 1521 bitmap_set_bit (&do_not_assign_nonreload_pseudos, REGNO (restore_rtx));
55a2c322 1522 EXECUTE_IF_SET_IN_BITMAP (&lra_split_regs, 0, u, bi)
8a8330b7 1523 if ((restore_rtx = lra_reg_info[u].restore_rtx) != NULL_RTX
55a2c322 1524 && reg_renumber[u] >= 0)
8a8330b7
VM
1525 {
1526 lra_assert (REG_P (restore_rtx));
1527 bitmap_set_bit (&do_not_assign_nonreload_pseudos, REGNO (restore_rtx));
1528 }
55a2c322
VM
1529 for (n = 0, i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1530 if (((i < lra_constraint_new_regno_start
1531 && ! bitmap_bit_p (&do_not_assign_nonreload_pseudos, i))
1532 || (bitmap_bit_p (&lra_inheritance_pseudos, i)
8a8330b7 1533 && lra_reg_info[i].restore_rtx != NULL_RTX)
55a2c322 1534 || (bitmap_bit_p (&lra_split_regs, i)
8a8330b7 1535 && lra_reg_info[i].restore_rtx != NULL_RTX)
2b778c9d 1536 || bitmap_bit_p (&lra_subreg_reload_pseudos, i)
55a2c322
VM
1537 || bitmap_bit_p (&lra_optional_reload_pseudos, i))
1538 && reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
1539 && regno_allocno_class_array[i] != NO_REGS)
1540 sorted_pseudos[n++] = i;
1541 bitmap_clear (&do_not_assign_nonreload_pseudos);
1542 if (n != 0 && lra_dump_file != NULL)
1543 fprintf (lra_dump_file, " Reassigning non-reload pseudos\n");
1544 qsort (sorted_pseudos, n, sizeof (int), pseudo_compare_func);
1545 for (i = 0; i < n; i++)
1546 {
1547 regno = sorted_pseudos[i];
9e038952 1548 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
55a2c322
VM
1549 if (hard_regno >= 0)
1550 {
1551 assign_hard_regno (hard_regno, regno);
992ca0f0
VM
1552 /* We change allocation for non-reload pseudo on this
1553 iteration -- mark the pseudo for invalidation of used
1554 alternatives of insns containing the pseudo. */
55a2c322
VM
1555 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1556 }
9afb455c
VM
1557 else
1558 {
1559 enum reg_class rclass = lra_get_allocno_class (regno);
1560 enum reg_class spill_class;
1561
1df2287f 1562 if (targetm.spill_class == NULL
8a8330b7 1563 || lra_reg_info[regno].restore_rtx == NULL_RTX
9afb455c
VM
1564 || ! bitmap_bit_p (&lra_inheritance_pseudos, regno)
1565 || (spill_class
1566 = ((enum reg_class)
1567 targetm.spill_class
1568 ((reg_class_t) rclass,
1569 PSEUDO_REGNO_MODE (regno)))) == NO_REGS)
1570 continue;
1571 regno_allocno_class_array[regno] = spill_class;
1572 hard_regno = find_hard_regno_for (regno, &cost, -1, false);
1573 if (hard_regno < 0)
1574 regno_allocno_class_array[regno] = rclass;
1575 else
1576 {
1577 setup_reg_classes
1578 (regno, spill_class, spill_class, spill_class);
1579 assign_hard_regno (hard_regno, regno);
1580 bitmap_set_bit (&changed_pseudo_bitmap, regno);
1581 }
1582 }
55a2c322
VM
1583 }
1584 }
1585 free (update_hard_regno_preference_check);
1586 bitmap_clear (&best_spill_pseudos_bitmap);
1587 bitmap_clear (&spill_pseudos_bitmap);
1588 bitmap_clear (&insn_conflict_pseudos);
6027ea4c 1589 return fails_p;
55a2c322
VM
1590}
1591
55a2c322
VM
1592/* Entry function to assign hard registers to new reload pseudos
1593 starting with LRA_CONSTRAINT_NEW_REGNO_START (by possible spilling
1594 of old pseudos) and possibly to the old pseudos. The function adds
1595 what insns to process for the next constraint pass. Those are all
1596 insns who contains non-reload and non-inheritance pseudos with
1597 changed allocation.
1598
1599 Return true if we did not spill any non-reload and non-inheritance
6027ea4c
VM
1600 pseudos. Set up FAILS_P if we failed to assign hard registers to
1601 all reload pseudos. */
55a2c322 1602bool
6027ea4c 1603lra_assign (bool &fails_p)
55a2c322
VM
1604{
1605 int i;
1606 unsigned int u;
1607 bitmap_iterator bi;
1608 bitmap_head insns_to_process;
1609 bool no_spills_p;
1610 int max_regno = max_reg_num ();
1611
1612 timevar_push (TV_LRA_ASSIGN);
f54437d5
VM
1613 lra_assignment_iter++;
1614 if (lra_dump_file != NULL)
1615 fprintf (lra_dump_file, "\n********** Assignment #%d: **********\n\n",
1616 lra_assignment_iter);
55a2c322
VM
1617 init_lives ();
1618 sorted_pseudos = XNEWVEC (int, max_regno);
1619 sorted_reload_pseudos = XNEWVEC (int, max_regno);
1620 regno_allocno_class_array = XNEWVEC (enum reg_class, max_regno);
8a8330b7 1621 regno_live_length = XNEWVEC (int, max_regno);
55a2c322 1622 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
8a8330b7
VM
1623 {
1624 int l;
1625 lra_live_range_t r;
1626
1627 regno_allocno_class_array[i] = lra_get_allocno_class (i);
1628 for (l = 0, r = lra_reg_info[i].live_ranges; r != NULL; r = r->next)
1629 l += r->finish - r->start + 1;
1630 regno_live_length[i] = l;
1631 }
f54437d5 1632 former_reload_pseudo_spill_p = false;
55a2c322
VM
1633 init_regno_assign_info ();
1634 bitmap_initialize (&all_spilled_pseudos, &reg_obstack);
1635 create_live_range_start_chains ();
1636 setup_live_pseudos_and_spill_after_risky_transforms (&all_spilled_pseudos);
11067dee
VM
1637 if (! lra_asm_error_p && flag_checking && !flag_ipa_ra)
1638 /* Check correctness of allocation for call-crossed pseudos but
1639 only when there are no asm errors as in the case of errors the
1640 asm is removed and it can result in incorrect allocation. */
10e1bdb2
TV
1641 for (i = FIRST_PSEUDO_REGISTER; i < max_regno; i++)
1642 if (lra_reg_info[i].nrefs != 0 && reg_renumber[i] >= 0
473574ee 1643 && lra_reg_info[i].call_insn
10e1bdb2
TV
1644 && overlaps_hard_reg_set_p (call_used_reg_set,
1645 PSEUDO_REGNO_MODE (i), reg_renumber[i]))
1646 gcc_unreachable ();
55a2c322
VM
1647 /* Setup insns to process on the next constraint pass. */
1648 bitmap_initialize (&changed_pseudo_bitmap, &reg_obstack);
1649 init_live_reload_and_inheritance_pseudos ();
6027ea4c 1650 fails_p = assign_by_spills ();
55a2c322
VM
1651 finish_live_reload_and_inheritance_pseudos ();
1652 bitmap_ior_into (&changed_pseudo_bitmap, &all_spilled_pseudos);
1653 no_spills_p = true;
1654 EXECUTE_IF_SET_IN_BITMAP (&all_spilled_pseudos, 0, u, bi)
1655 /* We ignore spilled pseudos created on last inheritance pass
1656 because they will be removed. */
8a8330b7 1657 if (lra_reg_info[u].restore_rtx == NULL_RTX)
55a2c322
VM
1658 {
1659 no_spills_p = false;
1660 break;
1661 }
1662 finish_live_range_start_chains ();
1663 bitmap_clear (&all_spilled_pseudos);
1664 bitmap_initialize (&insns_to_process, &reg_obstack);
1665 EXECUTE_IF_SET_IN_BITMAP (&changed_pseudo_bitmap, 0, u, bi)
1666 bitmap_ior_into (&insns_to_process, &lra_reg_info[u].insn_bitmap);
1667 bitmap_clear (&changed_pseudo_bitmap);
1668 EXECUTE_IF_SET_IN_BITMAP (&insns_to_process, 0, u, bi)
1669 {
1670 lra_push_insn_by_uid (u);
1671 /* Invalidate alternatives for insn should be processed. */
1672 lra_set_used_insn_alternative_by_uid (u, -1);
1673 }
1674 bitmap_clear (&insns_to_process);
1675 finish_regno_assign_info ();
8a8330b7 1676 free (regno_live_length);
55a2c322
VM
1677 free (regno_allocno_class_array);
1678 free (sorted_pseudos);
1679 free (sorted_reload_pseudos);
1680 finish_lives ();
1681 timevar_pop (TV_LRA_ASSIGN);
f54437d5
VM
1682 if (former_reload_pseudo_spill_p)
1683 lra_assignment_iter_after_spill++;
b6c38c69
BS
1684 /* This is conditional on flag_checking because valid code can take
1685 more than this maximum number of iteration, but at the same time
1686 the test can uncover errors in machine descriptions. */
1687 if (flag_checking
1688 && (lra_assignment_iter_after_spill
1689 > LRA_MAX_ASSIGNMENT_ITERATION_NUMBER))
f54437d5 1690 internal_error
a9c697b8 1691 ("maximum number of LRA assignment passes is achieved (%d)",
f54437d5 1692 LRA_MAX_ASSIGNMENT_ITERATION_NUMBER);
55a2c322
VM
1693 return no_spills_p;
1694}
8a8330b7 1695
6027ea4c
VM
1696/* Find start and finish insns for reload pseudo REGNO. Return true
1697 if we managed to find the expected insns. Return false,
1698 otherwise. */
1699static bool
1700find_reload_regno_insns (int regno, rtx_insn * &start, rtx_insn * &finish)
1701{
1702 unsigned int uid;
1703 bitmap_iterator bi;
1704 int n = 0;
1705 rtx_insn *prev_insn, *next_insn;
1706 rtx_insn *start_insn = NULL, *first_insn = NULL, *second_insn = NULL;
1707
1708 EXECUTE_IF_SET_IN_BITMAP (&lra_reg_info[regno].insn_bitmap, 0, uid, bi)
1709 {
1710 if (start_insn == NULL)
1711 start_insn = lra_insn_recog_data[uid]->insn;
1712 n++;
1713 }
1714 /* For reload pseudo we should have at most 3 insns referring for it:
1715 input/output reload insns and the original insn. */
1716 if (n > 3)
1717 return false;
1718 if (n > 1)
1719 {
1720 for (prev_insn = PREV_INSN (start_insn),
1721 next_insn = NEXT_INSN (start_insn);
1722 n != 1 && (prev_insn != NULL || next_insn != NULL); )
1723 {
1724 if (prev_insn != NULL && first_insn == NULL)
1725 {
1726 if (! bitmap_bit_p (&lra_reg_info[regno].insn_bitmap,
1727 INSN_UID (prev_insn)))
1728 prev_insn = PREV_INSN (prev_insn);
1729 else
1730 {
1731 first_insn = prev_insn;
1732 n--;
1733 }
1734 }
1735 if (next_insn != NULL && second_insn == NULL)
1736 {
1737 if (! bitmap_bit_p (&lra_reg_info[regno].insn_bitmap,
1738 INSN_UID (next_insn)))
1739 next_insn = NEXT_INSN (next_insn);
1740 else
1741 {
1742 second_insn = next_insn;
1743 n--;
1744 }
1745 }
1746 }
1747 if (n > 1)
1748 return false;
1749 }
1750 start = first_insn != NULL ? first_insn : start_insn;
1751 finish = second_insn != NULL ? second_insn : start_insn;
1752 return true;
1753}
1754
1755/* Process reload pseudos which did not get a hard reg, split a hard
1756 reg live range in live range of a reload pseudo, and then return
1757 TRUE. If we did not split a hard reg live range, report an error,
1758 and return FALSE. */
1759bool
1760lra_split_hard_reg_for (void)
1761{
7293e3f5 1762 int i, regno;
6027ea4c
VM
1763 rtx_insn *insn, *first, *last;
1764 unsigned int u;
1765 bitmap_iterator bi;
7293e3f5 1766 enum reg_class rclass;
6027ea4c
VM
1767 int max_regno = max_reg_num ();
1768 /* We did not assign hard regs to reload pseudos after two
1769 iterations. Either it's an asm and something is wrong with the
1770 constraints, or we have run out of spill registers; error out in
1771 either case. */
1772 bool asm_p = false;
7293e3f5 1773 bitmap_head failed_reload_insns, failed_reload_pseudos;
6027ea4c
VM
1774
1775 if (lra_dump_file != NULL)
1776 fprintf (lra_dump_file,
1777 "\n****** Splitting a hard reg after assignment #%d: ******\n\n",
1778 lra_assignment_iter);
7293e3f5 1779 bitmap_initialize (&failed_reload_pseudos, &reg_obstack);
003cd04c
VM
1780 bitmap_initialize (&non_reload_pseudos, &reg_obstack);
1781 bitmap_ior (&non_reload_pseudos, &lra_inheritance_pseudos, &lra_split_regs);
1782 bitmap_ior_into (&non_reload_pseudos, &lra_subreg_reload_pseudos);
1783 bitmap_ior_into (&non_reload_pseudos, &lra_optional_reload_pseudos);
7293e3f5 1784 for (i = lra_constraint_new_regno_start; i < max_regno; i++)
6027ea4c 1785 if (reg_renumber[i] < 0 && lra_reg_info[i].nrefs != 0
7293e3f5 1786 && (rclass = lra_get_allocno_class (i)) != NO_REGS
6027ea4c
VM
1787 && ! bitmap_bit_p (&non_reload_pseudos, i))
1788 {
6027ea4c
VM
1789 if (! find_reload_regno_insns (i, first, last))
1790 continue;
7293e3f5
VM
1791 if (spill_hard_reg_in_range (i, rclass, first, last))
1792 {
1793 bitmap_clear (&failed_reload_pseudos);
1794 return true;
1795 }
1796 bitmap_set_bit (&failed_reload_pseudos, i);
6027ea4c 1797 }
003cd04c 1798 bitmap_clear (&non_reload_pseudos);
6027ea4c 1799 bitmap_initialize (&failed_reload_insns, &reg_obstack);
7293e3f5 1800 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_pseudos, 0, u, bi)
6027ea4c 1801 {
7293e3f5 1802 regno = u;
6027ea4c
VM
1803 bitmap_ior_into (&failed_reload_insns,
1804 &lra_reg_info[regno].insn_bitmap);
7293e3f5
VM
1805 lra_setup_reg_renumber
1806 (regno, ira_class_hard_regs[lra_get_allocno_class (regno)][0], false);
6027ea4c
VM
1807 }
1808 EXECUTE_IF_SET_IN_BITMAP (&failed_reload_insns, 0, u, bi)
1809 {
1810 insn = lra_insn_recog_data[u]->insn;
1811 if (asm_noperands (PATTERN (insn)) >= 0)
1812 {
11067dee 1813 lra_asm_error_p = asm_p = true;
6027ea4c
VM
1814 error_for_asm (insn,
1815 "%<asm%> operand has impossible constraints");
1816 /* Avoid further trouble with this insn.
1817 For asm goto, instead of fixing up all the edges
1818 just clear the template and clear input operands
1819 (asm goto doesn't have any output operands). */
1820 if (JUMP_P (insn))
1821 {
1822 rtx asm_op = extract_asm_operands (PATTERN (insn));
1823 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1824 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1825 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1826 lra_update_insn_regno_info (insn);
1827 }
1828 else
1829 {
1830 PATTERN (insn) = gen_rtx_USE (VOIDmode, const0_rtx);
1831 lra_set_insn_deleted (insn);
1832 }
1833 }
1834 else if (!asm_p)
1835 {
1836 error ("unable to find a register to spill");
1837 fatal_insn ("this is the insn:", insn);
1838 }
1839 }
7293e3f5
VM
1840 bitmap_clear (&failed_reload_pseudos);
1841 bitmap_clear (&failed_reload_insns);
6027ea4c
VM
1842 return false;
1843}