1 /* Instruction scheduling pass. Selective scheduler and pipeliner.
2 Copyright (C) 2006, 2007, 2008, 2009, 2010, 2011
3 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "diagnostic-core.h"
26 #include "rtl.h"
27 #include "tm_p.h"
28 #include "hard-reg-set.h"
29 #include "regs.h"
30 #include "function.h"
31 #include "flags.h"
32 #include "insn-config.h"
33 #include "insn-attr.h"
34 #include "except.h"
35 #include "recog.h"
36 #include "params.h"
37 #include "target.h"
38 #include "timevar.h"
39 #include "tree-pass.h"
40 #include "sched-int.h"
41 #include "ggc.h"
42 #include "tree.h"
43 #include "vec.h"
44 #include "langhooks.h"
45 #include "rtlhooks-def.h"
46 #include "emit-rtl.h" /* FIXME: Can go away once crtl is moved to rtl.h. */
47
48 #ifdef INSN_SCHEDULING
49 #include "sel-sched-ir.h"
50 /* We don't have to use it except for sel_print_insn. */
51 #include "sel-sched-dump.h"
52
53 /* A vector holding bb info for the whole scheduling pass.  */
54 VEC(sel_global_bb_info_def, heap) *sel_global_bb_info = NULL;
55
56 /* A vector holding per-region bb info.  */
57 VEC(sel_region_bb_info_def, heap) *sel_region_bb_info = NULL;
58
59 /* A pool for allocating all lists. */
60 alloc_pool sched_lists_pool;
61
62 /* This contains information about successors for compute_av_set. */
63 struct succs_info current_succs;
64
65 /* Data structure to describe interaction with the generic scheduler utils. */
66 static struct common_sched_info_def sel_common_sched_info;
67
68 /* The loop nest being pipelined. */
69 struct loop *current_loop_nest;
70
71 /* LOOP_NESTS is a vector containing the corresponding loop nest for
72 each region. */
73 static VEC(loop_p, heap) *loop_nests = NULL;
74
75 /* Saves blocks already in loop regions, indexed by bb->index. */
76 static sbitmap bbs_in_loop_rgns = NULL;
77
78 /* CFG hooks that are saved before changing create_basic_block hook. */
79 static struct cfg_hooks orig_cfg_hooks;
80 \f
81
82 /* Array containing reverse topological index of function basic blocks,
83 indexed by BB->INDEX. */
84 static int *rev_top_order_index = NULL;
85
86 /* Length of the above array. */
87 static int rev_top_order_index_len = -1;
88
89 /* A regset pool structure. */
90 static struct
91 {
92 /* The stack to which regsets are returned. */
93 regset *v;
94
95   /* Its stack pointer: the number of regsets currently stored in V.  */
96 int n;
97
98 /* Its size. */
99 int s;
100
101 /* In VV we save all generated regsets so that, when destructing the
102 pool, we can compare it with V and check that every regset was returned
103 back to pool. */
104 regset *vv;
105
106   /* The stack pointer of VV: the number of regsets ever allocated.  */
107 int nn;
108
109 /* Its size. */
110 int ss;
111
112 /* The difference between allocated and returned regsets. */
113 int diff;
114 } regset_pool = { NULL, 0, 0, NULL, 0, 0, 0 };
115
116 /* This represents the nop pool. */
117 static struct
118 {
119 /* The vector which holds previously emitted nops. */
120 insn_t *v;
121
122   /* Its stack pointer: the number of nops currently in V.  */
123 int n;
124
125 /* Its size. */
126 int s;
127 } nop_pool = { NULL, 0, 0 };
128
129 /* The pool for basic block notes. */
130 static rtx_vec_t bb_note_pool;
131
132 /* A NOP pattern used to emit placeholder insns. */
133 rtx nop_pattern = NULL_RTX;
134 /* A special instruction that resides in EXIT_BLOCK.
135    EXIT_INSN is the successor of the insns that lead to EXIT_BLOCK.  */
136 rtx exit_insn = NULL_RTX;
137
138 /* TRUE if, while scheduling the current region (which is a loop), its
139    preheader was removed.  */
140 bool preheader_removed = false;
141 \f
142
143 /* Forward static declarations. */
144 static void fence_clear (fence_t);
145
146 static void deps_init_id (idata_t, insn_t, bool);
147 static void init_id_from_df (idata_t, insn_t, bool);
148 static expr_t set_insn_init (expr_t, vinsn_t, int);
149
150 static void cfg_preds (basic_block, insn_t **, int *);
151 static void prepare_insn_expr (insn_t, int);
152 static void free_history_vect (VEC (expr_history_def, heap) **);
153
154 static void move_bb_info (basic_block, basic_block);
155 static void remove_empty_bb (basic_block, bool);
156 static void sel_merge_blocks (basic_block, basic_block);
157 static void sel_remove_loop_preheader (void);
158 static bool bb_has_removable_jump_to_p (basic_block, basic_block);
159
160 static bool insn_is_the_only_one_in_bb_p (insn_t);
161 static void create_initial_data_sets (basic_block);
162
163 static void free_av_set (basic_block);
164 static void invalidate_av_set (basic_block);
165 static void extend_insn_data (void);
166 static void sel_init_new_insn (insn_t, int);
167 static void finish_insns (void);
168 \f
169 /* Various list functions. */
170
171 /* Copy an instruction list L. */
172 ilist_t
173 ilist_copy (ilist_t l)
174 {
175 ilist_t head = NULL, *tailp = &head;
176
177 while (l)
178 {
179 ilist_add (tailp, ILIST_INSN (l));
180 tailp = &ILIST_NEXT (*tailp);
181 l = ILIST_NEXT (l);
182 }
183
184 return head;
185 }
186
187 /* Invert an instruction list L. */
188 ilist_t
189 ilist_invert (ilist_t l)
190 {
191 ilist_t res = NULL;
192
193 while (l)
194 {
195 ilist_add (&res, ILIST_INSN (l));
196 l = ILIST_NEXT (l);
197 }
198
199 return res;
200 }
201
202 /* Add a new boundary to the LP list with parameters TO, PTR, and DC. */
203 void
204 blist_add (blist_t *lp, insn_t to, ilist_t ptr, deps_t dc)
205 {
206 bnd_t bnd;
207
208 _list_add (lp);
209 bnd = BLIST_BND (*lp);
210
211 BND_TO (bnd) = to;
212 BND_PTR (bnd) = ptr;
213 BND_AV (bnd) = NULL;
214 BND_AV1 (bnd) = NULL;
215 BND_DC (bnd) = dc;
216 }
217
218 /* Remove the list node pointed to by LP.  */
219 void
220 blist_remove (blist_t *lp)
221 {
222 bnd_t b = BLIST_BND (*lp);
223
224 av_set_clear (&BND_AV (b));
225 av_set_clear (&BND_AV1 (b));
226 ilist_clear (&BND_PTR (b));
227
228 _list_remove (lp);
229 }
230
231 /* Init a fence tail L. */
232 void
233 flist_tail_init (flist_tail_t l)
234 {
235 FLIST_TAIL_HEAD (l) = NULL;
236 FLIST_TAIL_TAILP (l) = &FLIST_TAIL_HEAD (l);
237 }
238
239 /* Try to find fence corresponding to INSN in L. */
240 fence_t
241 flist_lookup (flist_t l, insn_t insn)
242 {
243 while (l)
244 {
245 if (FENCE_INSN (FLIST_FENCE (l)) == insn)
246 return FLIST_FENCE (l);
247
248 l = FLIST_NEXT (l);
249 }
250
251 return NULL;
252 }
253
254 /* Init the fields of F before running fill_insns. */
255 static void
256 init_fence_for_scheduling (fence_t f)
257 {
258 FENCE_BNDS (f) = NULL;
259 FENCE_PROCESSED_P (f) = false;
260 FENCE_SCHEDULED_P (f) = false;
261 }
262
263 /* Add new fence consisting of INSN and STATE to the list pointed to by LP. */
264 static void
265 flist_add (flist_t *lp, insn_t insn, state_t state, deps_t dc, void *tc,
266 insn_t last_scheduled_insn, VEC(rtx,gc) *executing_insns,
267 int *ready_ticks, int ready_ticks_size, insn_t sched_next,
268 int cycle, int cycle_issued_insns, int issue_more,
269 bool starts_cycle_p, bool after_stall_p)
270 {
271 fence_t f;
272
273 _list_add (lp);
274 f = FLIST_FENCE (*lp);
275
276 FENCE_INSN (f) = insn;
277
278 gcc_assert (state != NULL);
279 FENCE_STATE (f) = state;
280
281 FENCE_CYCLE (f) = cycle;
282 FENCE_ISSUED_INSNS (f) = cycle_issued_insns;
283 FENCE_STARTS_CYCLE_P (f) = starts_cycle_p;
284 FENCE_AFTER_STALL_P (f) = after_stall_p;
285
286 gcc_assert (dc != NULL);
287 FENCE_DC (f) = dc;
288
289 gcc_assert (tc != NULL || targetm.sched.alloc_sched_context == NULL);
290 FENCE_TC (f) = tc;
291
292 FENCE_LAST_SCHEDULED_INSN (f) = last_scheduled_insn;
293 FENCE_ISSUE_MORE (f) = issue_more;
294 FENCE_EXECUTING_INSNS (f) = executing_insns;
295 FENCE_READY_TICKS (f) = ready_ticks;
296 FENCE_READY_TICKS_SIZE (f) = ready_ticks_size;
297 FENCE_SCHED_NEXT (f) = sched_next;
298
299 init_fence_for_scheduling (f);
300 }
301
302 /* Remove the head node of the list pointed to by LP. */
303 static void
304 flist_remove (flist_t *lp)
305 {
306 if (FENCE_INSN (FLIST_FENCE (*lp)))
307 fence_clear (FLIST_FENCE (*lp));
308 _list_remove (lp);
309 }
310
311 /* Clear the fence list pointed to by LP. */
312 void
313 flist_clear (flist_t *lp)
314 {
315 while (*lp)
316 flist_remove (lp);
317 }
318
319 /* Add ORIGINAL_INSN to the def list DL, honoring CROSSES_CALL.  */
320 void
321 def_list_add (def_list_t *dl, insn_t original_insn, bool crosses_call)
322 {
323 def_t d;
324
325 _list_add (dl);
326 d = DEF_LIST_DEF (*dl);
327
328 d->orig_insn = original_insn;
329 d->crosses_call = crosses_call;
330 }
331 \f
332
333 /* Functions to work with target contexts. */
334
335 /* Bulk target context. It is convenient for debugging purposes to ensure
336 that there are no uninitialized (null) target contexts. */
337 static tc_t bulk_tc = (tc_t) 1;
338
339 /* Target hooks wrappers. In the future we can provide some default
340 implementations for them. */
341
342 /* Allocate a store for the target context. */
343 static tc_t
344 alloc_target_context (void)
345 {
346 return (targetm.sched.alloc_sched_context
347 ? targetm.sched.alloc_sched_context () : bulk_tc);
348 }
349
350 /* Init target context TC.
351    If CLEAN_P is true, then make TC as if the scheduler were at its start.
352    Otherwise, copy the current backend context to TC.  */
353 static void
354 init_target_context (tc_t tc, bool clean_p)
355 {
356 if (targetm.sched.init_sched_context)
357 targetm.sched.init_sched_context (tc, clean_p);
358 }
359
360 /* Allocate and initialize a target context.  The meaning of CLEAN_P is the
361    same as in init_target_context ().  */
362 tc_t
363 create_target_context (bool clean_p)
364 {
365 tc_t tc = alloc_target_context ();
366
367 init_target_context (tc, clean_p);
368 return tc;
369 }
370
371 /* Copy TC to the current backend context. */
372 void
373 set_target_context (tc_t tc)
374 {
375 if (targetm.sched.set_sched_context)
376 targetm.sched.set_sched_context (tc);
377 }
378
379 /* TC is about to be destroyed. Free any internal data. */
380 static void
381 clear_target_context (tc_t tc)
382 {
383 if (targetm.sched.clear_sched_context)
384 targetm.sched.clear_sched_context (tc);
385 }
386
387 /* Clear and free TC.  */
388 static void
389 delete_target_context (tc_t tc)
390 {
391 clear_target_context (tc);
392
393 if (targetm.sched.free_sched_context)
394 targetm.sched.free_sched_context (tc);
395 }
396
397 /* Make a copy of FROM in TO.
398    NB: Maybe this should be a hook.  */
399 static void
400 copy_target_context (tc_t to, tc_t from)
401 {
402 tc_t tmp = create_target_context (false);
403
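      /* TMP now holds a copy of the current backend context.  Load FROM into
         the backend, capture that state into TO, and then restore the saved
         context from TMP.  */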
404 set_target_context (from);
405 init_target_context (to, false);
406
407 set_target_context (tmp);
408 delete_target_context (tmp);
409 }
410
411 /* Create a copy of TC. */
412 static tc_t
413 create_copy_of_target_context (tc_t tc)
414 {
415 tc_t copy = alloc_target_context ();
416
417 copy_target_context (copy, tc);
418
419 return copy;
420 }
421
422 /* Clear TC and initialize it according to CLEAN_P. The meaning of CLEAN_P
423 is the same as in init_target_context (). */
424 void
425 reset_target_context (tc_t tc, bool clean_p)
426 {
427 clear_target_context (tc);
428 init_target_context (tc, clean_p);
429 }
430 \f
431 /* Functions to work with dependence contexts.
432 Dc (aka deps context, aka deps_t, aka struct deps_desc *) is short for dependence
433 context. It accumulates information about processed insns to decide if
434    the current insn depends on the processed ones.  */
435
436 /* Make a copy of FROM in TO. */
437 static void
438 copy_deps_context (deps_t to, deps_t from)
439 {
440 init_deps (to, false);
441 deps_join (to, from);
442 }
443
444 /* Allocate store for dep context. */
445 static deps_t
446 alloc_deps_context (void)
447 {
448 return XNEW (struct deps_desc);
449 }
450
451 /* Allocate and initialize dep context. */
452 static deps_t
453 create_deps_context (void)
454 {
455 deps_t dc = alloc_deps_context ();
456
457 init_deps (dc, false);
458 return dc;
459 }
460
461 /* Create a copy of FROM. */
462 static deps_t
463 create_copy_of_deps_context (deps_t from)
464 {
465 deps_t to = alloc_deps_context ();
466
467 copy_deps_context (to, from);
468 return to;
469 }
470
471 /* Clean up internal data of DC. */
472 static void
473 clear_deps_context (deps_t dc)
474 {
475 free_deps (dc);
476 }
477
478 /* Clear and free DC. */
479 static void
480 delete_deps_context (deps_t dc)
481 {
482 clear_deps_context (dc);
483 free (dc);
484 }
485
486 /* Clear and init DC. */
487 static void
488 reset_deps_context (deps_t dc)
489 {
490 clear_deps_context (dc);
491 init_deps (dc, false);
492 }
493
494 /* This structure describes the dependence analysis hooks for advancing
495 dependence context. */
496 static struct sched_deps_info_def advance_deps_context_sched_deps_info =
497 {
498 NULL,
499
500 NULL, /* start_insn */
501 NULL, /* finish_insn */
502 NULL, /* start_lhs */
503 NULL, /* finish_lhs */
504 NULL, /* start_rhs */
505 NULL, /* finish_rhs */
506 haifa_note_reg_set,
507 haifa_note_reg_clobber,
508 haifa_note_reg_use,
509 NULL, /* note_mem_dep */
510 NULL, /* note_dep */
511
512 0, 0, 0
513 };
514
515 /* Process INSN and add its impact on DC. */
516 void
517 advance_deps_context (deps_t dc, insn_t insn)
518 {
519 sched_deps_info = &advance_deps_context_sched_deps_info;
520 deps_analyze_insn (dc, insn);
521 }
522 \f
523
524 /* Functions to work with DFA states. */
525
526 /* Allocate store for a DFA state. */
527 static state_t
528 state_alloc (void)
529 {
530 return xmalloc (dfa_state_size);
531 }
532
533 /* Allocate and initialize DFA state. */
534 static state_t
535 state_create (void)
536 {
537 state_t state = state_alloc ();
538
539 state_reset (state);
540 advance_state (state);
541 return state;
542 }
543
544 /* Free DFA state. */
545 static void
546 state_free (state_t state)
547 {
548 free (state);
549 }
550
551 /* Make a copy of FROM in TO. */
552 static void
553 state_copy (state_t to, state_t from)
554 {
555 memcpy (to, from, dfa_state_size);
556 }
557
558 /* Create a copy of FROM. */
559 static state_t
560 state_create_copy (state_t from)
561 {
562 state_t to = state_alloc ();
563
564 state_copy (to, from);
565 return to;
566 }
567 \f
568
569 /* Functions to work with fences. */
570
571 /* Clear the fence. */
572 static void
573 fence_clear (fence_t f)
574 {
575 state_t s = FENCE_STATE (f);
576 deps_t dc = FENCE_DC (f);
577 void *tc = FENCE_TC (f);
578
579 ilist_clear (&FENCE_BNDS (f));
580
581 gcc_assert ((s != NULL && dc != NULL && tc != NULL)
582 || (s == NULL && dc == NULL && tc == NULL));
583
584 free (s);
585
586 if (dc != NULL)
587 delete_deps_context (dc);
588
589 if (tc != NULL)
590 delete_target_context (tc);
591 VEC_free (rtx, gc, FENCE_EXECUTING_INSNS (f));
592 free (FENCE_READY_TICKS (f));
593 FENCE_READY_TICKS (f) = NULL;
594 }
595
596 /* Init a list of fences with successors of OLD_FENCE. */
597 void
598 init_fences (insn_t old_fence)
599 {
600 insn_t succ;
601 succ_iterator si;
602 bool first = true;
603 int ready_ticks_size = get_max_uid () + 1;
604
605 FOR_EACH_SUCC_1 (succ, si, old_fence,
606 SUCCS_NORMAL | SUCCS_SKIP_TO_LOOP_EXITS)
607 {
608
609 if (first)
610 first = false;
611 else
612 gcc_assert (flag_sel_sched_pipelining_outer_loops);
613
614 flist_add (&fences, succ,
615 state_create (),
616 create_deps_context () /* dc */,
617 create_target_context (true) /* tc */,
618 NULL_RTX /* last_scheduled_insn */,
619 NULL, /* executing_insns */
620 XCNEWVEC (int, ready_ticks_size), /* ready_ticks */
621 ready_ticks_size,
622 NULL_RTX /* sched_next */,
623 1 /* cycle */, 0 /* cycle_issued_insns */,
624 issue_rate, /* issue_more */
625 1 /* starts_cycle_p */, 0 /* after_stall_p */);
626 }
627 }
628
629 /* Merge two fences (filling the fields of fence F with the resulting values)
630    by the following rules: 1) state, target context and last scheduled insn are
631    propagated from the fallthrough edge if it is available;
632    2) deps context and cycle are propagated from the more probable edge;
633    3) all other fields are set to the corresponding constant values.
634
635 INSN, STATE, DC, TC, LAST_SCHEDULED_INSN, EXECUTING_INSNS,
636 READY_TICKS, READY_TICKS_SIZE, SCHED_NEXT, CYCLE, ISSUE_MORE
637 and AFTER_STALL_P are the corresponding fields of the second fence. */
638 static void
639 merge_fences (fence_t f, insn_t insn,
640 state_t state, deps_t dc, void *tc,
641 rtx last_scheduled_insn, VEC(rtx, gc) *executing_insns,
642 int *ready_ticks, int ready_ticks_size,
643 rtx sched_next, int cycle, int issue_more, bool after_stall_p)
644 {
645 insn_t last_scheduled_insn_old = FENCE_LAST_SCHEDULED_INSN (f);
646
647 gcc_assert (sel_bb_head_p (FENCE_INSN (f))
648 && !sched_next && !FENCE_SCHED_NEXT (f));
649
650   /* Check if we can decide from which path the fences came.
651      If we can't (or don't want to), reset everything.  */
652 if (last_scheduled_insn == NULL
653 || last_scheduled_insn_old == NULL
654          /* This is the case when INSN is reachable on several paths from
655             one insn (this can happen when pipelining of outer loops is on and
656             there are two edges: one going around the inner loop and the other
657             going right through it; in such a case just reset everything).  */
658 || last_scheduled_insn == last_scheduled_insn_old)
659 {
660 state_reset (FENCE_STATE (f));
661 state_free (state);
662
663 reset_deps_context (FENCE_DC (f));
664 delete_deps_context (dc);
665
666 reset_target_context (FENCE_TC (f), true);
667 delete_target_context (tc);
668
669 if (cycle > FENCE_CYCLE (f))
670 FENCE_CYCLE (f) = cycle;
671
672 FENCE_LAST_SCHEDULED_INSN (f) = NULL;
673 FENCE_ISSUE_MORE (f) = issue_rate;
674 VEC_free (rtx, gc, executing_insns);
675 free (ready_ticks);
676 if (FENCE_EXECUTING_INSNS (f))
677 VEC_block_remove (rtx, FENCE_EXECUTING_INSNS (f), 0,
678 VEC_length (rtx, FENCE_EXECUTING_INSNS (f)));
679 if (FENCE_READY_TICKS (f))
680 memset (FENCE_READY_TICKS (f), 0, FENCE_READY_TICKS_SIZE (f));
681 }
682 else
683 {
684 edge edge_old = NULL, edge_new = NULL;
685 edge candidate;
686 succ_iterator si;
687 insn_t succ;
688
689 /* Find fallthrough edge. */
690 gcc_assert (BLOCK_FOR_INSN (insn)->prev_bb);
691 candidate = find_fallthru_edge_from (BLOCK_FOR_INSN (insn)->prev_bb);
692
693 if (!candidate
694 || (candidate->src != BLOCK_FOR_INSN (last_scheduled_insn)
695 && candidate->src != BLOCK_FOR_INSN (last_scheduled_insn_old)))
696 {
697 /* No fallthrough edge leading to basic block of INSN. */
698 state_reset (FENCE_STATE (f));
699 state_free (state);
700
701 reset_target_context (FENCE_TC (f), true);
702 delete_target_context (tc);
703
704 FENCE_LAST_SCHEDULED_INSN (f) = NULL;
705 FENCE_ISSUE_MORE (f) = issue_rate;
706 }
707 else
708 if (candidate->src == BLOCK_FOR_INSN (last_scheduled_insn))
709 {
710           /* It would be weird if the same insn were the successor of several
711              fallthrough edges.  */
712 gcc_assert (BLOCK_FOR_INSN (insn)->prev_bb
713 != BLOCK_FOR_INSN (last_scheduled_insn_old));
714
715 state_free (FENCE_STATE (f));
716 FENCE_STATE (f) = state;
717
718 delete_target_context (FENCE_TC (f));
719 FENCE_TC (f) = tc;
720
721 FENCE_LAST_SCHEDULED_INSN (f) = last_scheduled_insn;
722 FENCE_ISSUE_MORE (f) = issue_more;
723 }
724 else
725 {
726 /* Leave STATE, TC and LAST_SCHEDULED_INSN fields untouched. */
727 state_free (state);
728 delete_target_context (tc);
729
730 gcc_assert (BLOCK_FOR_INSN (insn)->prev_bb
731 != BLOCK_FOR_INSN (last_scheduled_insn));
732 }
733
734 /* Find edge of first predecessor (last_scheduled_insn_old->insn). */
735 FOR_EACH_SUCC_1 (succ, si, last_scheduled_insn_old,
736 SUCCS_NORMAL | SUCCS_SKIP_TO_LOOP_EXITS)
737 {
738 if (succ == insn)
739 {
740 /* No same successor allowed from several edges. */
741 gcc_assert (!edge_old);
742 edge_old = si.e1;
743 }
744 }
745 /* Find edge of second predecessor (last_scheduled_insn->insn). */
746 FOR_EACH_SUCC_1 (succ, si, last_scheduled_insn,
747 SUCCS_NORMAL | SUCCS_SKIP_TO_LOOP_EXITS)
748 {
749 if (succ == insn)
750 {
751 /* No same successor allowed from several edges. */
752 gcc_assert (!edge_new);
753 edge_new = si.e1;
754 }
755 }
756
757       /* Check if we can choose the most probable predecessor.  */
758 if (edge_old == NULL || edge_new == NULL)
759 {
760 reset_deps_context (FENCE_DC (f));
761 delete_deps_context (dc);
762 VEC_free (rtx, gc, executing_insns);
763 free (ready_ticks);
764
765 FENCE_CYCLE (f) = MAX (FENCE_CYCLE (f), cycle);
766 if (FENCE_EXECUTING_INSNS (f))
767 VEC_block_remove (rtx, FENCE_EXECUTING_INSNS (f), 0,
768 VEC_length (rtx, FENCE_EXECUTING_INSNS (f)));
769 if (FENCE_READY_TICKS (f))
770 memset (FENCE_READY_TICKS (f), 0, FENCE_READY_TICKS_SIZE (f));
771 }
772 else
773 if (edge_new->probability > edge_old->probability)
774 {
775 delete_deps_context (FENCE_DC (f));
776 FENCE_DC (f) = dc;
777 VEC_free (rtx, gc, FENCE_EXECUTING_INSNS (f));
778 FENCE_EXECUTING_INSNS (f) = executing_insns;
779 free (FENCE_READY_TICKS (f));
780 FENCE_READY_TICKS (f) = ready_ticks;
781 FENCE_READY_TICKS_SIZE (f) = ready_ticks_size;
782 FENCE_CYCLE (f) = cycle;
783 }
784 else
785 {
786 /* Leave DC and CYCLE untouched. */
787 delete_deps_context (dc);
788 VEC_free (rtx, gc, executing_insns);
789 free (ready_ticks);
790 }
791 }
792
793 /* Fill remaining invariant fields. */
794 if (after_stall_p)
795 FENCE_AFTER_STALL_P (f) = 1;
796
797 FENCE_ISSUED_INSNS (f) = 0;
798 FENCE_STARTS_CYCLE_P (f) = 1;
799 FENCE_SCHED_NEXT (f) = NULL;
800 }
801
802 /* Add a new fence to NEW_FENCES list, initializing it from all
803 other parameters. */
804 static void
805 add_to_fences (flist_tail_t new_fences, insn_t insn,
806 state_t state, deps_t dc, void *tc, rtx last_scheduled_insn,
807 VEC(rtx, gc) *executing_insns, int *ready_ticks,
808 int ready_ticks_size, rtx sched_next, int cycle,
809 int cycle_issued_insns, int issue_rate,
810 bool starts_cycle_p, bool after_stall_p)
811 {
812 fence_t f = flist_lookup (FLIST_TAIL_HEAD (new_fences), insn);
813
814 if (! f)
815 {
816 flist_add (FLIST_TAIL_TAILP (new_fences), insn, state, dc, tc,
817 last_scheduled_insn, executing_insns, ready_ticks,
818 ready_ticks_size, sched_next, cycle, cycle_issued_insns,
819 issue_rate, starts_cycle_p, after_stall_p);
820
821 FLIST_TAIL_TAILP (new_fences)
822 = &FLIST_NEXT (*FLIST_TAIL_TAILP (new_fences));
823 }
824 else
825 {
826 merge_fences (f, insn, state, dc, tc, last_scheduled_insn,
827 executing_insns, ready_ticks, ready_ticks_size,
828 sched_next, cycle, issue_rate, after_stall_p);
829 }
830 }
831
832 /* Move the first fence in the OLD_FENCES list to NEW_FENCES. */
833 void
834 move_fence_to_fences (flist_t old_fences, flist_tail_t new_fences)
835 {
836 fence_t f, old;
837 flist_t *tailp = FLIST_TAIL_TAILP (new_fences);
838
839 old = FLIST_FENCE (old_fences);
840 f = flist_lookup (FLIST_TAIL_HEAD (new_fences),
841 FENCE_INSN (FLIST_FENCE (old_fences)));
842 if (f)
843 {
844 merge_fences (f, old->insn, old->state, old->dc, old->tc,
845 old->last_scheduled_insn, old->executing_insns,
846 old->ready_ticks, old->ready_ticks_size,
847 old->sched_next, old->cycle, old->issue_more,
848 old->after_stall_p);
849 }
850 else
851 {
852 _list_add (tailp);
853 FLIST_TAIL_TAILP (new_fences) = &FLIST_NEXT (*tailp);
854 *FLIST_FENCE (*tailp) = *old;
855 init_fence_for_scheduling (FLIST_FENCE (*tailp));
856 }
857 FENCE_INSN (old) = NULL;
858 }
859
860 /* Add a new fence to NEW_FENCES list and initialize most of its data
861 as a clean one. */
862 void
863 add_clean_fence_to_fences (flist_tail_t new_fences, insn_t succ, fence_t fence)
864 {
865 int ready_ticks_size = get_max_uid () + 1;
866
867 add_to_fences (new_fences,
868 succ, state_create (), create_deps_context (),
869 create_target_context (true),
870 NULL_RTX, NULL,
871 XCNEWVEC (int, ready_ticks_size), ready_ticks_size,
872 NULL_RTX, FENCE_CYCLE (fence) + 1,
873 0, issue_rate, 1, FENCE_AFTER_STALL_P (fence));
874 }
875
876 /* Add a new fence to NEW_FENCES list and initialize all of its data
877 from FENCE and SUCC. */
878 void
879 add_dirty_fence_to_fences (flist_tail_t new_fences, insn_t succ, fence_t fence)
880 {
881 int * new_ready_ticks
882 = XNEWVEC (int, FENCE_READY_TICKS_SIZE (fence));
883
884 memcpy (new_ready_ticks, FENCE_READY_TICKS (fence),
885 FENCE_READY_TICKS_SIZE (fence) * sizeof (int));
886 add_to_fences (new_fences,
887 succ, state_create_copy (FENCE_STATE (fence)),
888 create_copy_of_deps_context (FENCE_DC (fence)),
889 create_copy_of_target_context (FENCE_TC (fence)),
890 FENCE_LAST_SCHEDULED_INSN (fence),
891 VEC_copy (rtx, gc, FENCE_EXECUTING_INSNS (fence)),
892 new_ready_ticks,
893 FENCE_READY_TICKS_SIZE (fence),
894 FENCE_SCHED_NEXT (fence),
895 FENCE_CYCLE (fence),
896 FENCE_ISSUED_INSNS (fence),
897 FENCE_ISSUE_MORE (fence),
898 FENCE_STARTS_CYCLE_P (fence),
899 FENCE_AFTER_STALL_P (fence));
900 }
901 \f
902
903 /* Functions to work with regset and nop pools. */
904
905 /* Return a regset from the pool.  Some of its bits might still be set
906    from previous usage.  */
907 regset
908 get_regset_from_pool (void)
909 {
910 regset rs;
911
912 if (regset_pool.n != 0)
913 rs = regset_pool.v[--regset_pool.n];
914 else
915 /* We need to create the regset. */
916 {
917 rs = ALLOC_REG_SET (&reg_obstack);
918
919 if (regset_pool.nn == regset_pool.ss)
920 regset_pool.vv = XRESIZEVEC (regset, regset_pool.vv,
921 (regset_pool.ss = 2 * regset_pool.ss + 1));
922 regset_pool.vv[regset_pool.nn++] = rs;
923 }
924
925 regset_pool.diff++;
926
927 return rs;
928 }
929
930 /* Same as above, but return an empty regset.  */
931 regset
932 get_clear_regset_from_pool (void)
933 {
934 regset rs = get_regset_from_pool ();
935
936 CLEAR_REG_SET (rs);
937 return rs;
938 }
939
940 /* Return regset RS to the pool for future use. */
941 void
942 return_regset_to_pool (regset rs)
943 {
944 gcc_assert (rs);
945 regset_pool.diff--;
946
947 if (regset_pool.n == regset_pool.s)
948 regset_pool.v = XRESIZEVEC (regset, regset_pool.v,
949 (regset_pool.s = 2 * regset_pool.s + 1));
950 regset_pool.v[regset_pool.n++] = rs;
951 }
952
953 #ifdef ENABLE_CHECKING
954 /* This is used as a qsort callback for sorting regset pool stacks.
955 X and XX are addresses of two regsets. They are never equal. */
956 static int
957 cmp_v_in_regset_pool (const void *x, const void *xx)
958 {
959 return *((const regset *) x) - *((const regset *) xx);
960 }
961 #endif
962
963 /* Free the regset pool possibly checking for memory leaks. */
964 void
965 free_regset_pool (void)
966 {
967 #ifdef ENABLE_CHECKING
968 {
969 regset *v = regset_pool.v;
970 int i = 0;
971 int n = regset_pool.n;
972
973 regset *vv = regset_pool.vv;
974 int ii = 0;
975 int nn = regset_pool.nn;
976
977 int diff = 0;
978
979 gcc_assert (n <= nn);
980
981 /* Sort both vectors so it will be possible to compare them. */
982 qsort (v, n, sizeof (*v), cmp_v_in_regset_pool);
983 qsort (vv, nn, sizeof (*vv), cmp_v_in_regset_pool);
984
985 while (ii < nn)
986 {
987 if (v[i] == vv[ii])
988 i++;
989 else
990 /* VV[II] was lost. */
991 diff++;
992
993 ii++;
994 }
995
996 gcc_assert (diff == regset_pool.diff);
997 }
998 #endif
999
1000   /* If this is not true, we have a memory leak.  */
1001 gcc_assert (regset_pool.diff == 0);
1002
1003 while (regset_pool.n)
1004 {
1005 --regset_pool.n;
1006 FREE_REG_SET (regset_pool.v[regset_pool.n]);
1007 }
1008
1009 free (regset_pool.v);
1010 regset_pool.v = NULL;
1011 regset_pool.s = 0;
1012
1013 free (regset_pool.vv);
1014 regset_pool.vv = NULL;
1015 regset_pool.nn = 0;
1016 regset_pool.ss = 0;
1017
1018 regset_pool.diff = 0;
1019 }
1020 \f
1021
1022 /* Functions to work with nop pools. NOP insns are used as temporary
1023 placeholders of the insns being scheduled to allow correct update of
1024 the data sets. When update is finished, NOPs are deleted. */
1025
1026 /* A vinsn that is used to represent a nop. This vinsn is shared among all
1027 nops sel-sched generates. */
1028 static vinsn_t nop_vinsn = NULL;
1029
1030 /* Emit a nop before INSN, taking it from the pool.  */
1031 insn_t
1032 get_nop_from_pool (insn_t insn)
1033 {
1034 insn_t nop;
1035 bool old_p = nop_pool.n != 0;
1036 int flags;
1037
1038 if (old_p)
1039 nop = nop_pool.v[--nop_pool.n];
1040 else
1041 nop = nop_pattern;
1042
1043 nop = emit_insn_before (nop, insn);
1044
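      /* A nop reused from the pool already has a luid, so it only needs its
         SSID data initialized; a freshly created nop needs a luid as well.  */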
1045 if (old_p)
1046 flags = INSN_INIT_TODO_SSID;
1047 else
1048 flags = INSN_INIT_TODO_LUID | INSN_INIT_TODO_SSID;
1049
1050 set_insn_init (INSN_EXPR (insn), nop_vinsn, INSN_SEQNO (insn));
1051 sel_init_new_insn (nop, flags);
1052
1053 return nop;
1054 }
1055
1056 /* Remove NOP from the instruction stream and return it to the pool. */
1057 void
1058 return_nop_to_pool (insn_t nop, bool full_tidying)
1059 {
1060 gcc_assert (INSN_IN_STREAM_P (nop));
1061 sel_remove_insn (nop, false, full_tidying);
1062
1063 if (nop_pool.n == nop_pool.s)
1064 nop_pool.v = XRESIZEVEC (rtx, nop_pool.v,
1065 (nop_pool.s = 2 * nop_pool.s + 1));
1066 nop_pool.v[nop_pool.n++] = nop;
1067 }
1068
1069 /* Free the nop pool. */
1070 void
1071 free_nop_pool (void)
1072 {
1073 nop_pool.n = 0;
1074 nop_pool.s = 0;
1075 free (nop_pool.v);
1076 nop_pool.v = NULL;
1077 }
1078 \f
1079
1080 /* Skip unspec to support ia64 speculation. Called from rtx_equal_p_cb.
1081 The callback is given two rtxes XX and YY and writes the new rtxes
1082 to NX and NY in case some needs to be skipped. */
1083 static int
1084 skip_unspecs_callback (const_rtx *xx, const_rtx *yy, rtx *nx, rtx* ny)
1085 {
1086 const_rtx x = *xx;
1087 const_rtx y = *yy;
1088
1089 if (GET_CODE (x) == UNSPEC
1090 && (targetm.sched.skip_rtx_p == NULL
1091 || targetm.sched.skip_rtx_p (x)))
1092 {
1093 *nx = XVECEXP (x, 0, 0);
1094 *ny = CONST_CAST_RTX (y);
1095 return 1;
1096 }
1097
1098 if (GET_CODE (y) == UNSPEC
1099 && (targetm.sched.skip_rtx_p == NULL
1100 || targetm.sched.skip_rtx_p (y)))
1101 {
1102 *nx = CONST_CAST_RTX (x);
1103 *ny = XVECEXP (y, 0, 0);
1104 return 1;
1105 }
1106
1107 return 0;
1108 }
1109
1110 /* Callback, called from hash_rtx_cb.  Helps to hash an UNSPEC rtx X correctly
1111    to support ia64 speculation.  When changes are needed, the new rtx NX and
1112    new mode NMODE are written, and the callback returns true.  */
1113 static int
1114 hash_with_unspec_callback (const_rtx x, enum machine_mode mode ATTRIBUTE_UNUSED,
1115 rtx *nx, enum machine_mode* nmode)
1116 {
1117 if (GET_CODE (x) == UNSPEC
1118 && targetm.sched.skip_rtx_p
1119 && targetm.sched.skip_rtx_p (x))
1120 {
1121       *nx = XVECEXP (x, 0, 0);
1122 *nmode = VOIDmode;
1123 return 1;
1124 }
1125
1126 return 0;
1127 }
1128
1129 /* Return true if LHS and RHS are ok to be scheduled separately.  */
1130 static bool
1131 lhs_and_rhs_separable_p (rtx lhs, rtx rhs)
1132 {
1133 if (lhs == NULL || rhs == NULL)
1134 return false;
1135
1136   /* Do not schedule CONST, CONST_INT, CONST_DOUBLE etc. as rhs: no point
1137      in using a reg if a const can be used.  Moreover, scheduling a const as
1138      rhs may lead to a mode mismatch, because consts don't have modes but could
1139      be merged from branches where the same const is used in different modes.  */
1140 if (CONSTANT_P (rhs))
1141 return false;
1142
1143 /* ??? Do not rename predicate registers to avoid ICEs in bundling. */
1144 if (COMPARISON_P (rhs))
1145 return false;
1146
1147 /* Do not allow single REG to be an rhs. */
1148 if (REG_P (rhs))
1149 return false;
1150
1151 /* See comment at find_used_regs_1 (*1) for explanation of this
1152 restriction. */
1153 /* FIXME: remove this later. */
1154 if (MEM_P (lhs))
1155 return false;
1156
1157 /* This will filter all tricky things like ZERO_EXTRACT etc.
1158 For now we don't handle it. */
1159 if (!REG_P (lhs) && !MEM_P (lhs))
1160 return false;
1161
1162 return true;
1163 }
1164
1165 /* Initialize vinsn VI for INSN. Only for use from vinsn_create (). When
1166 FORCE_UNIQUE_P is true, the resulting vinsn will not be clonable. This is
1167 used e.g. for insns from recovery blocks. */
1168 static void
1169 vinsn_init (vinsn_t vi, insn_t insn, bool force_unique_p)
1170 {
1171 hash_rtx_callback_function hrcf;
1172 int insn_class;
1173
1174 VINSN_INSN_RTX (vi) = insn;
1175 VINSN_COUNT (vi) = 0;
1176 vi->cost = -1;
1177
1178 if (INSN_NOP_P (insn))
1179 return;
1180
1181 if (DF_INSN_UID_SAFE_GET (INSN_UID (insn)) != NULL)
1182 init_id_from_df (VINSN_ID (vi), insn, force_unique_p);
1183 else
1184 deps_init_id (VINSN_ID (vi), insn, force_unique_p);
1185
1186 /* Hash vinsn depending on whether it is separable or not. */
1187 hrcf = targetm.sched.skip_rtx_p ? hash_with_unspec_callback : NULL;
1188 if (VINSN_SEPARABLE_P (vi))
1189 {
1190 rtx rhs = VINSN_RHS (vi);
1191
1192 VINSN_HASH (vi) = hash_rtx_cb (rhs, GET_MODE (rhs),
1193 NULL, NULL, false, hrcf);
1194 VINSN_HASH_RTX (vi) = hash_rtx_cb (VINSN_PATTERN (vi),
1195 VOIDmode, NULL, NULL,
1196 false, hrcf);
1197 }
1198 else
1199 {
1200 VINSN_HASH (vi) = hash_rtx_cb (VINSN_PATTERN (vi), VOIDmode,
1201 NULL, NULL, false, hrcf);
1202 VINSN_HASH_RTX (vi) = VINSN_HASH (vi);
1203 }
1204
1205 insn_class = haifa_classify_insn (insn);
1206 if (insn_class >= 2
1207 && (!targetm.sched.get_insn_spec_ds
1208 || ((targetm.sched.get_insn_spec_ds (insn) & BEGIN_CONTROL)
1209 == 0)))
1210 VINSN_MAY_TRAP_P (vi) = true;
1211 else
1212 VINSN_MAY_TRAP_P (vi) = false;
1213 }
1214
1215 /* Indicate that VI has become a part of an rtx object.  */
1216 void
1217 vinsn_attach (vinsn_t vi)
1218 {
1219 /* Assert that VI is not pending for deletion. */
1220 gcc_assert (VINSN_INSN_RTX (vi));
1221
1222 VINSN_COUNT (vi)++;
1223 }
1224
1225 /* Create and init VI from INSN.  Use FORCE_UNIQUE_P for determining the
1226    correct VINSN_TYPE (VI).  */
1227 static vinsn_t
1228 vinsn_create (insn_t insn, bool force_unique_p)
1229 {
1230 vinsn_t vi = XCNEW (struct vinsn_def);
1231
1232 vinsn_init (vi, insn, force_unique_p);
1233 return vi;
1234 }
1235
1236 /* Return a copy of VI. When REATTACH_P is true, detach VI and attach
1237 the copy. */
1238 vinsn_t
1239 vinsn_copy (vinsn_t vi, bool reattach_p)
1240 {
1241 rtx copy;
1242 bool unique = VINSN_UNIQUE_P (vi);
1243 vinsn_t new_vi;
1244
1245 copy = create_copy_of_insn_rtx (VINSN_INSN_RTX (vi));
1246 new_vi = create_vinsn_from_insn_rtx (copy, unique);
1247 if (reattach_p)
1248 {
1249 vinsn_detach (vi);
1250 vinsn_attach (new_vi);
1251 }
1252
1253 return new_vi;
1254 }
1255
1256 /* Delete the VI vinsn and free its data. */
1257 static void
1258 vinsn_delete (vinsn_t vi)
1259 {
1260 gcc_assert (VINSN_COUNT (vi) == 0);
1261
1262 if (!INSN_NOP_P (VINSN_INSN_RTX (vi)))
1263 {
1264 return_regset_to_pool (VINSN_REG_SETS (vi));
1265 return_regset_to_pool (VINSN_REG_USES (vi));
1266 return_regset_to_pool (VINSN_REG_CLOBBERS (vi));
1267 }
1268
1269 free (vi);
1270 }
1271
1272 /* Indicate that VI is no longer a part of some rtx object.
1273 Remove VI if it is no longer needed. */
1274 void
1275 vinsn_detach (vinsn_t vi)
1276 {
1277 gcc_assert (VINSN_COUNT (vi) > 0);
1278
1279 if (--VINSN_COUNT (vi) == 0)
1280 vinsn_delete (vi);
1281 }
1282
1283 /* Returns TRUE if VI is a branch. */
1284 bool
1285 vinsn_cond_branch_p (vinsn_t vi)
1286 {
1287 insn_t insn;
1288
1289 if (!VINSN_UNIQUE_P (vi))
1290 return false;
1291
1292 insn = VINSN_INSN_RTX (vi);
1293 if (BB_END (BLOCK_FOR_INSN (insn)) != insn)
1294 return false;
1295
1296 return control_flow_insn_p (insn);
1297 }
1298
1299 /* Return latency of INSN. */
1300 static int
1301 sel_insn_rtx_cost (rtx insn)
1302 {
1303 int cost;
1304
1305 /* A USE insn, or something else we don't need to
1306 understand. We can't pass these directly to
1307 result_ready_cost or insn_default_latency because it will
1308 trigger a fatal error for unrecognizable insns. */
1309 if (recog_memoized (insn) < 0)
1310 cost = 0;
1311 else
1312 {
1313 cost = insn_default_latency (insn);
1314
1315 if (cost < 0)
1316 cost = 0;
1317 }
1318
1319 return cost;
1320 }
1321
1322 /* Return the cost of the VI.
1323 !!! FIXME: Unify with haifa-sched.c: insn_cost (). */
1324 int
1325 sel_vinsn_cost (vinsn_t vi)
1326 {
1327 int cost = vi->cost;
1328
1329 if (cost < 0)
1330 {
1331 cost = sel_insn_rtx_cost (VINSN_INSN_RTX (vi));
1332 vi->cost = cost;
1333 }
1334
1335 return cost;
1336 }
1337 \f
1338
1339 /* Functions for insn emitting. */
1340
1341 /* Emit new insn after AFTER based on PATTERN and initialize its data from
1342 EXPR and SEQNO. */
1343 insn_t
1344 sel_gen_insn_from_rtx_after (rtx pattern, expr_t expr, int seqno, insn_t after)
1345 {
1346 insn_t new_insn;
1347
1348 gcc_assert (EXPR_TARGET_AVAILABLE (expr) == true);
1349
1350 new_insn = emit_insn_after (pattern, after);
1351 set_insn_init (expr, NULL, seqno);
1352 sel_init_new_insn (new_insn, INSN_INIT_TODO_LUID | INSN_INIT_TODO_SSID);
1353
1354 return new_insn;
1355 }
1356
1357 /* Force newly generated vinsns to be unique. */
1358 static bool init_insn_force_unique_p = false;
1359
1360 /* Emit new speculation recovery insn after AFTER based on PATTERN and
1361 initialize its data from EXPR and SEQNO. */
1362 insn_t
1363 sel_gen_recovery_insn_from_rtx_after (rtx pattern, expr_t expr, int seqno,
1364 insn_t after)
1365 {
1366 insn_t insn;
1367
1368 gcc_assert (!init_insn_force_unique_p);
1369
1370 init_insn_force_unique_p = true;
1371 insn = sel_gen_insn_from_rtx_after (pattern, expr, seqno, after);
1372 CANT_MOVE (insn) = 1;
1373 init_insn_force_unique_p = false;
1374
1375 return insn;
1376 }
1377
1378 /* Emit new insn after AFTER based on EXPR and SEQNO. If VINSN is not NULL,
1379 take it as a new vinsn instead of EXPR's vinsn.
1380 We simplify insns later, after scheduling region in
1381 simplify_changed_insns. */
1382 insn_t
1383 sel_gen_insn_from_expr_after (expr_t expr, vinsn_t vinsn, int seqno,
1384 insn_t after)
1385 {
1386 expr_t emit_expr;
1387 insn_t insn;
1388 int flags;
1389
1390 emit_expr = set_insn_init (expr, vinsn ? vinsn : EXPR_VINSN (expr),
1391 seqno);
1392 insn = EXPR_INSN_RTX (emit_expr);
1393 add_insn_after (insn, after, BLOCK_FOR_INSN (insn));
1394
1395 flags = INSN_INIT_TODO_SSID;
1396 if (INSN_LUID (insn) == 0)
1397 flags |= INSN_INIT_TODO_LUID;
1398 sel_init_new_insn (insn, flags);
1399
1400 return insn;
1401 }
1402
1403 /* Move insn from EXPR after AFTER. */
1404 insn_t
1405 sel_move_insn (expr_t expr, int seqno, insn_t after)
1406 {
1407 insn_t insn = EXPR_INSN_RTX (expr);
1408 basic_block bb = BLOCK_FOR_INSN (after);
1409 insn_t next = NEXT_INSN (after);
1410
1411 /* Assert that in move_op we disconnected this insn properly. */
1412 gcc_assert (EXPR_VINSN (INSN_EXPR (insn)) != NULL);
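      /* Splice INSN into the insn stream between AFTER and NEXT.  */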
1413 PREV_INSN (insn) = after;
1414 NEXT_INSN (insn) = next;
1415
1416 NEXT_INSN (after) = insn;
1417 PREV_INSN (next) = insn;
1418
1419 /* Update links from insn to bb and vice versa. */
1420 df_insn_change_bb (insn, bb);
1421 if (BB_END (bb) == after)
1422 BB_END (bb) = insn;
1423
1424 prepare_insn_expr (insn, seqno);
1425 return insn;
1426 }
1427
1428 \f
1429 /* Functions to work with right-hand sides. */
1430
1431 /* Search for a hash value determined by UID/NEW_VINSN in a sorted vector
1432 VECT and return true when found. Use NEW_VINSN for comparison only when
1433 COMPARE_VINSNS is true. Write to INDP the index on which
1434 the search has stopped, such that inserting the new element at INDP will
1435 retain VECT's sort order. */
1436 static bool
1437 find_in_history_vect_1 (VEC(expr_history_def, heap) *vect,
1438 unsigned uid, vinsn_t new_vinsn,
1439 bool compare_vinsns, int *indp)
1440 {
1441 expr_history_def *arr;
1442 int i, j, len = VEC_length (expr_history_def, vect);
1443
1444 if (len == 0)
1445 {
1446 *indp = 0;
1447 return false;
1448 }
1449
1450 arr = VEC_address (expr_history_def, vect);
1451 i = 0, j = len - 1;
1452
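      /* Scan the vector, which is kept sorted by UID; stop as soon as the
         UIDs seen become greater than UID.  */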
1453 while (i <= j)
1454 {
1455 unsigned auid = arr[i].uid;
1456 vinsn_t avinsn = arr[i].new_expr_vinsn;
1457
1458 if (auid == uid
1459 /* When undoing transformation on a bookkeeping copy, the new vinsn
1460 may not be exactly equal to the one that is saved in the vector.
1461 This is because the insn whose copy we're checking was possibly
1462 substituted itself. */
1463 && (! compare_vinsns
1464 || vinsn_equal_p (avinsn, new_vinsn)))
1465 {
1466 *indp = i;
1467 return true;
1468 }
1469 else if (auid > uid)
1470 break;
1471 i++;
1472 }
1473
1474 *indp = i;
1475 return false;
1476 }
1477
1478 /* Search for a uid of INSN and NEW_VINSN in a sorted vector VECT. Return
1479    the position found or -1 if no such value is in the vector.
1480 Search also for UIDs of insn's originators, if ORIGINATORS_P is true. */
1481 int
1482 find_in_history_vect (VEC(expr_history_def, heap) *vect, rtx insn,
1483 vinsn_t new_vinsn, bool originators_p)
1484 {
1485 int ind;
1486
1487 if (find_in_history_vect_1 (vect, INSN_UID (insn), new_vinsn,
1488 false, &ind))
1489 return ind;
1490
1491 if (INSN_ORIGINATORS (insn) && originators_p)
1492 {
1493 unsigned uid;
1494 bitmap_iterator bi;
1495
1496 EXECUTE_IF_SET_IN_BITMAP (INSN_ORIGINATORS (insn), 0, uid, bi)
1497 if (find_in_history_vect_1 (vect, uid, new_vinsn, false, &ind))
1498 return ind;
1499 }
1500
1501 return -1;
1502 }
1503
1504 /* Insert new element in a sorted history vector pointed to by PVECT,
1505 if it is not there already. The element is searched using
1506 UID/NEW_EXPR_VINSN pair. TYPE, OLD_EXPR_VINSN and SPEC_DS save
1507 the history of a transformation. */
1508 void
1509 insert_in_history_vect (VEC (expr_history_def, heap) **pvect,
1510 unsigned uid, enum local_trans_type type,
1511 vinsn_t old_expr_vinsn, vinsn_t new_expr_vinsn,
1512 ds_t spec_ds)
1513 {
1514 VEC(expr_history_def, heap) *vect = *pvect;
1515 expr_history_def temp;
1516 bool res;
1517 int ind;
1518
1519 res = find_in_history_vect_1 (vect, uid, new_expr_vinsn, true, &ind);
1520
1521 if (res)
1522 {
1523 expr_history_def *phist = VEC_index (expr_history_def, vect, ind);
1524
1525 /* It is possible that speculation types of expressions that were
1526 propagated through different paths will be different here. In this
1527 case, merge the status to get the correct check later. */
1528 if (phist->spec_ds != spec_ds)
1529 phist->spec_ds = ds_max_merge (phist->spec_ds, spec_ds);
1530 return;
1531 }
1532
1533 temp.uid = uid;
1534 temp.old_expr_vinsn = old_expr_vinsn;
1535 temp.new_expr_vinsn = new_expr_vinsn;
1536 temp.spec_ds = spec_ds;
1537 temp.type = type;
1538
1539 vinsn_attach (old_expr_vinsn);
1540 vinsn_attach (new_expr_vinsn);
1541 VEC_safe_insert (expr_history_def, heap, vect, ind, &temp);
1542 *pvect = vect;
1543 }
1544
1545 /* Free history vector PVECT. */
1546 static void
1547 free_history_vect (VEC (expr_history_def, heap) **pvect)
1548 {
1549 unsigned i;
1550 expr_history_def *phist;
1551
1552 if (! *pvect)
1553 return;
1554
1555 for (i = 0;
1556 VEC_iterate (expr_history_def, *pvect, i, phist);
1557 i++)
1558 {
1559 vinsn_detach (phist->old_expr_vinsn);
1560 vinsn_detach (phist->new_expr_vinsn);
1561 }
1562
1563 VEC_free (expr_history_def, heap, *pvect);
1564 *pvect = NULL;
1565 }
1566
1567 /* Merge vector FROM to PVECT. */
1568 static void
1569 merge_history_vect (VEC (expr_history_def, heap) **pvect,
1570 VEC (expr_history_def, heap) *from)
1571 {
1572 expr_history_def *phist;
1573 int i;
1574
1575 /* We keep this vector sorted. */
1576 for (i = 0; VEC_iterate (expr_history_def, from, i, phist); i++)
1577 insert_in_history_vect (pvect, phist->uid, phist->type,
1578 phist->old_expr_vinsn, phist->new_expr_vinsn,
1579 phist->spec_ds);
1580 }
1581
1582 /* Compare two vinsns as rhses if possible and as vinsns otherwise. */
1583 bool
1584 vinsn_equal_p (vinsn_t x, vinsn_t y)
1585 {
1586 rtx_equal_p_callback_function repcf;
1587
1588 if (x == y)
1589 return true;
1590
1591 if (VINSN_TYPE (x) != VINSN_TYPE (y))
1592 return false;
1593
1594 if (VINSN_HASH (x) != VINSN_HASH (y))
1595 return false;
1596
1597 repcf = targetm.sched.skip_rtx_p ? skip_unspecs_callback : NULL;
1598 if (VINSN_SEPARABLE_P (x))
1599 {
1600 /* Compare RHSes of VINSNs. */
1601 gcc_assert (VINSN_RHS (x));
1602 gcc_assert (VINSN_RHS (y));
1603
1604 return rtx_equal_p_cb (VINSN_RHS (x), VINSN_RHS (y), repcf);
1605 }
1606
1607 return rtx_equal_p_cb (VINSN_PATTERN (x), VINSN_PATTERN (y), repcf);
1608 }
1609 \f
1610
1611 /* Functions for working with expressions. */
1612
1613 /* Initialize EXPR. */
1614 static void
1615 init_expr (expr_t expr, vinsn_t vi, int spec, int use, int priority,
1616 int sched_times, int orig_bb_index, ds_t spec_done_ds,
1617 ds_t spec_to_check_ds, int orig_sched_cycle,
1618 VEC(expr_history_def, heap) *history, signed char target_available,
1619 bool was_substituted, bool was_renamed, bool needs_spec_check_p,
1620 bool cant_move)
1621 {
1622 vinsn_attach (vi);
1623
1624 EXPR_VINSN (expr) = vi;
1625 EXPR_SPEC (expr) = spec;
1626 EXPR_USEFULNESS (expr) = use;
1627 EXPR_PRIORITY (expr) = priority;
1628 EXPR_PRIORITY_ADJ (expr) = 0;
1629 EXPR_SCHED_TIMES (expr) = sched_times;
1630 EXPR_ORIG_BB_INDEX (expr) = orig_bb_index;
1631 EXPR_ORIG_SCHED_CYCLE (expr) = orig_sched_cycle;
1632 EXPR_SPEC_DONE_DS (expr) = spec_done_ds;
1633 EXPR_SPEC_TO_CHECK_DS (expr) = spec_to_check_ds;
1634
1635 if (history)
1636 EXPR_HISTORY_OF_CHANGES (expr) = history;
1637 else
1638 EXPR_HISTORY_OF_CHANGES (expr) = NULL;
1639
1640 EXPR_TARGET_AVAILABLE (expr) = target_available;
1641 EXPR_WAS_SUBSTITUTED (expr) = was_substituted;
1642 EXPR_WAS_RENAMED (expr) = was_renamed;
1643 EXPR_NEEDS_SPEC_CHECK_P (expr) = needs_spec_check_p;
1644 EXPR_CANT_MOVE (expr) = cant_move;
1645 }
1646
1647 /* Make a copy of the expr FROM into the expr TO. */
1648 void
1649 copy_expr (expr_t to, expr_t from)
1650 {
1651 VEC(expr_history_def, heap) *temp = NULL;
1652
1653 if (EXPR_HISTORY_OF_CHANGES (from))
1654 {
1655 unsigned i;
1656 expr_history_def *phist;
1657
1658 temp = VEC_copy (expr_history_def, heap, EXPR_HISTORY_OF_CHANGES (from));
1659 for (i = 0;
1660 VEC_iterate (expr_history_def, temp, i, phist);
1661 i++)
1662 {
1663 vinsn_attach (phist->old_expr_vinsn);
1664 vinsn_attach (phist->new_expr_vinsn);
1665 }
1666 }
1667
1668 init_expr (to, EXPR_VINSN (from), EXPR_SPEC (from),
1669 EXPR_USEFULNESS (from), EXPR_PRIORITY (from),
1670 EXPR_SCHED_TIMES (from), EXPR_ORIG_BB_INDEX (from),
1671 EXPR_SPEC_DONE_DS (from), EXPR_SPEC_TO_CHECK_DS (from),
1672 EXPR_ORIG_SCHED_CYCLE (from), temp,
1673 EXPR_TARGET_AVAILABLE (from), EXPR_WAS_SUBSTITUTED (from),
1674 EXPR_WAS_RENAMED (from), EXPR_NEEDS_SPEC_CHECK_P (from),
1675 EXPR_CANT_MOVE (from));
1676 }
1677
1678 /* Same, but the final expr will never be in av sets, so don't copy
1679 "uninteresting" data such as bitmap cache. */
1680 void
1681 copy_expr_onside (expr_t to, expr_t from)
1682 {
1683 init_expr (to, EXPR_VINSN (from), EXPR_SPEC (from), EXPR_USEFULNESS (from),
1684 EXPR_PRIORITY (from), EXPR_SCHED_TIMES (from), 0,
1685 EXPR_SPEC_DONE_DS (from), EXPR_SPEC_TO_CHECK_DS (from), 0, NULL,
1686 EXPR_TARGET_AVAILABLE (from), EXPR_WAS_SUBSTITUTED (from),
1687 EXPR_WAS_RENAMED (from), EXPR_NEEDS_SPEC_CHECK_P (from),
1688 EXPR_CANT_MOVE (from));
1689 }
1690
1691 /* Prepare the expr of INSN for scheduling. Used when moving insn and when
1692 initializing new insns. */
1693 static void
1694 prepare_insn_expr (insn_t insn, int seqno)
1695 {
1696 expr_t expr = INSN_EXPR (insn);
1697 ds_t ds;
1698
1699 INSN_SEQNO (insn) = seqno;
1700 EXPR_ORIG_BB_INDEX (expr) = BLOCK_NUM (insn);
1701 EXPR_SPEC (expr) = 0;
1702 EXPR_ORIG_SCHED_CYCLE (expr) = 0;
1703 EXPR_WAS_SUBSTITUTED (expr) = 0;
1704 EXPR_WAS_RENAMED (expr) = 0;
1705 EXPR_TARGET_AVAILABLE (expr) = 1;
1706 INSN_LIVE_VALID_P (insn) = false;
1707
1708 /* ??? If this expression is speculative, make its dependence
1709 as weak as possible. We can filter this expression later
1710 in process_spec_exprs, because we do not distinguish
1711 between the status we got during compute_av_set and the
1712 existing status. To be fixed. */
1713 ds = EXPR_SPEC_DONE_DS (expr);
1714 if (ds)
1715 EXPR_SPEC_DONE_DS (expr) = ds_get_max_dep_weak (ds);
1716
1717 free_history_vect (&EXPR_HISTORY_OF_CHANGES (expr));
1718 }
1719
1720 /* Update target_available bits when merging exprs TO and FROM. SPLIT_POINT
1721 is non-null when expressions are merged from different successors at
1722 a split point. */
1723 static void
1724 update_target_availability (expr_t to, expr_t from, insn_t split_point)
1725 {
1726 if (EXPR_TARGET_AVAILABLE (to) < 0
1727 || EXPR_TARGET_AVAILABLE (from) < 0)
1728 EXPR_TARGET_AVAILABLE (to) = -1;
1729 else
1730 {
1731 /* We try to detect the case when one of the expressions
1732 can only be reached through another one. In this case,
1733 we can do better. */
1734 if (split_point == NULL)
1735 {
1736 int toind, fromind;
1737
1738 toind = EXPR_ORIG_BB_INDEX (to);
1739 fromind = EXPR_ORIG_BB_INDEX (from);
1740
1741 if (toind && toind == fromind)
1742 /* Do nothing -- everything is done in
1743 merge_with_other_exprs. */
1744 ;
1745 else
1746 EXPR_TARGET_AVAILABLE (to) = -1;
1747 }
1748 else
1749 EXPR_TARGET_AVAILABLE (to) &= EXPR_TARGET_AVAILABLE (from);
1750 }
1751 }
1752
1753 /* Update speculation bits when merging exprs TO and FROM. SPLIT_POINT
1754 is non-null when expressions are merged from different successors at
1755 a split point. */
1756 static void
1757 update_speculative_bits (expr_t to, expr_t from, insn_t split_point)
1758 {
1759 ds_t old_to_ds, old_from_ds;
1760
1761 old_to_ds = EXPR_SPEC_DONE_DS (to);
1762 old_from_ds = EXPR_SPEC_DONE_DS (from);
1763
1764 EXPR_SPEC_DONE_DS (to) = ds_max_merge (old_to_ds, old_from_ds);
1765 EXPR_SPEC_TO_CHECK_DS (to) |= EXPR_SPEC_TO_CHECK_DS (from);
1766 EXPR_NEEDS_SPEC_CHECK_P (to) |= EXPR_NEEDS_SPEC_CHECK_P (from);
1767
1768 /* When merging e.g. control & data speculative exprs, or a control
1769 speculative with a control&data speculative one, we really have
1770 to change vinsn too. Also, when speculative status is changed,
1771 we also need to record this as a transformation in expr's history. */
1772 if ((old_to_ds & SPECULATIVE) || (old_from_ds & SPECULATIVE))
1773 {
1774 old_to_ds = ds_get_speculation_types (old_to_ds);
1775 old_from_ds = ds_get_speculation_types (old_from_ds);
1776
1777 if (old_to_ds != old_from_ds)
1778 {
1779 ds_t record_ds;
1780
1781 /* When both expressions are speculative, we need to change
1782 the vinsn first. */
1783 if ((old_to_ds & SPECULATIVE) && (old_from_ds & SPECULATIVE))
1784 {
1785 int res;
1786
1787 res = speculate_expr (to, EXPR_SPEC_DONE_DS (to));
1788 gcc_assert (res >= 0);
1789 }
1790
1791 if (split_point != NULL)
1792 {
1793 /* Record the change with proper status. */
1794 record_ds = EXPR_SPEC_DONE_DS (to) & SPECULATIVE;
1795 record_ds &= ~(old_to_ds & SPECULATIVE);
1796 record_ds &= ~(old_from_ds & SPECULATIVE);
1797
1798 insert_in_history_vect (&EXPR_HISTORY_OF_CHANGES (to),
1799 INSN_UID (split_point), TRANS_SPECULATION,
1800 EXPR_VINSN (from), EXPR_VINSN (to),
1801 record_ds);
1802 }
1803 }
1804 }
1805 }
1806
1807
1808 /* Merge bits of FROM expr to TO expr. When SPLIT_POINT is not NULL,
1809 this is done along different paths. */
1810 void
1811 merge_expr_data (expr_t to, expr_t from, insn_t split_point)
1812 {
1813 /* Choose the maximum of the specs of merged exprs. This is required
1814 for correctness of bookkeeping. */
1815 if (EXPR_SPEC (to) < EXPR_SPEC (from))
1816 EXPR_SPEC (to) = EXPR_SPEC (from);
1817
1818 if (split_point)
1819 EXPR_USEFULNESS (to) += EXPR_USEFULNESS (from);
1820 else
1821 EXPR_USEFULNESS (to) = MAX (EXPR_USEFULNESS (to),
1822 EXPR_USEFULNESS (from));
1823
1824 if (EXPR_PRIORITY (to) < EXPR_PRIORITY (from))
1825 EXPR_PRIORITY (to) = EXPR_PRIORITY (from);
1826
1827 if (EXPR_SCHED_TIMES (to) > EXPR_SCHED_TIMES (from))
1828 EXPR_SCHED_TIMES (to) = EXPR_SCHED_TIMES (from);
1829
1830 if (EXPR_ORIG_BB_INDEX (to) != EXPR_ORIG_BB_INDEX (from))
1831 EXPR_ORIG_BB_INDEX (to) = 0;
1832
1833 EXPR_ORIG_SCHED_CYCLE (to) = MIN (EXPR_ORIG_SCHED_CYCLE (to),
1834 EXPR_ORIG_SCHED_CYCLE (from));
1835
1836 EXPR_WAS_SUBSTITUTED (to) |= EXPR_WAS_SUBSTITUTED (from);
1837 EXPR_WAS_RENAMED (to) |= EXPR_WAS_RENAMED (from);
1838 EXPR_CANT_MOVE (to) |= EXPR_CANT_MOVE (from);
1839
1840 merge_history_vect (&EXPR_HISTORY_OF_CHANGES (to),
1841 EXPR_HISTORY_OF_CHANGES (from));
1842 update_target_availability (to, from, split_point);
1843 update_speculative_bits (to, from, split_point);
1844 }
1845
1846 /* Merge bits of FROM expr to TO expr. Vinsns in the exprs should be equal
1847 in terms of vinsn_equal_p. SPLIT_POINT is non-null when expressions
1848 are merged from different successors at a split point. */
1849 void
1850 merge_expr (expr_t to, expr_t from, insn_t split_point)
1851 {
1852 vinsn_t to_vi = EXPR_VINSN (to);
1853 vinsn_t from_vi = EXPR_VINSN (from);
1854
1855 gcc_assert (vinsn_equal_p (to_vi, from_vi));
1856
1857 /* Make sure that speculative pattern is propagated into exprs that
1858 have non-speculative one. This will provide us with consistent
1859 speculative bits and speculative patterns inside expr. */
1860 if (EXPR_SPEC_DONE_DS (to) == 0
1861 && EXPR_SPEC_DONE_DS (from) != 0)
1862 change_vinsn_in_expr (to, EXPR_VINSN (from));
1863
1864 merge_expr_data (to, from, split_point);
1865 gcc_assert (EXPR_USEFULNESS (to) <= REG_BR_PROB_BASE);
1866 }
1867
1868 /* Clear the information of this EXPR. */
1869 void
1870 clear_expr (expr_t expr)
1871 {
1872
1873 vinsn_detach (EXPR_VINSN (expr));
1874 EXPR_VINSN (expr) = NULL;
1875
1876 free_history_vect (&EXPR_HISTORY_OF_CHANGES (expr));
1877 }
1878
1879 /* For a given LV_SET, mark EXPR as having an unavailable target register.  */
1880 static void
1881 set_unavailable_target_for_expr (expr_t expr, regset lv_set)
1882 {
1883 if (EXPR_SEPARABLE_P (expr))
1884 {
1885 if (REG_P (EXPR_LHS (expr))
1886 && register_unavailable_p (lv_set, EXPR_LHS (expr)))
1887 {
1888 /* If it's an insn like r1 = use (r1, ...), and it exists in
1889 different forms in each of the av_sets being merged, we can't say
1890 whether original destination register is available or not.
1891 However, this still works if destination register is not used
1892             in the original expression: if the branch whose LV_SET we're
1893             looking at here is not actually the 'other branch' in the sense that
1894             the same expression is available through it (but this can't be
1895             determined at computation stage because of transformations on one of
1896             the branches), it still won't affect the availability.
1897             Liveness of a register somewhere on a code motion path means
1898             it's either read somewhere on a code motion path, live on
1899 'other' branch, live at the point immediately following
1900 the original operation, or is read by the original operation.
1901 The latter case is filtered out in the condition below.
1902             It still doesn't cover the case when a register is defined and used
1903             somewhere within the code motion path, and in this case we could
1904             miss a unifying code motion along both branches using a renamed
1905             register, but it won't affect code correctness since upon
1906             an actual code motion bookkeeping code would be generated.  */
1907 if (register_unavailable_p (VINSN_REG_USES (EXPR_VINSN (expr)),
1908 EXPR_LHS (expr)))
1909 EXPR_TARGET_AVAILABLE (expr) = -1;
1910 else
1911 EXPR_TARGET_AVAILABLE (expr) = false;
1912 }
1913 }
1914 else
1915 {
1916 unsigned regno;
1917 reg_set_iterator rsi;
1918
1919 EXECUTE_IF_SET_IN_REG_SET (VINSN_REG_SETS (EXPR_VINSN (expr)),
1920 0, regno, rsi)
1921 if (bitmap_bit_p (lv_set, regno))
1922 {
1923 EXPR_TARGET_AVAILABLE (expr) = false;
1924 break;
1925 }
1926
1927 EXECUTE_IF_SET_IN_REG_SET (VINSN_REG_CLOBBERS (EXPR_VINSN (expr)),
1928 0, regno, rsi)
1929 if (bitmap_bit_p (lv_set, regno))
1930 {
1931 EXPR_TARGET_AVAILABLE (expr) = false;
1932 break;
1933 }
1934 }
1935 }
1936
1937 /* Try to make EXPR speculative.  Return 1 when EXPR's pattern or dependence
1938    status have changed, 2 when also the target register became unavailable,
1939    0 if nothing had to be changed, and -1 when speculation is not possible.  */
1940 int
1941 speculate_expr (expr_t expr, ds_t ds)
1942 {
1943 int res;
1944 rtx orig_insn_rtx;
1945 rtx spec_pat;
1946 ds_t target_ds, current_ds;
1947
1948 /* Obtain the status we need to put on EXPR. */
1949 target_ds = (ds & SPECULATIVE);
1950 current_ds = EXPR_SPEC_DONE_DS (expr);
1951 ds = ds_full_merge (current_ds, target_ds, NULL_RTX, NULL_RTX);
1952
1953 orig_insn_rtx = EXPR_INSN_RTX (expr);
1954
1955 res = sched_speculate_insn (orig_insn_rtx, ds, &spec_pat);
1956
1957 switch (res)
1958 {
1959 case 0:
1960 EXPR_SPEC_DONE_DS (expr) = ds;
1961 return current_ds != ds ? 1 : 0;
1962
1963 case 1:
1964 {
1965 rtx spec_insn_rtx = create_insn_rtx_from_pattern (spec_pat, NULL_RTX);
1966 vinsn_t spec_vinsn = create_vinsn_from_insn_rtx (spec_insn_rtx, false);
1967
1968 change_vinsn_in_expr (expr, spec_vinsn);
1969 EXPR_SPEC_DONE_DS (expr) = ds;
1970 EXPR_NEEDS_SPEC_CHECK_P (expr) = true;
1971
1972 /* Do not allow clobbering the address register of speculative
1973 insns. */
1974 if (register_unavailable_p (VINSN_REG_USES (EXPR_VINSN (expr)),
1975 expr_dest_reg (expr)))
1976 {
1977 EXPR_TARGET_AVAILABLE (expr) = false;
1978 return 2;
1979 }
1980
1981 return 1;
1982 }
1983
1984 case -1:
1985 return -1;
1986
1987 default:
1988 gcc_unreachable ();
1989 return -1;
1990 }
1991 }
1992
1993 /* Return the destination register of EXPR, if any, or NULL_RTX. */
1994 rtx
1995 expr_dest_reg (expr_t expr)
1996 {
1997 rtx dest = VINSN_LHS (EXPR_VINSN (expr));
1998
1999 if (dest != NULL_RTX && REG_P (dest))
2000 return dest;
2001
2002 return NULL_RTX;
2003 }
2004
2005 /* Return the REGNO of EXPR's destination. */
2006 unsigned
2007 expr_dest_regno (expr_t expr)
2008 {
2009 rtx dest = expr_dest_reg (expr);
2010
2011 gcc_assert (dest != NULL_RTX);
2012 return REGNO (dest);
2013 }
2014
2015 /* For a given LV_SET, mark all expressions that are in JOIN_SET but not
2016 in AV_SET as having an unavailable target register. */
2017 void
2018 mark_unavailable_targets (av_set_t join_set, av_set_t av_set, regset lv_set)
2019 {
2020 expr_t expr;
2021 av_set_iterator avi;
2022
2023 FOR_EACH_EXPR (expr, avi, join_set)
2024 if (av_set_lookup (av_set, EXPR_VINSN (expr)) == NULL)
2025 set_unavailable_target_for_expr (expr, lv_set);
2026 }
2027 \f
2028
2029 /* Returns true if REG (at least partially) is present in REGS. */
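/* For a hard register spanning several regnos (e.g., illustratively, a
   multi-word value occupying regnos 10 and 11), the loop below reports
   unavailability if any of those regnos is set in REGS -- hence the
   "at least partially" above.  */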
2030 bool
2031 register_unavailable_p (regset regs, rtx reg)
2032 {
2033 unsigned regno, end_regno;
2034
2035 regno = REGNO (reg);
2036 if (bitmap_bit_p (regs, regno))
2037 return true;
2038
2039 end_regno = END_REGNO (reg);
2040
2041 while (++regno < end_regno)
2042 if (bitmap_bit_p (regs, regno))
2043 return true;
2044
2045 return false;
2046 }
2047
2048 /* Av set functions. */
2049
2050 /* Add a new element to av set SETP.
2051 Return the element added. */
2052 static av_set_t
2053 av_set_add_element (av_set_t *setp)
2054 {
2055 /* Insert at the beginning of the list. */
2056 _list_add (setp);
2057 return *setp;
2058 }
2059
2060 /* Add EXPR to SETP. */
2061 void
2062 av_set_add (av_set_t *setp, expr_t expr)
2063 {
2064 av_set_t elem;
2065
2066 gcc_assert (!INSN_NOP_P (EXPR_INSN_RTX (expr)));
2067 elem = av_set_add_element (setp);
2068 copy_expr (_AV_SET_EXPR (elem), expr);
2069 }
2070
2071 /* Same, but do not copy EXPR. */
2072 static void
2073 av_set_add_nocopy (av_set_t *setp, expr_t expr)
2074 {
2075 av_set_t elem;
2076
2077 elem = av_set_add_element (setp);
2078 *_AV_SET_EXPR (elem) = *expr;
2079 }
2080
2081 /* Remove expr pointed to by IP from the av_set. */
2082 void
2083 av_set_iter_remove (av_set_iterator *ip)
2084 {
2085 clear_expr (_AV_SET_EXPR (*ip->lp));
2086 _list_iter_remove (ip);
2087 }
2088
2089 /* Search for an expr in SET that is equivalent to SOUGHT_VINSN in the
2090 sense of the vinsn_equal_p function. Return NULL if no such expr
2091 is found in SET. */
2092 expr_t
2093 av_set_lookup (av_set_t set, vinsn_t sought_vinsn)
2094 {
2095 expr_t expr;
2096 av_set_iterator i;
2097
2098 FOR_EACH_EXPR (expr, i, set)
2099 if (vinsn_equal_p (EXPR_VINSN (expr), sought_vinsn))
2100 return expr;
2101 return NULL;
2102 }
2103
2104 /* Same, but also remove the EXPR found. */
2105 static expr_t
2106 av_set_lookup_and_remove (av_set_t *setp, vinsn_t sought_vinsn)
2107 {
2108 expr_t expr;
2109 av_set_iterator i;
2110
2111 FOR_EACH_EXPR_1 (expr, i, setp)
2112 if (vinsn_equal_p (EXPR_VINSN (expr), sought_vinsn))
2113 {
2114 _list_iter_remove_nofree (&i);
2115 return expr;
2116 }
2117 return NULL;
2118 }
2119
2120 /* Search for an expr in SET whose vinsn is equivalent to EXPR's vinsn
2121 in the sense of the vinsn_equal_p function, but which is not EXPR
2122 itself. Return NULL if no such expr is found in SET. */
2123 static expr_t
2124 av_set_lookup_other_equiv_expr (av_set_t set, expr_t expr)
2125 {
2126 expr_t cur_expr;
2127 av_set_iterator i;
2128
2129 FOR_EACH_EXPR (cur_expr, i, set)
2130 {
2131 if (cur_expr == expr)
2132 continue;
2133 if (vinsn_equal_p (EXPR_VINSN (cur_expr), EXPR_VINSN (expr)))
2134 return cur_expr;
2135 }
2136
2137 return NULL;
2138 }
2139
2140 /* If an equivalent expression is already in AVP, merge the two, remove EXPR, and return the one that remains; otherwise return EXPR. */
2141 expr_t
2142 merge_with_other_exprs (av_set_t *avp, av_set_iterator *ip, expr_t expr)
2143 {
2144 expr_t expr2;
2145
2146 expr2 = av_set_lookup_other_equiv_expr (*avp, expr);
2147 if (expr2 != NULL)
2148 {
2149 /* Reset target availability on merge, since taking it only from one
2150 of the exprs would be controversial for different code. */
2151 EXPR_TARGET_AVAILABLE (expr2) = -1;
2152 EXPR_USEFULNESS (expr2) = 0;
2153
2154 merge_expr (expr2, expr, NULL);
2155
2156 /* Fix usefulness, as it should now be REG_BR_PROB_BASE. */
2157 EXPR_USEFULNESS (expr2) = REG_BR_PROB_BASE;
2158
2159 av_set_iter_remove (ip);
2160 return expr2;
2161 }
2162
2163 return expr;
2164 }
2165
2166 /* Return true if there is an expr that correlates to VI in SET. */
2167 bool
2168 av_set_is_in_p (av_set_t set, vinsn_t vi)
2169 {
2170 return av_set_lookup (set, vi) != NULL;
2171 }
2172
2173 /* Return a copy of SET. */
2174 av_set_t
2175 av_set_copy (av_set_t set)
2176 {
2177 expr_t expr;
2178 av_set_iterator i;
2179 av_set_t res = NULL;
2180
2181 FOR_EACH_EXPR (expr, i, set)
2182 av_set_add (&res, expr);
2183
2184 return res;
2185 }
2186
2187 /* Join two av sets that have no common elements by attaching the second
2188 set (pointed to by FROMP) to the end of the first set (TO_TAILP must
2189 point to the _AV_SET_NEXT of the first set's last element). */
2190 static void
2191 join_distinct_sets (av_set_t *to_tailp, av_set_t *fromp)
2192 {
2193 gcc_assert (*to_tailp == NULL);
2194 *to_tailp = *fromp;
2195 *fromp = NULL;
2196 }
2197
2198 /* Make the set pointed to by TOP the union of TOP and FROMP, merging
2199 expressions present in both. Clear the av_set pointed to by FROMP afterwards. */
2200 void
2201 av_set_union_and_clear (av_set_t *top, av_set_t *fromp, insn_t insn)
2202 {
2203 expr_t expr1;
2204 av_set_iterator i;
2205
2206 /* Delete from TOP all exprs that are also present in FROMP, merging them into the FROMP copies first. */
2207 FOR_EACH_EXPR_1 (expr1, i, top)
2208 {
2209 expr_t expr2 = av_set_lookup (*fromp, EXPR_VINSN (expr1));
2210
2211 if (expr2)
2212 {
2213 merge_expr (expr2, expr1, insn);
2214 av_set_iter_remove (&i);
2215 }
2216 }
2217
2218 join_distinct_sets (i.lp, fromp);
2219 }
2220
2221 /* Same as above, but also update the availability of the target registers,
2222 judging by TO_LV_SET and FROM_LV_SET. */
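/* Roughly, the expressions fall into three groups: those present in both
   sets are merged and collected in IN_BOTH_SET; those only in TOP are
   checked against FROM_LV_SET; those only in FROMP are checked against
   TO_LV_SET.  The groups are then chained back into a single set.  */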
2223 void
2224 av_set_union_and_live (av_set_t *top, av_set_t *fromp, regset to_lv_set,
2225 regset from_lv_set, insn_t insn)
2226 {
2227 expr_t expr1;
2228 av_set_iterator i;
2229 av_set_t *to_tailp, in_both_set = NULL;
2230
2231 /* Delete from TOP all exprs that are also present in FROMP. */
2232 FOR_EACH_EXPR_1 (expr1, i, top)
2233 {
2234 expr_t expr2 = av_set_lookup_and_remove (fromp, EXPR_VINSN (expr1));
2235
2236 if (expr2)
2237 {
2238 /* It may be that the expressions have different destination
2239 registers, in which case we need to check liveness here. */
2240 if (EXPR_SEPARABLE_P (expr1))
2241 {
2242 int regno1 = (REG_P (EXPR_LHS (expr1))
2243 ? (int) expr_dest_regno (expr1) : -1);
2244 int regno2 = (REG_P (EXPR_LHS (expr2))
2245 ? (int) expr_dest_regno (expr2) : -1);
2246
2247 /* ??? We don't have a way to check restrictions for
2248 *other* register on the current path, we did it only
2249 for the current target register. Give up. */
2250 if (regno1 != regno2)
2251 EXPR_TARGET_AVAILABLE (expr2) = -1;
2252 }
2253 else if (EXPR_INSN_RTX (expr1) != EXPR_INSN_RTX (expr2))
2254 EXPR_TARGET_AVAILABLE (expr2) = -1;
2255
2256 merge_expr (expr2, expr1, insn);
2257 av_set_add_nocopy (&in_both_set, expr2);
2258 av_set_iter_remove (&i);
2259 }
2260 else
2261 /* EXPR1 is present in TOP, but not in FROMP. Check it on
2262 FROM_LV_SET. */
2263 set_unavailable_target_for_expr (expr1, from_lv_set);
2264 }
2265 to_tailp = i.lp;
2266
2267 /* These expressions are not present in TOP. Check liveness
2268 restrictions on TO_LV_SET. */
2269 FOR_EACH_EXPR (expr1, i, *fromp)
2270 set_unavailable_target_for_expr (expr1, to_lv_set);
2271
2272 join_distinct_sets (i.lp, &in_both_set);
2273 join_distinct_sets (to_tailp, fromp);
2274 }
2275
2276 /* Clear av_set pointed to by SETP. */
2277 void
2278 av_set_clear (av_set_t *setp)
2279 {
2280 expr_t expr;
2281 av_set_iterator i;
2282
2283 FOR_EACH_EXPR_1 (expr, i, setp)
2284 av_set_iter_remove (&i);
2285
2286 gcc_assert (*setp == NULL);
2287 }
2288
2289 /* Leave only one non-speculative element in the set pointed to by SETP. */
2290 void
2291 av_set_leave_one_nonspec (av_set_t *setp)
2292 {
2293 expr_t expr;
2294 av_set_iterator i;
2295 bool has_one_nonspec = false;
2296
2297 /* Keep all speculative exprs, and leave one non-speculative
2298 (the first one). */
2299 FOR_EACH_EXPR_1 (expr, i, setp)
2300 {
2301 if (!EXPR_SPEC_DONE_DS (expr))
2302 {
2303 if (has_one_nonspec)
2304 av_set_iter_remove (&i);
2305 else
2306 has_one_nonspec = true;
2307 }
2308 }
2309 }
2310
2311 /* Return the N'th element of the SET. */
2312 expr_t
2313 av_set_element (av_set_t set, int n)
2314 {
2315 expr_t expr;
2316 av_set_iterator i;
2317
2318 FOR_EACH_EXPR (expr, i, set)
2319 if (n-- == 0)
2320 return expr;
2321
2322 gcc_unreachable ();
2323 return NULL;
2324 }
2325
2326 /* Deletes all expressions from AVP that are conditional branches (IFs). */
2327 void
2328 av_set_substract_cond_branches (av_set_t *avp)
2329 {
2330 av_set_iterator i;
2331 expr_t expr;
2332
2333 FOR_EACH_EXPR_1 (expr, i, avp)
2334 if (vinsn_cond_branch_p (EXPR_VINSN (expr)))
2335 av_set_iter_remove (&i);
2336 }
2337
2338 /* Multiply the usefulness attribute of each member of av-set AV by
2339 PROB / ALL_PROB (or zero it when ALL_PROB is 0). */
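/* For example (illustrative numbers), with PROB = 50 and ALL_PROB = 100 an
   expr whose usefulness is REG_BR_PROB_BASE ends up with usefulness
   REG_BR_PROB_BASE / 2; when ALL_PROB is 0, usefulness is simply zeroed.  */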
2340 void
2341 av_set_split_usefulness (av_set_t av, int prob, int all_prob)
2342 {
2343 av_set_iterator i;
2344 expr_t expr;
2345
2346 FOR_EACH_EXPR (expr, i, av)
2347 EXPR_USEFULNESS (expr) = (all_prob
2348 ? (EXPR_USEFULNESS (expr) * prob) / all_prob
2349 : 0);
2350 }
2351
2352 /* Leave in *AVP only those expressions that are also present in AV,
2353 merging the history of transformations for the expressions kept. */
2354 void
2355 av_set_code_motion_filter (av_set_t *avp, av_set_t av)
2356 {
2357 av_set_iterator i;
2358 expr_t expr, expr2;
2359
2360 FOR_EACH_EXPR_1 (expr, i, avp)
2361 if ((expr2 = av_set_lookup (av, EXPR_VINSN (expr))) == NULL)
2362 av_set_iter_remove (&i);
2363 else
2364 /* When updating av sets in bookkeeping blocks, we can add more insns
2365 there which will be transformed but the upper av sets will not
2366 reflect those transformations. We then fail to undo those
2367 when searching for such insns. So merge the history saved
2368 in the av set of the block we are processing. */
2369 merge_history_vect (&EXPR_HISTORY_OF_CHANGES (expr),
2370 EXPR_HISTORY_OF_CHANGES (expr2));
2371 }
2372
2373 \f
2374
2375 /* Dependence hooks to initialize insn data. */
2376
2377 /* This is used in hooks callable from dependence analysis when initializing
2378 instruction's data. */
2379 static struct
2380 {
2381 /* Where the dependence was found (lhs/rhs). */
2382 deps_where_t where;
2383
2384 /* The actual data object to initialize. */
2385 idata_t id;
2386
2387 /* True when the insn should not be made clonable. */
2388 bool force_unique_p;
2389
2390 /* True when insn should be treated as of type USE, i.e. never renamed. */
2391 bool force_use_p;
2392 } deps_init_id_data;
2393
2394
2395 /* Setup ID for INSN. FORCE_UNIQUE_P is true when INSN should not be
2396 clonable. */
2397 static void
2398 setup_id_for_insn (idata_t id, insn_t insn, bool force_unique_p)
2399 {
2400 int type;
2401
2402 /* Determine whether INSN can be cloned and choose the appropriate vinsn type.
2403 Clonable insns that can be separated into lhs and rhs have type SET.
2404 Other clonable insns have type USE. */
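   /* An illustrative summary of the cases handled below: a regular insn
      that is not forced unique gets type SET, a simplejump gets type PC,
      a debug insn gets USE (or INSN when forced unique), and anything
      else keeps its GET_CODE value.  */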
2405 type = GET_CODE (insn);
2406
2407 /* Only regular insns could be cloned. */
2408 if (type == INSN && !force_unique_p)
2409 type = SET;
2410 else if (type == JUMP_INSN && simplejump_p (insn))
2411 type = PC;
2412 else if (type == DEBUG_INSN)
2413 type = !force_unique_p ? USE : INSN;
2414
2415 IDATA_TYPE (id) = type;
2416 IDATA_REG_SETS (id) = get_clear_regset_from_pool ();
2417 IDATA_REG_USES (id) = get_clear_regset_from_pool ();
2418 IDATA_REG_CLOBBERS (id) = get_clear_regset_from_pool ();
2419 }
2420
2421 /* Start initializing insn data. */
2422 static void
2423 deps_init_id_start_insn (insn_t insn)
2424 {
2425 gcc_assert (deps_init_id_data.where == DEPS_IN_NOWHERE);
2426
2427 setup_id_for_insn (deps_init_id_data.id, insn,
2428 deps_init_id_data.force_unique_p);
2429 deps_init_id_data.where = DEPS_IN_INSN;
2430 }
2431
2432 /* Start initializing lhs data. */
2433 static void
2434 deps_init_id_start_lhs (rtx lhs)
2435 {
2436 gcc_assert (deps_init_id_data.where == DEPS_IN_INSN);
2437 gcc_assert (IDATA_LHS (deps_init_id_data.id) == NULL);
2438
2439 if (IDATA_TYPE (deps_init_id_data.id) == SET)
2440 {
2441 IDATA_LHS (deps_init_id_data.id) = lhs;
2442 deps_init_id_data.where = DEPS_IN_LHS;
2443 }
2444 }
2445
2446 /* Finish initializing lhs data. */
2447 static void
2448 deps_init_id_finish_lhs (void)
2449 {
2450 deps_init_id_data.where = DEPS_IN_INSN;
2451 }
2452
2453 /* Note a set of REGNO. */
2454 static void
2455 deps_init_id_note_reg_set (int regno)
2456 {
2457 haifa_note_reg_set (regno);
2458
2459 if (deps_init_id_data.where == DEPS_IN_RHS)
2460 deps_init_id_data.force_use_p = true;
2461
2462 if (IDATA_TYPE (deps_init_id_data.id) != PC)
2463 SET_REGNO_REG_SET (IDATA_REG_SETS (deps_init_id_data.id), regno);
2464
2465 #ifdef STACK_REGS
2466 /* Make instructions that set stack registers to be ineligible for
2467 renaming to avoid issues with find_used_regs. */
2468 if (IN_RANGE (regno, FIRST_STACK_REG, LAST_STACK_REG))
2469 deps_init_id_data.force_use_p = true;
2470 #endif
2471 }
2472
2473 /* Note a clobber of REGNO. */
2474 static void
2475 deps_init_id_note_reg_clobber (int regno)
2476 {
2477 haifa_note_reg_clobber (regno);
2478
2479 if (deps_init_id_data.where == DEPS_IN_RHS)
2480 deps_init_id_data.force_use_p = true;
2481
2482 if (IDATA_TYPE (deps_init_id_data.id) != PC)
2483 SET_REGNO_REG_SET (IDATA_REG_CLOBBERS (deps_init_id_data.id), regno);
2484 }
2485
2486 /* Note a use of REGNO. */
2487 static void
2488 deps_init_id_note_reg_use (int regno)
2489 {
2490 haifa_note_reg_use (regno);
2491
2492 if (IDATA_TYPE (deps_init_id_data.id) != PC)
2493 SET_REGNO_REG_SET (IDATA_REG_USES (deps_init_id_data.id), regno);
2494 }
2495
2496 /* Start initializing rhs data. */
2497 static void
2498 deps_init_id_start_rhs (rtx rhs)
2499 {
2500 gcc_assert (deps_init_id_data.where == DEPS_IN_INSN);
2501
2502 /* And there was no sel_deps_reset_to_insn (). */
2503 if (IDATA_LHS (deps_init_id_data.id) != NULL)
2504 {
2505 IDATA_RHS (deps_init_id_data.id) = rhs;
2506 deps_init_id_data.where = DEPS_IN_RHS;
2507 }
2508 }
2509
2510 /* Finish initializing rhs data. */
2511 static void
2512 deps_init_id_finish_rhs (void)
2513 {
2514 gcc_assert (deps_init_id_data.where == DEPS_IN_RHS
2515 || deps_init_id_data.where == DEPS_IN_INSN);
2516 deps_init_id_data.where = DEPS_IN_INSN;
2517 }
2518
2519 /* Finish initializing insn data. */
2520 static void
2521 deps_init_id_finish_insn (void)
2522 {
2523 gcc_assert (deps_init_id_data.where == DEPS_IN_INSN);
2524
2525 if (IDATA_TYPE (deps_init_id_data.id) == SET)
2526 {
2527 rtx lhs = IDATA_LHS (deps_init_id_data.id);
2528 rtx rhs = IDATA_RHS (deps_init_id_data.id);
2529
2530 if (lhs == NULL || rhs == NULL || !lhs_and_rhs_separable_p (lhs, rhs)
2531 || deps_init_id_data.force_use_p)
2532 {
2533 /* This should be a USE, as we don't want to schedule its RHS
2534 separately. However, we still want to have them recorded
2535 for the purposes of substitution. That's why we don't
2536 simply call downgrade_to_use () here. */
2537 gcc_assert (IDATA_TYPE (deps_init_id_data.id) == SET);
2538 gcc_assert (!lhs == !rhs);
2539
2540 IDATA_TYPE (deps_init_id_data.id) = USE;
2541 }
2542 }
2543
2544 deps_init_id_data.where = DEPS_IN_NOWHERE;
2545 }
2546
2547 /* This is dependence info used for initializing insn's data. */
2548 static struct sched_deps_info_def deps_init_id_sched_deps_info;
2549
2550 /* This initializes most of the static part of the above structure. */
2551 static const struct sched_deps_info_def const_deps_init_id_sched_deps_info =
2552 {
2553 NULL,
2554
2555 deps_init_id_start_insn,
2556 deps_init_id_finish_insn,
2557 deps_init_id_start_lhs,
2558 deps_init_id_finish_lhs,
2559 deps_init_id_start_rhs,
2560 deps_init_id_finish_rhs,
2561 deps_init_id_note_reg_set,
2562 deps_init_id_note_reg_clobber,
2563 deps_init_id_note_reg_use,
2564 NULL, /* note_mem_dep */
2565 NULL, /* note_dep */
2566
2567 0, /* use_cselib */
2568 0, /* use_deps_list */
2569 0 /* generate_spec_deps */
2570 };
2571
2572 /* Initialize INSN's lhs and rhs in ID. When FORCE_UNIQUE_P is true,
2573 we don't actually need information about lhs and rhs. */
2574 static void
2575 setup_id_lhs_rhs (idata_t id, insn_t insn, bool force_unique_p)
2576 {
2577 rtx pat = PATTERN (insn);
2578
2579 if (NONJUMP_INSN_P (insn)
2580 && GET_CODE (pat) == SET
2581 && !force_unique_p)
2582 {
2583 IDATA_RHS (id) = SET_SRC (pat);
2584 IDATA_LHS (id) = SET_DEST (pat);
2585 }
2586 else
2587 IDATA_LHS (id) = IDATA_RHS (id) = NULL;
2588 }
2589
2590 /* Possibly downgrade INSN to USE. */
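/* A sketch of the conditions, judging by the code below: the downgrade
   happens when there is no separable lhs/rhs pair, when the rhs mentions
   a location changed by a pre/post-modify def, or (with STACK_REGS) when
   the insn writes a stack register.  */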
2591 static void
2592 maybe_downgrade_id_to_use (idata_t id, insn_t insn)
2593 {
2594 bool must_be_use = false;
2595 unsigned uid = INSN_UID (insn);
2596 df_ref *rec;
2597 rtx lhs = IDATA_LHS (id);
2598 rtx rhs = IDATA_RHS (id);
2599
2600 /* We downgrade only SETs. */
2601 if (IDATA_TYPE (id) != SET)
2602 return;
2603
2604 if (!lhs || !lhs_and_rhs_separable_p (lhs, rhs))
2605 {
2606 IDATA_TYPE (id) = USE;
2607 return;
2608 }
2609
2610 for (rec = DF_INSN_UID_DEFS (uid); *rec; rec++)
2611 {
2612 df_ref def = *rec;
2613
2614 if (DF_REF_INSN (def)
2615 && DF_REF_FLAGS_IS_SET (def, DF_REF_PRE_POST_MODIFY)
2616 && loc_mentioned_in_p (DF_REF_LOC (def), IDATA_RHS (id)))
2617 {
2618 must_be_use = true;
2619 break;
2620 }
2621
2622 #ifdef STACK_REGS
2623 /* Make instructions that set stack registers to be ineligible for
2624 renaming to avoid issues with find_used_regs. */
2625 if (IN_RANGE (DF_REF_REGNO (def), FIRST_STACK_REG, LAST_STACK_REG))
2626 {
2627 must_be_use = true;
2628 break;
2629 }
2630 #endif
2631 }
2632
2633 if (must_be_use)
2634 IDATA_TYPE (id) = USE;
2635 }
2636
2637 /* Setup register sets describing INSN in ID. */
2638 static void
2639 setup_id_reg_sets (idata_t id, insn_t insn)
2640 {
2641 unsigned uid = INSN_UID (insn);
2642 df_ref *rec;
2643 regset tmp = get_clear_regset_from_pool ();
2644
2645 for (rec = DF_INSN_UID_DEFS (uid); *rec; rec++)
2646 {
2647 df_ref def = *rec;
2648 unsigned int regno = DF_REF_REGNO (def);
2649
2650 /* Post modifies are treated like clobbers by sched-deps.c. */
2651 if (DF_REF_FLAGS_IS_SET (def, (DF_REF_MUST_CLOBBER
2652 | DF_REF_PRE_POST_MODIFY)))
2653 SET_REGNO_REG_SET (IDATA_REG_CLOBBERS (id), regno);
2654 else if (! DF_REF_FLAGS_IS_SET (def, DF_REF_MAY_CLOBBER))
2655 {
2656 SET_REGNO_REG_SET (IDATA_REG_SETS (id), regno);
2657
2658 #ifdef STACK_REGS
2659 /* For stack registers, treat writes to them as writes
2660 to the first one to be consistent with sched-deps.c. */
2661 if (IN_RANGE (regno, FIRST_STACK_REG, LAST_STACK_REG))
2662 SET_REGNO_REG_SET (IDATA_REG_SETS (id), FIRST_STACK_REG);
2663 #endif
2664 }
2665 /* Mark special refs that generate read/write def pair. */
2666 if (DF_REF_FLAGS_IS_SET (def, DF_REF_CONDITIONAL)
2667 || regno == STACK_POINTER_REGNUM)
2668 bitmap_set_bit (tmp, regno);
2669 }
2670
2671 for (rec = DF_INSN_UID_USES (uid); *rec; rec++)
2672 {
2673 df_ref use = *rec;
2674 unsigned int regno = DF_REF_REGNO (use);
2675
2676 /* When these refs are met for the first time, skip them, as
2677 these uses are just counterparts of some defs. */
2678 if (bitmap_bit_p (tmp, regno))
2679 bitmap_clear_bit (tmp, regno);
2680 else if (! DF_REF_FLAGS_IS_SET (use, DF_REF_CALL_STACK_USAGE))
2681 {
2682 SET_REGNO_REG_SET (IDATA_REG_USES (id), regno);
2683
2684 #ifdef STACK_REGS
2685 /* For stack registers, treat reads from them as reads from
2686 the first one to be consistent with sched-deps.c. */
2687 if (IN_RANGE (regno, FIRST_STACK_REG, LAST_STACK_REG))
2688 SET_REGNO_REG_SET (IDATA_REG_USES (id), FIRST_STACK_REG);
2689 #endif
2690 }
2691 }
2692
2693 return_regset_to_pool (tmp);
2694 }
2695
2696 /* Initialize instruction data for INSN in ID using DF's data. */
2697 static void
2698 init_id_from_df (idata_t id, insn_t insn, bool force_unique_p)
2699 {
2700 gcc_assert (DF_INSN_UID_SAFE_GET (INSN_UID (insn)) != NULL);
2701
2702 setup_id_for_insn (id, insn, force_unique_p);
2703 setup_id_lhs_rhs (id, insn, force_unique_p);
2704
2705 if (INSN_NOP_P (insn))
2706 return;
2707
2708 maybe_downgrade_id_to_use (id, insn);
2709 setup_id_reg_sets (id, insn);
2710 }
2711
2712 /* Initialize instruction data for INSN in ID. */
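/* This works by temporarily installing the deps_init_id_* hooks above as
   the active sched_deps_info and running the generic dependence analyzer
   over INSN; as a side effect the hooks record INSN's type, lhs/rhs and
   register sets into ID.  */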
2713 static void
2714 deps_init_id (idata_t id, insn_t insn, bool force_unique_p)
2715 {
2716 struct deps_desc _dc, *dc = &_dc;
2717
2718 deps_init_id_data.where = DEPS_IN_NOWHERE;
2719 deps_init_id_data.id = id;
2720 deps_init_id_data.force_unique_p = force_unique_p;
2721 deps_init_id_data.force_use_p = false;
2722
2723 init_deps (dc, false);
2724
2725 memcpy (&deps_init_id_sched_deps_info,
2726 &const_deps_init_id_sched_deps_info,
2727 sizeof (deps_init_id_sched_deps_info));
2728
2729 if (spec_info != NULL)
2730 deps_init_id_sched_deps_info.generate_spec_deps = 1;
2731
2732 sched_deps_info = &deps_init_id_sched_deps_info;
2733
2734 deps_analyze_insn (dc, insn);
2735
2736 free_deps (dc);
2737
2738 deps_init_id_data.id = NULL;
2739 }
2740
2741 \f
2742 struct sched_scan_info_def
2743 {
2744 /* This hook notifies the scheduler frontend to extend its internal per basic
2745 block data structures. This hook should be called once before a series of
2746 calls to bb_init (). */
2747 void (*extend_bb) (void);
2748
2749 /* This hook makes the scheduler frontend initialize its internal data
2750 structures for the passed basic block. */
2751 void (*init_bb) (basic_block);
2752
2753 /* This hook notifies the scheduler frontend to extend its internal per insn
2754 data structures. This hook should be called once before a series of calls
2755 to insn_init (). */
2756 void (*extend_insn) (void);
2757
2758 /* This hook makes the scheduler frontend initialize its internal data
2759 structures for the passed insn. */
2760 void (*init_insn) (rtx);
2761 };
2762
2763 /* A driver function to add a set of basic blocks (BBS) to the
2764 scheduling region. */
2765 static void
2766 sched_scan (const struct sched_scan_info_def *ssi, bb_vec_t bbs)
2767 {
2768 unsigned i;
2769 basic_block bb;
2770
2771 if (ssi->extend_bb)
2772 ssi->extend_bb ();
2773
2774 if (ssi->init_bb)
2775 FOR_EACH_VEC_ELT (basic_block, bbs, i, bb)
2776 ssi->init_bb (bb);
2777
2778 if (ssi->extend_insn)
2779 ssi->extend_insn ();
2780
2781 if (ssi->init_insn)
2782 FOR_EACH_VEC_ELT (basic_block, bbs, i, bb)
2783 {
2784 rtx insn;
2785
2786 FOR_BB_INSNS (bb, insn)
2787 ssi->init_insn (insn);
2788 }
2789 }
2790
2791 /* Implement hooks for collecting fundamental insn properties, like whether
2792 an insn is an ASM or is within a SCHED_GROUP. */
2793
2794 /* True when the "one-time init" data for INSN has not been initialized yet, i.e. we are seeing INSN for the first time. */
2795 static bool
2796 first_time_insn_init (insn_t insn)
2797 {
2798 return INSN_LIVE (insn) == NULL;
2799 }
2800
2801 /* Hash an entry in a transformed_insns hashtable. */
2802 static hashval_t
2803 hash_transformed_insns (const void *p)
2804 {
2805 return VINSN_HASH_RTX (((const struct transformed_insns *) p)->vinsn_old);
2806 }
2807
2808 /* Compare the entries in a transformed_insns hashtable. */
2809 static int
2810 eq_transformed_insns (const void *p, const void *q)
2811 {
2812 rtx i1 = VINSN_INSN_RTX (((const struct transformed_insns *) p)->vinsn_old);
2813 rtx i2 = VINSN_INSN_RTX (((const struct transformed_insns *) q)->vinsn_old);
2814
2815 if (INSN_UID (i1) == INSN_UID (i2))
2816 return 1;
2817 return rtx_equal_p (PATTERN (i1), PATTERN (i2));
2818 }
2819
2820 /* Free an entry in a transformed_insns hashtable. */
2821 static void
2822 free_transformed_insns (void *p)
2823 {
2824 struct transformed_insns *pti = (struct transformed_insns *) p;
2825
2826 vinsn_detach (pti->vinsn_old);
2827 vinsn_detach (pti->vinsn_new);
2828 free (pti);
2829 }
2830
2831 /* Init the s_i_d data for INSN which should be inited just once, when
2832 we first see the insn. */
2833 static void
2834 init_first_time_insn_data (insn_t insn)
2835 {
2836 /* The live set must not be allocated yet, as this is the first time
2837 we init data for INSN. */
2838 gcc_assert (first_time_insn_init (insn));
2839
2840 /* These are needed for nops too. */
2841 INSN_LIVE (insn) = get_regset_from_pool ();
2842 INSN_LIVE_VALID_P (insn) = false;
2843
2844 if (!INSN_NOP_P (insn))
2845 {
2846 INSN_ANALYZED_DEPS (insn) = BITMAP_ALLOC (NULL);
2847 INSN_FOUND_DEPS (insn) = BITMAP_ALLOC (NULL);
2848 INSN_TRANSFORMED_INSNS (insn)
2849 = htab_create (16, hash_transformed_insns,
2850 eq_transformed_insns, free_transformed_insns);
2851 init_deps (&INSN_DEPS_CONTEXT (insn), true);
2852 }
2853 }
2854
2855 /* Free almost all above data for INSN that is scheduled already.
2856 Used for extra-large basic blocks. */
2857 void
2858 free_data_for_scheduled_insn (insn_t insn)
2859 {
2860 gcc_assert (! first_time_insn_init (insn));
2861
2862 if (! INSN_ANALYZED_DEPS (insn))
2863 return;
2864
2865 BITMAP_FREE (INSN_ANALYZED_DEPS (insn));
2866 BITMAP_FREE (INSN_FOUND_DEPS (insn));
2867 htab_delete (INSN_TRANSFORMED_INSNS (insn));
2868
2869 /* This is allocated only for bookkeeping insns. */
2870 if (INSN_ORIGINATORS (insn))
2871 BITMAP_FREE (INSN_ORIGINATORS (insn));
2872 free_deps (&INSN_DEPS_CONTEXT (insn));
2873
2874 INSN_ANALYZED_DEPS (insn) = NULL;
2875
2876 /* Clear the readonly flag so that we ICE when trying to recalculate
2877 the deps context (as we believe that this should not happen). */
2878 (&INSN_DEPS_CONTEXT (insn))->readonly = 0;
2879 }
2880
2881 /* Free the same data as above for INSN. */
2882 static void
2883 free_first_time_insn_data (insn_t insn)
2884 {
2885 gcc_assert (! first_time_insn_init (insn));
2886
2887 free_data_for_scheduled_insn (insn);
2888 return_regset_to_pool (INSN_LIVE (insn));
2889 INSN_LIVE (insn) = NULL;
2890 INSN_LIVE_VALID_P (insn) = false;
2891 }
2892
2893 /* Initialize region-scope data structures for basic blocks. */
2894 static void
2895 init_global_and_expr_for_bb (basic_block bb)
2896 {
2897 if (sel_bb_empty_p (bb))
2898 return;
2899
2900 invalidate_av_set (bb);
2901 }
2902
2903 /* Data for global dependency analysis (to initialize CANT_MOVE and
2904 SCHED_GROUP_P). */
2905 static struct
2906 {
2907 /* Previous insn. */
2908 insn_t prev_insn;
2909 } init_global_data;
2910
2911 /* Determine if INSN is in a sched_group, is an asm, or should not be
2912 cloned. After that, initialize its expr. */
2913 static void
2914 init_global_and_expr_for_insn (insn_t insn)
2915 {
2916 if (LABEL_P (insn))
2917 return;
2918
2919 if (NOTE_INSN_BASIC_BLOCK_P (insn))
2920 {
2921 init_global_data.prev_insn = NULL_RTX;
2922 return;
2923 }
2924
2925 gcc_assert (INSN_P (insn));
2926
2927 if (SCHED_GROUP_P (insn))
2928 /* Setup a sched_group. */
2929 {
2930 insn_t prev_insn = init_global_data.prev_insn;
2931
2932 if (prev_insn)
2933 INSN_SCHED_NEXT (prev_insn) = insn;
2934
2935 init_global_data.prev_insn = insn;
2936 }
2937 else
2938 init_global_data.prev_insn = NULL_RTX;
2939
2940 if (GET_CODE (PATTERN (insn)) == ASM_INPUT
2941 || asm_noperands (PATTERN (insn)) >= 0)
2942 /* Mark INSN as an asm. */
2943 INSN_ASM_P (insn) = true;
2944
2945 {
2946 bool force_unique_p;
2947 ds_t spec_done_ds;
2948
2949 /* Certain instructions cannot be cloned, and frame related insns and
2950 the insn adjacent to NOTE_INSN_EPILOGUE_BEG cannot be moved out of
2951 their block. */
2952 if (prologue_epilogue_contains (insn))
2953 {
2954 if (RTX_FRAME_RELATED_P (insn))
2955 CANT_MOVE (insn) = 1;
2956 else
2957 {
2958 rtx note;
2959 for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
2960 if (REG_NOTE_KIND (note) == REG_SAVE_NOTE
2961 && ((enum insn_note) INTVAL (XEXP (note, 0))
2962 == NOTE_INSN_EPILOGUE_BEG))
2963 {
2964 CANT_MOVE (insn) = 1;
2965 break;
2966 }
2967 }
2968 force_unique_p = true;
2969 }
2970 else
2971 if (CANT_MOVE (insn)
2972 || INSN_ASM_P (insn)
2973 || SCHED_GROUP_P (insn)
2974 || CALL_P (insn)
2975 /* Exception handling insns are always unique. */
2976 || (cfun->can_throw_non_call_exceptions && can_throw_internal (insn))
2977 /* TRAP_IF, though it has an INSN code, is control_flow_insn_p (). */
2978 || control_flow_insn_p (insn)
2979 || volatile_insn_p (PATTERN (insn))
2980 || (targetm.cannot_copy_insn_p
2981 && targetm.cannot_copy_insn_p (insn)))
2982 force_unique_p = true;
2983 else
2984 force_unique_p = false;
2985
2986 if (targetm.sched.get_insn_spec_ds)
2987 {
2988 spec_done_ds = targetm.sched.get_insn_spec_ds (insn);
2989 spec_done_ds = ds_get_max_dep_weak (spec_done_ds);
2990 }
2991 else
2992 spec_done_ds = 0;
2993
2994 /* Initialize INSN's expr. */
2995 init_expr (INSN_EXPR (insn), vinsn_create (insn, force_unique_p), 0,
2996 REG_BR_PROB_BASE, INSN_PRIORITY (insn), 0, BLOCK_NUM (insn),
2997 spec_done_ds, 0, 0, NULL, true, false, false, false,
2998 CANT_MOVE (insn));
2999 }
3000
3001 init_first_time_insn_data (insn);
3002 }
3003
3004 /* Scan the region and initialize instruction data for basic blocks BBS. */
3005 void
3006 sel_init_global_and_expr (bb_vec_t bbs)
3007 {
3008 /* ??? It would be nice to implement push / pop scheme for sched_infos. */
3009 const struct sched_scan_info_def ssi =
3010 {
3011 NULL, /* extend_bb */
3012 init_global_and_expr_for_bb, /* init_bb */
3013 extend_insn_data, /* extend_insn */
3014 init_global_and_expr_for_insn /* init_insn */
3015 };
3016
3017 sched_scan (&ssi, bbs);
3018 }
3019
3020 /* Finalize region-scope data structures for basic blocks. */
3021 static void
3022 finish_global_and_expr_for_bb (basic_block bb)
3023 {
3024 av_set_clear (&BB_AV_SET (bb));
3025 BB_AV_LEVEL (bb) = 0;
3026 }
3027
3028 /* Finalize INSN's data. */
3029 static void
3030 finish_global_and_expr_insn (insn_t insn)
3031 {
3032 if (LABEL_P (insn) || NOTE_INSN_BASIC_BLOCK_P (insn))
3033 return;
3034
3035 gcc_assert (INSN_P (insn));
3036
3037 if (INSN_LUID (insn) > 0)
3038 {
3039 free_first_time_insn_data (insn);
3040 INSN_WS_LEVEL (insn) = 0;
3041 CANT_MOVE (insn) = 0;
3042
3043 /* We can no longer assert this, as vinsns of this insn could easily be
3044 live in other insns' caches. This should be changed to
3045 a counter-like approach among all vinsns. */
3046 gcc_assert (true || VINSN_COUNT (INSN_VINSN (insn)) == 1);
3047 clear_expr (INSN_EXPR (insn));
3048 }
3049 }
3050
3051 /* Finalize per instruction data for the whole region. */
3052 void
3053 sel_finish_global_and_expr (void)
3054 {
3055 {
3056 bb_vec_t bbs;
3057 int i;
3058
3059 bbs = VEC_alloc (basic_block, heap, current_nr_blocks);
3060
3061 for (i = 0; i < current_nr_blocks; i++)
3062 VEC_quick_push (basic_block, bbs, BASIC_BLOCK (BB_TO_BLOCK (i)));
3063
3064 /* Clear AV_SETs and INSN_EXPRs. */
3065 {
3066 const struct sched_scan_info_def ssi =
3067 {
3068 NULL, /* extend_bb */
3069 finish_global_and_expr_for_bb, /* init_bb */
3070 NULL, /* extend_insn */
3071 finish_global_and_expr_insn /* init_insn */
3072 };
3073
3074 sched_scan (&ssi, bbs);
3075 }
3076
3077 VEC_free (basic_block, heap, bbs);
3078 }
3079
3080 finish_insns ();
3081 }
3082 \f
3083
3084 /* In the below hooks, we merely calculate whether or not a dependence
3085 exists, and in what part of the insn. However, we will need more data
3086 once we start caching dependence requests. */
3087
3088 /* Container to hold information for dependency analysis. */
3089 static struct
3090 {
3091 deps_t dc;
3092
3093 /* A variable to track which part of rtx we are scanning in
3094 sched-deps.c: sched_analyze_insn (). */
3095 deps_where_t where;
3096
3097 /* Current producer. */
3098 insn_t pro;
3099
3100 /* Current consumer. */
3101 vinsn_t con;
3102
3103 /* If SEL_DEPS_HAS_DEP_P[DEPS_IN_X] is true, then X has a dependence.
3104 X is from { INSN, LHS, RHS }. */
3105 ds_t has_dep_p[DEPS_IN_NOWHERE];
3106 } has_dependence_data;
3107
3108 /* Start analyzing dependencies of INSN. */
3109 static void
3110 has_dependence_start_insn (insn_t insn ATTRIBUTE_UNUSED)
3111 {
3112 gcc_assert (has_dependence_data.where == DEPS_IN_NOWHERE);
3113
3114 has_dependence_data.where = DEPS_IN_INSN;
3115 }
3116
3117 /* Finish analyzing dependencies of an insn. */
3118 static void
3119 has_dependence_finish_insn (void)
3120 {
3121 gcc_assert (has_dependence_data.where == DEPS_IN_INSN);
3122
3123 has_dependence_data.where = DEPS_IN_NOWHERE;
3124 }
3125
3126 /* Start analyzing dependencies of LHS. */
3127 static void
3128 has_dependence_start_lhs (rtx lhs ATTRIBUTE_UNUSED)
3129 {
3130 gcc_assert (has_dependence_data.where == DEPS_IN_INSN);
3131
3132 if (VINSN_LHS (has_dependence_data.con) != NULL)
3133 has_dependence_data.where = DEPS_IN_LHS;
3134 }
3135
3136 /* Finish analyzing dependencies of an lhs. */
3137 static void
3138 has_dependence_finish_lhs (void)
3139 {
3140 has_dependence_data.where = DEPS_IN_INSN;
3141 }
3142
3143 /* Start analyzing dependencies of RHS. */
3144 static void
3145 has_dependence_start_rhs (rtx rhs ATTRIBUTE_UNUSED)
3146 {
3147 gcc_assert (has_dependence_data.where == DEPS_IN_INSN);
3148
3149 if (VINSN_RHS (has_dependence_data.con) != NULL)
3150 has_dependence_data.where = DEPS_IN_RHS;
3151 }
3152
3153 /* Finish analyzing dependencies of an rhs. */
3154 static void
3155 has_dependence_finish_rhs (void)
3156 {
3157 gcc_assert (has_dependence_data.where == DEPS_IN_RHS
3158 || has_dependence_data.where == DEPS_IN_INSN);
3159
3160 has_dependence_data.where = DEPS_IN_INSN;
3161 }
3162
3163 /* Note a set of REGNO. */
3164 static void
3165 has_dependence_note_reg_set (int regno)
3166 {
3167 struct deps_reg *reg_last = &has_dependence_data.dc->reg_last[regno];
3168
3169 if (!sched_insns_conditions_mutex_p (has_dependence_data.pro,
3170 VINSN_INSN_RTX
3171 (has_dependence_data.con)))
3172 {
3173 ds_t *dsp = &has_dependence_data.has_dep_p[has_dependence_data.where];
3174
3175 if (reg_last->sets != NULL
3176 || reg_last->clobbers != NULL)
3177 *dsp = (*dsp & ~SPECULATIVE) | DEP_OUTPUT;
3178
3179 if (reg_last->uses)
3180 *dsp = (*dsp & ~SPECULATIVE) | DEP_ANTI;
3181 }
3182 }
3183
3184 /* Note a clobber of REGNO. */
3185 static void
3186 has_dependence_note_reg_clobber (int regno)
3187 {
3188 struct deps_reg *reg_last = &has_dependence_data.dc->reg_last[regno];
3189
3190 if (!sched_insns_conditions_mutex_p (has_dependence_data.pro,
3191 VINSN_INSN_RTX
3192 (has_dependence_data.con)))
3193 {
3194 ds_t *dsp = &has_dependence_data.has_dep_p[has_dependence_data.where];
3195
3196 if (reg_last->sets)
3197 *dsp = (*dsp & ~SPECULATIVE) | DEP_OUTPUT;
3198
3199 if (reg_last->uses)
3200 *dsp = (*dsp & ~SPECULATIVE) | DEP_ANTI;
3201 }
3202 }
3203
3204 /* Note a use of REGNO. */
3205 static void
3206 has_dependence_note_reg_use (int regno)
3207 {
3208 struct deps_reg *reg_last = &has_dependence_data.dc->reg_last[regno];
3209
3210 if (!sched_insns_conditions_mutex_p (has_dependence_data.pro,
3211 VINSN_INSN_RTX
3212 (has_dependence_data.con)))
3213 {
3214 ds_t *dsp = &has_dependence_data.has_dep_p[has_dependence_data.where];
3215
3216 if (reg_last->sets)
3217 *dsp = (*dsp & ~SPECULATIVE) | DEP_TRUE;
3218
3219 if (reg_last->clobbers)
3220 *dsp = (*dsp & ~SPECULATIVE) | DEP_ANTI;
3221
3222 /* Handle BE_IN_SPEC. */
3223 if (reg_last->uses)
3224 {
3225 ds_t pro_spec_checked_ds;
3226
3227 pro_spec_checked_ds = INSN_SPEC_CHECKED_DS (has_dependence_data.pro);
3228 pro_spec_checked_ds = ds_get_max_dep_weak (pro_spec_checked_ds);
3229
3230 if (pro_spec_checked_ds != 0)
3231 /* Merge BE_IN_SPEC bits into *DSP. */
3232 *dsp = ds_full_merge (*dsp, pro_spec_checked_ds,
3233 NULL_RTX, NULL_RTX);
3234 }
3235 }
3236 }
3237
3238 /* Note a memory dependence. */
3239 static void
3240 has_dependence_note_mem_dep (rtx mem ATTRIBUTE_UNUSED,
3241 rtx pending_mem ATTRIBUTE_UNUSED,
3242 insn_t pending_insn ATTRIBUTE_UNUSED,
3243 ds_t ds ATTRIBUTE_UNUSED)
3244 {
3245 if (!sched_insns_conditions_mutex_p (has_dependence_data.pro,
3246 VINSN_INSN_RTX (has_dependence_data.con)))
3247 {
3248 ds_t *dsp = &has_dependence_data.has_dep_p[has_dependence_data.where];
3249
3250 *dsp = ds_full_merge (ds, *dsp, pending_mem, mem);
3251 }
3252 }
3253
3254 /* Note a dependence. */
3255 static void
3256 has_dependence_note_dep (insn_t pro ATTRIBUTE_UNUSED,
3257 ds_t ds ATTRIBUTE_UNUSED)
3258 {
3259 if (!sched_insns_conditions_mutex_p (has_dependence_data.pro,
3260 VINSN_INSN_RTX (has_dependence_data.con)))
3261 {
3262 ds_t *dsp = &has_dependence_data.has_dep_p[has_dependence_data.where];
3263
3264 *dsp = ds_full_merge (ds, *dsp, NULL_RTX, NULL_RTX);
3265 }
3266 }
3267
3268 /* Mark the insn as having a hard dependence that prevents speculation. */
3269 void
3270 sel_mark_hard_insn (rtx insn)
3271 {
3272 int i;
3273
3274 /* Only work when we're in has_dependence_p mode.
3275 ??? This is a hack, this should actually be a hook. */
3276 if (!has_dependence_data.dc || !has_dependence_data.pro)
3277 return;
3278
3279 gcc_assert (insn == VINSN_INSN_RTX (has_dependence_data.con));
3280 gcc_assert (has_dependence_data.where == DEPS_IN_INSN);
3281
3282 for (i = 0; i < DEPS_IN_NOWHERE; i++)
3283 has_dependence_data.has_dep_p[i] &= ~SPECULATIVE;
3284 }
3285
3286 /* This structure holds the hooks for the dependency analysis used when
3287 actually processing dependencies in the scheduler. */
3288 static struct sched_deps_info_def has_dependence_sched_deps_info;
3289
3290 /* This initializes most of the fields of the above structure. */
3291 static const struct sched_deps_info_def const_has_dependence_sched_deps_info =
3292 {
3293 NULL,
3294
3295 has_dependence_start_insn,
3296 has_dependence_finish_insn,
3297 has_dependence_start_lhs,
3298 has_dependence_finish_lhs,
3299 has_dependence_start_rhs,
3300 has_dependence_finish_rhs,
3301 has_dependence_note_reg_set,
3302 has_dependence_note_reg_clobber,
3303 has_dependence_note_reg_use,
3304 has_dependence_note_mem_dep,
3305 has_dependence_note_dep,
3306
3307 0, /* use_cselib */
3308 0, /* use_deps_list */
3309 0 /* generate_spec_deps */
3310 };
3311
3312 /* Initialize has_dependence_sched_deps_info with extra spec field. */
3313 static void
3314 setup_has_dependence_sched_deps_info (void)
3315 {
3316 memcpy (&has_dependence_sched_deps_info,
3317 &const_has_dependence_sched_deps_info,
3318 sizeof (has_dependence_sched_deps_info));
3319
3320 if (spec_info != NULL)
3321 has_dependence_sched_deps_info.generate_spec_deps = 1;
3322
3323 sched_deps_info = &has_dependence_sched_deps_info;
3324 }
3325
3326 /* Remove all dependences found and recorded in has_dependence_data array. */
3327 void
3328 sel_clear_has_dependence (void)
3329 {
3330 int i;
3331
3332 for (i = 0; i < DEPS_IN_NOWHERE; i++)
3333 has_dependence_data.has_dep_p[i] = 0;
3334 }
3335
3336 /* Return nonzero if EXPR is dependent upon PRED. Return a pointer
3337 to the dependence information array in HAS_DEP_PP. */
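/* In outline: PRED's dependence context is advanced over PRED once (and
   marked read-only, so this happens only the first time), then EXPR's
   insn is analyzed against that context with the has_dependence_* hooks,
   which accumulate per-part (insn/lhs/rhs) dependence bits.  */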
3338 ds_t
3339 has_dependence_p (expr_t expr, insn_t pred, ds_t **has_dep_pp)
3340 {
3341 int i;
3342 ds_t ds;
3343 struct deps_desc *dc;
3344
3345 if (INSN_SIMPLEJUMP_P (pred))
3346 /* Unconditional jump is just a transfer of control flow.
3347 Ignore it. */
3348 return false;
3349
3350 dc = &INSN_DEPS_CONTEXT (pred);
3351
3352 /* We init this field lazily. */
3353 if (dc->reg_last == NULL)
3354 init_deps_reg_last (dc);
3355
3356 if (!dc->readonly)
3357 {
3358 has_dependence_data.pro = NULL;
3359 /* Initialize empty dep context with information about PRED. */
3360 advance_deps_context (dc, pred);
3361 dc->readonly = 1;
3362 }
3363
3364 has_dependence_data.where = DEPS_IN_NOWHERE;
3365 has_dependence_data.pro = pred;
3366 has_dependence_data.con = EXPR_VINSN (expr);
3367 has_dependence_data.dc = dc;
3368
3369 sel_clear_has_dependence ();
3370
3371 /* Now catch all dependencies that would be generated between PRED and
3372 INSN. */
3373 setup_has_dependence_sched_deps_info ();
3374 deps_analyze_insn (dc, EXPR_INSN_RTX (expr));
3375 has_dependence_data.dc = NULL;
3376
3377 /* When a barrier was found, set DEPS_IN_INSN bits. */
3378 if (dc->last_reg_pending_barrier == TRUE_BARRIER)
3379 has_dependence_data.has_dep_p[DEPS_IN_INSN] = DEP_TRUE;
3380 else if (dc->last_reg_pending_barrier == MOVE_BARRIER)
3381 has_dependence_data.has_dep_p[DEPS_IN_INSN] = DEP_ANTI;
3382
3383 /* Do not allow stores to memory to move through checks. Currently
3384 we don't move this to sched-deps.c as the check doesn't have
3385 obvious places to which this dependence can be attached.
3386 FIXME: this should go to a hook. */
3387 if (EXPR_LHS (expr)
3388 && MEM_P (EXPR_LHS (expr))
3389 && sel_insn_is_speculation_check (pred))
3390 has_dependence_data.has_dep_p[DEPS_IN_INSN] = DEP_ANTI;
3391
3392 *has_dep_pp = has_dependence_data.has_dep_p;
3393 ds = 0;
3394 for (i = 0; i < DEPS_IN_NOWHERE; i++)
3395 ds = ds_full_merge (ds, has_dependence_data.has_dep_p[i],
3396 NULL_RTX, NULL_RTX);
3397
3398 return ds;
3399 }
3400 \f
3401
3402 /* Dependence hooks implementation that checks dependence latency constraints
3403 on the insns being scheduled. The entry point for these routines is
3404 tick_check_p predicate. */
3405
3406 static struct
3407 {
3408 /* An expr we are currently checking. */
3409 expr_t expr;
3410
3411 /* A minimal cycle for its scheduling. */
3412 int cycle;
3413
3414 /* Whether we have seen a true dependence while checking. */
3415 bool seen_true_dep_p;
3416 } tick_check_data;
3417
3418 /* Update the minimal scheduling cycle of the expr being checked, given
3419 that it depends on PRO_INSN with status DS and weight DW. */
3420 static void
3421 tick_check_dep_with_dw (insn_t pro_insn, ds_t ds, dw_t dw)
3422 {
3423 expr_t con_expr = tick_check_data.expr;
3424 insn_t con_insn = EXPR_INSN_RTX (con_expr);
3425
3426 if (con_insn != pro_insn)
3427 {
3428 enum reg_note dt;
3429 int tick;
3430
3431 if (/* PROducer was removed from above due to pipelining. */
3432 !INSN_IN_STREAM_P (pro_insn)
3433 /* Or PROducer was originally on the next iteration regarding the
3434 CONsumer. */
3435 || (INSN_SCHED_TIMES (pro_insn)
3436 - EXPR_SCHED_TIMES (con_expr)) > 1)
3437 /* Don't count this dependence. */
3438 return;
3439
3440 dt = ds_to_dt (ds);
3441 if (dt == REG_DEP_TRUE)
3442 tick_check_data.seen_true_dep_p = true;
3443
3444 gcc_assert (INSN_SCHED_CYCLE (pro_insn) > 0);
3445
3446 {
3447 dep_def _dep, *dep = &_dep;
3448
3449 init_dep (dep, pro_insn, con_insn, dt);
3450
3451 tick = INSN_SCHED_CYCLE (pro_insn) + dep_cost_1 (dep, dw);
3452 }
3453
3454 /* When there are several kinds of dependencies between pro and con,
3455 only REG_DEP_TRUE should be taken into account. */
3456 if (tick > tick_check_data.cycle
3457 && (dt == REG_DEP_TRUE || !tick_check_data.seen_true_dep_p))
3458 tick_check_data.cycle = tick;
3459 }
3460 }
3461
3462 /* An implementation of note_dep hook. */
3463 static void
3464 tick_check_note_dep (insn_t pro, ds_t ds)
3465 {
3466 tick_check_dep_with_dw (pro, ds, 0);
3467 }
3468
3469 /* An implementation of note_mem_dep hook. */
3470 static void
3471 tick_check_note_mem_dep (rtx mem1, rtx mem2, insn_t pro, ds_t ds)
3472 {
3473 dw_t dw;
3474
3475 dw = (ds_to_dt (ds) == REG_DEP_TRUE
3476 ? estimate_dep_weak (mem1, mem2)
3477 : 0);
3478
3479 tick_check_dep_with_dw (pro, ds, dw);
3480 }
3481
3482 /* This structure contains hooks for dependence analysis used when determining
3483 whether an insn is ready for scheduling. */
3484 static struct sched_deps_info_def tick_check_sched_deps_info =
3485 {
3486 NULL,
3487
3488 NULL,
3489 NULL,
3490 NULL,
3491 NULL,
3492 NULL,
3493 NULL,
3494 haifa_note_reg_set,
3495 haifa_note_reg_clobber,
3496 haifa_note_reg_use,
3497 tick_check_note_mem_dep,
3498 tick_check_note_dep,
3499
3500 0, 0, 0
3501 };
3502
3503 /* Estimate number of cycles from the current cycle of FENCE until EXPR can be
3504 scheduled. Return 0 if all data from producers in DC is ready. */
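/* A sketch of the mechanism: the tick_check_* hooks record, for every
   dependence of EXPR on an already scheduled producer, the earliest cycle
   at which EXPR could issue; the returned value is how many cycles past
   FENCE's current cycle we would still have to wait.  */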
3505 int
3506 tick_check_p (expr_t expr, deps_t dc, fence_t fence)
3507 {
3508 int cycles_left;
3509 /* Initialize variables. */
3510 tick_check_data.expr = expr;
3511 tick_check_data.cycle = 0;
3512 tick_check_data.seen_true_dep_p = false;
3513 sched_deps_info = &tick_check_sched_deps_info;
3514
3515 gcc_assert (!dc->readonly);
3516 dc->readonly = 1;
3517 deps_analyze_insn (dc, EXPR_INSN_RTX (expr));
3518 dc->readonly = 0;
3519
3520 cycles_left = tick_check_data.cycle - FENCE_CYCLE (fence);
3521
3522 return cycles_left >= 0 ? cycles_left : 0;
3523 }
3524 \f
3525
3526 /* Functions to work with insns. */
3527
3528 /* Returns true if LHS of INSN is the same as DEST of an insn
3529 being moved. */
3530 bool
3531 lhs_of_insn_equals_to_dest_p (insn_t insn, rtx dest)
3532 {
3533 rtx lhs = INSN_LHS (insn);
3534
3535 if (lhs == NULL || dest == NULL)
3536 return false;
3537
3538 return rtx_equal_p (lhs, dest);
3539 }
3540
3541 /* Return s_i_d entry of INSN. Callable from debugger. */
3542 sel_insn_data_def
3543 insn_sid (insn_t insn)
3544 {
3545 return *SID (insn);
3546 }
3547
3548 /* True when INSN is a speculative check. We can tell this by looking
3549 at the data structures of the selective scheduler, not by examining
3550 the pattern. */
3551 bool
3552 sel_insn_is_speculation_check (rtx insn)
3553 {
3554 return s_i_d && !! INSN_SPEC_CHECKED_DS (insn);
3555 }
3556
3557 /* Extract the machine mode MODE and the destination location DST_LOC
3558 of the given INSN. */
3559 void
3560 get_dest_and_mode (rtx insn, rtx *dst_loc, enum machine_mode *mode)
3561 {
3562 rtx pat = PATTERN (insn);
3563
3564 gcc_assert (dst_loc);
3565 gcc_assert (GET_CODE (pat) == SET);
3566
3567 *dst_loc = SET_DEST (pat);
3568
3569 gcc_assert (*dst_loc);
3570 gcc_assert (MEM_P (*dst_loc) || REG_P (*dst_loc));
3571
3572 if (mode)
3573 *mode = GET_MODE (*dst_loc);
3574 }
3575
3576 /* Returns true when moving through JUMP will result in bookkeeping
3577 creation. */
3578 bool
3579 bookkeeping_can_be_created_if_moved_through_p (insn_t jump)
3580 {
3581 insn_t succ;
3582 succ_iterator si;
3583
3584 FOR_EACH_SUCC (succ, si, jump)
3585 if (sel_num_cfg_preds_gt_1 (succ))
3586 return true;
3587
3588 return false;
3589 }
3590
3591 /* Return 'true' if INSN is the only one in its basic block. */
3592 static bool
3593 insn_is_the_only_one_in_bb_p (insn_t insn)
3594 {
3595 return sel_bb_head_p (insn) && sel_bb_end_p (insn);
3596 }
3597
3598 #ifdef ENABLE_CHECKING
3599 /* Check that the region we're scheduling still has at most one
3600 backedge. */
3601 static void
3602 verify_backedges (void)
3603 {
3604 if (pipelining_p)
3605 {
3606 int i, n = 0;
3607 edge e;
3608 edge_iterator ei;
3609
3610 for (i = 0; i < current_nr_blocks; i++)
3611 FOR_EACH_EDGE (e, ei, BASIC_BLOCK (BB_TO_BLOCK (i))->succs)
3612 if (in_current_region_p (e->dest)
3613 && BLOCK_TO_BB (e->dest->index) < i)
3614 n++;
3615
3616 gcc_assert (n <= 1);
3617 }
3618 }
3619 #endif
3620 \f
3621
3622 /* Functions to work with control flow. */
3623
3624 /* Recompute BLOCK_TO_BB and BB_FOR_BLOCK for current region so that blocks
3625 are sorted in topological order (it might have been invalidated by
3626 redirecting an edge). */
3627 static void
3628 sel_recompute_toporder (void)
3629 {
3630 int i, n, rgn;
3631 int *postorder, n_blocks;
3632
3633 postorder = XALLOCAVEC (int, n_basic_blocks);
3634 n_blocks = post_order_compute (postorder, false, false);
3635
3636 rgn = CONTAINING_RGN (BB_TO_BLOCK (0));
3637 for (n = 0, i = n_blocks - 1; i >= 0; i--)
3638 if (CONTAINING_RGN (postorder[i]) == rgn)
3639 {
3640 BLOCK_TO_BB (postorder[i]) = n;
3641 BB_TO_BLOCK (n) = postorder[i];
3642 n++;
3643 }
3644
3645 /* Assert that we updated info for all blocks. We may miss some blocks if
3646 this function is called when redirecting an edge made a block
3647 unreachable, but that block is not deleted yet. */
3648 gcc_assert (n == RGN_NR_BLOCKS (rgn));
3649 }
3650
3651 /* Tidy the possibly empty block BB; return true if BB was merged into another block or removed, false if it was kept. */
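/* In outline: non-fallthru predecessor edges are first redirected to BB's
   single successor, then BB is either merged into its fallthru predecessor
   or deleted outright, and dominators are fixed up if the redirection
   created an unreachable block.  */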
3652 static bool
3653 maybe_tidy_empty_bb (basic_block bb)
3654 {
3655 basic_block succ_bb, pred_bb;
3656 VEC (basic_block, heap) *dom_bbs;
3657 edge e;
3658 edge_iterator ei;
3659 bool rescan_p;
3660
3661 /* Keep an empty bb only if it immediately precedes EXIT and has an
3662 incoming non-fallthrough edge, or if it has no predecessors or
3663 successors. Otherwise remove it. */
3664 if (!sel_bb_empty_p (bb)
3665 || (single_succ_p (bb)
3666 && single_succ (bb) == EXIT_BLOCK_PTR
3667 && (!single_pred_p (bb)
3668 || !(single_pred_edge (bb)->flags & EDGE_FALLTHRU)))
3669 || EDGE_COUNT (bb->preds) == 0
3670 || EDGE_COUNT (bb->succs) == 0)
3671 return false;
3672
3673 /* Do not attempt to redirect complex edges. */
3674 FOR_EACH_EDGE (e, ei, bb->preds)
3675 if (e->flags & EDGE_COMPLEX)
3676 return false;
3677
3678 free_data_sets (bb);
3679
3680 /* Do not delete BB if it has more than one successor.
3681 That can occur when we are moving a jump. */
3682 if (!single_succ_p (bb))
3683 {
3684 gcc_assert (can_merge_blocks_p (bb->prev_bb, bb));
3685 sel_merge_blocks (bb->prev_bb, bb);
3686 return true;
3687 }
3688
3689 succ_bb = single_succ (bb);
3690 rescan_p = true;
3691 pred_bb = NULL;
3692 dom_bbs = NULL;
3693
3694 /* Redirect all non-fallthru edges to the next bb. */
3695 while (rescan_p)
3696 {
3697 rescan_p = false;
3698
3699 FOR_EACH_EDGE (e, ei, bb->preds)
3700 {
3701 pred_bb = e->src;
3702
3703 if (!(e->flags & EDGE_FALLTHRU))
3704 {
3705 /* We cannot invalidate the computed topological order by moving
3706 the edge destination block (E->SUCC) along a fallthru edge.
3707
3708 We will update dominators here only if redirecting creates
3709 an unreachable block; otherwise
3710 sel_redirect_edge_and_branch will take care of it. */
3711 if (e->dest != bb
3712 && single_pred_p (e->dest))
3713 VEC_safe_push (basic_block, heap, dom_bbs, e->dest);
3714 sel_redirect_edge_and_branch (e, succ_bb);
3715 rescan_p = true;
3716 break;
3717 }
3718 /* If the edge is fallthru, but PRED_BB ends in a conditional jump
3719 to BB (so there is no non-fallthru edge from PRED_BB to BB), we
3720 still have to adjust it. */
3721 else if (single_succ_p (pred_bb) && any_condjump_p (BB_END (pred_bb)))
3722 {
3723 /* If possible, try to remove the unneeded conditional jump. */
3724 if (INSN_SCHED_TIMES (BB_END (pred_bb)) == 0
3725 && !IN_CURRENT_FENCE_P (BB_END (pred_bb)))
3726 {
3727 if (!sel_remove_insn (BB_END (pred_bb), false, false))
3728 tidy_fallthru_edge (e);
3729 }
3730 else
3731 sel_redirect_edge_and_branch (e, succ_bb);
3732 rescan_p = true;
3733 break;
3734 }
3735 }
3736 }
3737
3738 if (can_merge_blocks_p (bb->prev_bb, bb))
3739 sel_merge_blocks (bb->prev_bb, bb);
3740 else
3741 {
3742 /* This is a block without a fallthru predecessor. Just delete it. */
3743 gcc_assert (pred_bb != NULL);
3744
3745 if (in_current_region_p (pred_bb))
3746 move_bb_info (pred_bb, bb);
3747 remove_empty_bb (bb, true);
3748 }
3749
3750 if (!VEC_empty (basic_block, dom_bbs))
3751 {
3752 VEC_safe_push (basic_block, heap, dom_bbs, succ_bb);
3753 iterate_fix_dominators (CDI_DOMINATORS, dom_bbs, false);
3754 VEC_free (basic_block, heap, dom_bbs);
3755 }
3756
3757 return true;
3758 }
3759
3760 /* Tidy the control flow after we have removed the original insn from
3761 XBB. Return true if we have removed some blocks. When FULL_TIDYING
3762 is true, also try to optimize control flow on non-empty blocks. */
3763 bool
3764 tidy_control_flow (basic_block xbb, bool full_tidying)
3765 {
3766 bool changed = true;
3767 insn_t first, last;
3768
3769 /* First check whether XBB is empty. */
3770 changed = maybe_tidy_empty_bb (xbb);
3771 if (changed || !full_tidying)
3772 return changed;
3773
3774 /* Check if an unnecessary jump was left after the insn was removed. */
3775 if (bb_has_removable_jump_to_p (xbb, xbb->next_bb)
3776 && INSN_SCHED_TIMES (BB_END (xbb)) == 0
3777 && !IN_CURRENT_FENCE_P (BB_END (xbb)))
3778 {
3779 if (sel_remove_insn (BB_END (xbb), false, false))
3780 return true;
3781 tidy_fallthru_edge (EDGE_SUCC (xbb, 0));
3782 }
3783
3784 first = sel_bb_head (xbb);
3785 last = sel_bb_end (xbb);
3786 if (MAY_HAVE_DEBUG_INSNS)
3787 {
3788 if (first != last && DEBUG_INSN_P (first))
3789 do
3790 first = NEXT_INSN (first);
3791 while (first != last && (DEBUG_INSN_P (first) || NOTE_P (first)));
3792
3793 if (first != last && DEBUG_INSN_P (last))
3794 do
3795 last = PREV_INSN (last);
3796 while (first != last && (DEBUG_INSN_P (last) || NOTE_P (last)));
3797 }
3798 /* Check if the previous basic block ends with an unnecessary jump to the
3799 next basic block, left after removing INSN from the stream.
3800 If so, remove that jump and redirect the edge to the current
3801 basic block (where INSN was before deletion). This way,
3802 when the NOP is deleted several instructions later together with its
3803 basic block, we will not be left with a jump to the next instruction,
3804 which can be harmful. */
3805 if (first == last
3806 && !sel_bb_empty_p (xbb)
3807 && INSN_NOP_P (last)
3808 /* Flow goes fallthru from current block to the next. */
3809 && EDGE_COUNT (xbb->succs) == 1
3810 && (EDGE_SUCC (xbb, 0)->flags & EDGE_FALLTHRU)
3811 /* When successor is an EXIT block, it may not be the next block. */
3812 && single_succ (xbb) != EXIT_BLOCK_PTR
3813 /* And unconditional jump in previous basic block leads to
3814 next basic block of XBB and this jump can be safely removed. */
3815 && in_current_region_p (xbb->prev_bb)
3816 && bb_has_removable_jump_to_p (xbb->prev_bb, xbb->next_bb)
3817 && INSN_SCHED_TIMES (BB_END (xbb->prev_bb)) == 0
3818 /* Also this jump is not at the scheduling boundary. */
3819 && !IN_CURRENT_FENCE_P (BB_END (xbb->prev_bb)))
3820 {
3821 bool recompute_toporder_p;
3822 /* Clear data structures of jump - jump itself will be removed
3823 by sel_redirect_edge_and_branch. */
3824 clear_expr (INSN_EXPR (BB_END (xbb->prev_bb)));
3825 recompute_toporder_p
3826 = sel_redirect_edge_and_branch (EDGE_SUCC (xbb->prev_bb, 0), xbb);
3827
3828 gcc_assert (EDGE_SUCC (xbb->prev_bb, 0)->flags & EDGE_FALLTHRU);
3829
3830 /* It can turn out that, after removing the unused jump, the basic block
3831 that contained it becomes empty too. In such a case
3832 remove that block as well. */
3833 if (sel_bb_empty_p (xbb->prev_bb))
3834 changed = maybe_tidy_empty_bb (xbb->prev_bb);
3835 if (recompute_toporder_p)
3836 sel_recompute_toporder ();
3837 }
3838
3839 #ifdef ENABLE_CHECKING
3840 verify_backedges ();
3841 verify_dominators (CDI_DOMINATORS);
3842 #endif
3843
3844 return changed;
3845 }
3846
3847 /* Purge meaningless empty blocks in the middle of a region. */
3848 void
3849 purge_empty_blocks (void)
3850 {
3851 int i;
3852
3853 /* Do not attempt to delete the first basic block in the region. */
3854 for (i = 1; i < current_nr_blocks; )
3855 {
3856 basic_block b = BASIC_BLOCK (BB_TO_BLOCK (i));
3857
3858 if (maybe_tidy_empty_bb (b))
3859 continue;
3860
3861 i++;
3862 }
3863 }
3864
3865 /* Rip INSN off the insn stream. When ONLY_DISCONNECT is true, do not
3866 delete the insn's data, because it will be re-emitted later.
3867 Return true if we have removed some blocks afterwards. */
3868 bool
3869 sel_remove_insn (insn_t insn, bool only_disconnect, bool full_tidying)
3870 {
3871 basic_block bb = BLOCK_FOR_INSN (insn);
3872
3873 gcc_assert (INSN_IN_STREAM_P (insn));
3874
3875 if (DEBUG_INSN_P (insn) && BB_AV_SET_VALID_P (bb))
3876 {
3877 expr_t expr;
3878 av_set_iterator i;
3879
3880 /* When we remove a debug insn that is the head of a BB, it remains
3881 in the AV_SET of the block, but it should not. */
3882 FOR_EACH_EXPR_1 (expr, i, &BB_AV_SET (bb))
3883 if (EXPR_INSN_RTX (expr) == insn)
3884 {
3885 av_set_iter_remove (&i);
3886 break;
3887 }
3888 }
3889
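  /* When only disconnecting, splice INSN out of the chain by hand (fixing
     BB_HEAD / BB_END if needed) so that its data survives for the later
     re-emission; otherwise remove it for good and free its expr.  */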
3890 if (only_disconnect)
3891 {
3892 insn_t prev = PREV_INSN (insn);
3893 insn_t next = NEXT_INSN (insn);
3894 basic_block bb = BLOCK_FOR_INSN (insn);
3895
3896 NEXT_INSN (prev) = next;
3897 PREV_INSN (next) = prev;
3898
3899 if (BB_HEAD (bb) == insn)
3900 {
3901 gcc_assert (BLOCK_FOR_INSN (prev) == bb);
3902 BB_HEAD (bb) = prev;
3903 }
3904 if (BB_END (bb) == insn)
3905 BB_END (bb) = prev;
3906 }
3907 else
3908 {
3909 remove_insn (insn);
3910 clear_expr (INSN_EXPR (insn));
3911 }
3912
3913 /* It is necessary to NULL these fields before calling add_insn (). */
3914 PREV_INSN (insn) = NULL_RTX;
3915 NEXT_INSN (insn) = NULL_RTX;
3916
3917 return tidy_control_flow (bb, full_tidying);
3918 }
3919
3920 /* Estimate number of the insns in BB. */
3921 static int
3922 sel_estimate_number_of_insns (basic_block bb)
3923 {
3924 int res = 0;
3925 insn_t insn = NEXT_INSN (BB_HEAD (bb)), next_tail = NEXT_INSN (BB_END (bb));
3926
3927 for (; insn != next_tail; insn = NEXT_INSN (insn))
3928 if (NONDEBUG_INSN_P (insn))
3929 res++;
3930
3931 return res;
3932 }
3933
3934 /* We don't need separate luids for notes or labels. */
3935 static int
3936 sel_luid_for_non_insn (rtx x)
3937 {
3938 gcc_assert (NOTE_P (x) || LABEL_P (x));
3939
3940 return -1;
3941 }
3942
3943 /* Return seqno of the only predecessor of INSN. */
3944 static int
3945 get_seqno_of_a_pred (insn_t insn)
3946 {
3947 int seqno;
3948
3949 gcc_assert (INSN_SIMPLEJUMP_P (insn));
3950
3951 if (!sel_bb_head_p (insn))
3952 seqno = INSN_SEQNO (PREV_INSN (insn));
3953 else
3954 {
3955 basic_block bb = BLOCK_FOR_INSN (insn);
3956
3957 if (single_pred_p (bb)
3958 && !in_current_region_p (single_pred (bb)))
3959 {
3960 /* We can have preds outside a region when splitting edges
3961 for pipelining of an outer loop. Use succ instead.
3962 There should be only one of them. */
3963 insn_t succ = NULL;
3964 succ_iterator si;
3965 bool first = true;
3966
3967 gcc_assert (flag_sel_sched_pipelining_outer_loops
3968 && current_loop_nest);
3969 FOR_EACH_SUCC_1 (succ, si, insn,
3970 SUCCS_NORMAL | SUCCS_SKIP_TO_LOOP_EXITS)
3971 {
3972 gcc_assert (first);
3973 first = false;
3974 }
3975
3976 gcc_assert (succ != NULL);
3977 seqno = INSN_SEQNO (succ);
3978 }
3979 else
3980 {
3981 insn_t *preds;
3982 int n;
3983
3984 cfg_preds (BLOCK_FOR_INSN (insn), &preds, &n);
3985 gcc_assert (n == 1);
3986
3987 seqno = INSN_SEQNO (preds[0]);
3988
3989 free (preds);
3990 }
3991 }
3992
3993 return seqno;
3994 }
3995
3996 /* Find the proper seqno for inserting at INSN. Returns -1 if no predecessors
3997 with positive seqno exist. */
3998 int
3999 get_seqno_by_preds (rtx insn)
4000 {
4001 basic_block bb = BLOCK_FOR_INSN (insn);
4002 rtx tmp = insn, head = BB_HEAD (bb);
4003 insn_t *preds;
4004 int n, i, seqno;
4005
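  /* Walk backwards from INSN towards the head of its block; the first real
     insn found on the way (possibly INSN itself, but not the block head)
     provides the seqno.  Otherwise, fall back to the maximum seqno among
     the block's predecessors.  */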
4006 while (tmp != head)
4007 if (INSN_P (tmp))
4008 return INSN_SEQNO (tmp);
4009 else
4010 tmp = PREV_INSN (tmp);
4011
4012 cfg_preds (bb, &preds, &n);
4013 for (i = 0, seqno = -1; i < n; i++)
4014 seqno = MAX (seqno, INSN_SEQNO (preds[i]));
4015
4016 return seqno;
4017 }
4018
4019 \f
4020
4021 /* Extend pass-scope data structures for basic blocks. */
4022 void
4023 sel_extend_global_bb_info (void)
4024 {
4025 VEC_safe_grow_cleared (sel_global_bb_info_def, heap, sel_global_bb_info,
4026 last_basic_block);
4027 }
4028
4029 /* Extend region-scope data structures for basic blocks. */
4030 static void
4031 extend_region_bb_info (void)
4032 {
4033 VEC_safe_grow_cleared (sel_region_bb_info_def, heap, sel_region_bb_info,
4034 last_basic_block);
4035 }
4036
4037 /* Extend all data structures to fit for all basic blocks. */
4038 static void
4039 extend_bb_info (void)
4040 {
4041 sel_extend_global_bb_info ();
4042 extend_region_bb_info ();
4043 }
4044
4045 /* Finalize pass-scope data structures for basic blocks. */
4046 void
4047 sel_finish_global_bb_info (void)
4048 {
4049 VEC_free (sel_global_bb_info_def, heap, sel_global_bb_info);
4050 }
4051
4052 /* Finalize region-scope data structures for basic blocks. */
4053 static void
4054 finish_region_bb_info (void)
4055 {
4056 VEC_free (sel_region_bb_info_def, heap, sel_region_bb_info);
4057 }
4058 \f
4059
4060 /* Data for each insn in current region. */
4061 VEC (sel_insn_data_def, heap) *s_i_d = NULL;
4062
4063 /* Extend data structures for insns from current region. */
4064 static void
4065 extend_insn_data (void)
4066 {
4067 int reserve;
4068
4069 sched_extend_target ();
4070 sched_deps_init (false);
4071
4072 /* Extend data structures for insns from current region. */
4073 reserve = (sched_max_luid + 1
4074 - VEC_length (sel_insn_data_def, s_i_d));
4075 if (reserve > 0
4076 && ! VEC_space (sel_insn_data_def, s_i_d, reserve))
4077 {
4078 int size;
4079
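  /* Grow geometrically (by half), but for very large functions cap the
     extra headroom at 1024 entries beyond sched_max_luid.  */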
4080 if (sched_max_luid / 2 > 1024)
4081 size = sched_max_luid + 1024;
4082 else
4083 size = 3 * sched_max_luid / 2;
4084
4085
4086 VEC_safe_grow_cleared (sel_insn_data_def, heap, s_i_d, size);
4087 }
4088 }
4089
4090 /* Finalize data structures for insns from current region. */
4091 static void
4092 finish_insns (void)
4093 {
4094 unsigned i;
4095
4096 /* Clear here all dependence contexts that may have left from insns that were
4097 removed during the scheduling. */
4098 for (i = 0; i < VEC_length (sel_insn_data_def, s_i_d); i++)
4099 {
4100 sel_insn_data_def *sid_entry = VEC_index (sel_insn_data_def, s_i_d, i);
4101
4102 if (sid_entry->live)
4103 return_regset_to_pool (sid_entry->live);
4104 if (sid_entry->analyzed_deps)
4105 {
4106 BITMAP_FREE (sid_entry->analyzed_deps);
4107 BITMAP_FREE (sid_entry->found_deps);
4108 htab_delete (sid_entry->transformed_insns);
4109 free_deps (&sid_entry->deps_context);
4110 }
4111 if (EXPR_VINSN (&sid_entry->expr))
4112 {
4113 clear_expr (&sid_entry->expr);
4114
4115 /* Also, clear CANT_MOVE bit here, because we really don't want it
4116 to be passed to the next region. */
4117 CANT_MOVE_BY_LUID (i) = 0;
4118 }
4119 }
4120
4121 VEC_free (sel_insn_data_def, heap, s_i_d);
4122 }
4123
4124 /* A proxy to pass initialization data to init_insn (). */
4125 static sel_insn_data_def _insn_init_ssid;
4126 static sel_insn_data_t insn_init_ssid = &_insn_init_ssid;
4127
4128 /* If true create a new vinsn. Otherwise use the one from EXPR. */
4129 static bool insn_init_create_new_vinsn_p;
4130
4131 /* Set all necessary data for initialization of the new insn[s]. */
4132 static expr_t
4133 set_insn_init (expr_t expr, vinsn_t vi, int seqno)
4134 {
4135 expr_t x = &insn_init_ssid->expr;
4136
4137 copy_expr_onside (x, expr);
4138 if (vi != NULL)
4139 {
4140 insn_init_create_new_vinsn_p = false;
4141 change_vinsn_in_expr (x, vi);
4142 }
4143 else
4144 insn_init_create_new_vinsn_p = true;
4145
4146 insn_init_ssid->seqno = seqno;
4147 return x;
4148 }
4149
4150 /* Init data for INSN. */
4151 static void
4152 init_insn_data (insn_t insn)
4153 {
4154 expr_t expr;
4155 sel_insn_data_t ssid = insn_init_ssid;
4156
4157 /* The fields mentioned below are special and hence are not being
4158 propagated to the new insns. */
4159 gcc_assert (!ssid->asm_p && ssid->sched_next == NULL
4160 && !ssid->after_stall_p && ssid->sched_cycle == 0);
4161 gcc_assert (INSN_P (insn) && INSN_LUID (insn) > 0);
4162
4163 expr = INSN_EXPR (insn);
4164 copy_expr (expr, &ssid->expr);
4165 prepare_insn_expr (insn, ssid->seqno);
4166
4167 if (insn_init_create_new_vinsn_p)
4168 change_vinsn_in_expr (expr, vinsn_create (insn, init_insn_force_unique_p));
4169
4170 if (first_time_insn_init (insn))
4171 init_first_time_insn_data (insn);
4172 }
4173
4174 /* This is used to initialize spurious jumps generated by
4175 sel_redirect_edge (). */
4176 static void
4177 init_simplejump_data (insn_t insn)
4178 {
4179 init_expr (INSN_EXPR (insn), vinsn_create (insn, false), 0,
4180 REG_BR_PROB_BASE, 0, 0, 0, 0, 0, 0, NULL, true, false, false,
4181 false, true);
4182 INSN_SEQNO (insn) = get_seqno_of_a_pred (insn);
4183 init_first_time_insn_data (insn);
4184 }
4185
4186 /* Perform deferred initialization of insns. This is used to process
4187 a new jump that may be created by redirect_edge. */
4188 void
4189 sel_init_new_insn (insn_t insn, int flags)
4190 {
4191 /* We create data structures for bb when the first insn is emitted in it. */
4192 if (INSN_P (insn)
4193 && INSN_IN_STREAM_P (insn)
4194 && insn_is_the_only_one_in_bb_p (insn))
4195 {
4196 extend_bb_info ();
4197 create_initial_data_sets (BLOCK_FOR_INSN (insn));
4198 }
4199
4200 if (flags & INSN_INIT_TODO_LUID)
4201 {
4202 sched_extend_luids ();
4203 sched_init_insn_luid (insn);
4204 }
4205
4206 if (flags & INSN_INIT_TODO_SSID)
4207 {
4208 extend_insn_data ();
4209 init_insn_data (insn);
4210 clear_expr (&insn_init_ssid->expr);
4211 }
4212
4213 if (flags & INSN_INIT_TODO_SIMPLEJUMP)
4214 {
4215 extend_insn_data ();
4216 init_simplejump_data (insn);
4217 }
4218
4219 gcc_assert (CONTAINING_RGN (BLOCK_NUM (insn))
4220 == CONTAINING_RGN (BB_TO_BLOCK (0)));
4221 }
4222 \f
4223
4224 /* Functions to init/finish work with lv sets. */
4225
4226 /* Init BB_LV_SET of BB from DF_LR_IN set of BB. */
4227 static void
4228 init_lv_set (basic_block bb)
4229 {
4230 gcc_assert (!BB_LV_SET_VALID_P (bb));
4231
4232 BB_LV_SET (bb) = get_regset_from_pool ();
4233 COPY_REG_SET (BB_LV_SET (bb), DF_LR_IN (bb));
4234 BB_LV_SET_VALID_P (bb) = true;
4235 }
4236
4237 /* Copy liveness information to BB from FROM_BB. */
4238 static void
4239 copy_lv_set_from (basic_block bb, basic_block from_bb)
4240 {
4241 gcc_assert (!BB_LV_SET_VALID_P (bb));
4242
4243 COPY_REG_SET (BB_LV_SET (bb), BB_LV_SET (from_bb));
4244 BB_LV_SET_VALID_P (bb) = true;
4245 }
4246
4247 /* Initialize lv set of all bb headers. */
4248 void
4249 init_lv_sets (void)
4250 {
4251 basic_block bb;
4252
4253 /* Initialize LV sets. */
4254 FOR_EACH_BB (bb)
4255 init_lv_set (bb);
4256
4257 /* Don't forget EXIT_BLOCK. */
4258 init_lv_set (EXIT_BLOCK_PTR);
4259 }
4260
4261 /* Release the lv set of BB. */
4262 static void
4263 free_lv_set (basic_block bb)
4264 {
4265 gcc_assert (BB_LV_SET (bb) != NULL);
4266
4267 return_regset_to_pool (BB_LV_SET (bb));
4268 BB_LV_SET (bb) = NULL;
4269 BB_LV_SET_VALID_P (bb) = false;
4270 }
4271
4272 /* Finalize lv sets of all bb headers. */
4273 void
4274 free_lv_sets (void)
4275 {
4276 basic_block bb;
4277
4278 /* Don't forget EXIT_BLOCK. */
4279 free_lv_set (EXIT_BLOCK_PTR);
4280
4281 /* Free LV sets. */
4282 FOR_EACH_BB (bb)
4283 if (BB_LV_SET (bb))
4284 free_lv_set (bb);
4285 }
4286
4287 /* Mark AV_SET for BB as invalid, so this set will be updated the next time
4288 compute_av() processes BB. This function is called when creating new basic
4289 blocks, as well as for blocks (either new or existing) where new jumps are
4290 created when the control flow is being updated. */
4291 static void
4292 invalidate_av_set (basic_block bb)
4293 {
4294 BB_AV_LEVEL (bb) = -1;
4295 }
4296
4297 /* Create initial data sets for BB (they will be invalid). */
4298 static void
4299 create_initial_data_sets (basic_block bb)
4300 {
4301 if (BB_LV_SET (bb))
4302 BB_LV_SET_VALID_P (bb) = false;
4303 else
4304 BB_LV_SET (bb) = get_regset_from_pool ();
4305 invalidate_av_set (bb);
4306 }
4307
4308 /* Free av set of BB. */
4309 static void
4310 free_av_set (basic_block bb)
4311 {
4312 av_set_clear (&BB_AV_SET (bb));
4313 BB_AV_LEVEL (bb) = 0;
4314 }
4315
4316 /* Free data sets of BB. */
4317 void
4318 free_data_sets (basic_block bb)
4319 {
4320 free_lv_set (bb);
4321 free_av_set (bb);
4322 }
4323
4324 /* Exchange lv sets of TO and FROM. */
4325 static void
4326 exchange_lv_sets (basic_block to, basic_block from)
4327 {
4328 {
4329 regset to_lv_set = BB_LV_SET (to);
4330
4331 BB_LV_SET (to) = BB_LV_SET (from);
4332 BB_LV_SET (from) = to_lv_set;
4333 }
4334
4335 {
4336 bool to_lv_set_valid_p = BB_LV_SET_VALID_P (to);
4337
4338 BB_LV_SET_VALID_P (to) = BB_LV_SET_VALID_P (from);
4339 BB_LV_SET_VALID_P (from) = to_lv_set_valid_p;
4340 }
4341 }
4342
4343
4344 /* Exchange av sets of TO and FROM. */
4345 static void
4346 exchange_av_sets (basic_block to, basic_block from)
4347 {
4348 {
4349 av_set_t to_av_set = BB_AV_SET (to);
4350
4351 BB_AV_SET (to) = BB_AV_SET (from);
4352 BB_AV_SET (from) = to_av_set;
4353 }
4354
4355 {
4356 int to_av_level = BB_AV_LEVEL (to);
4357
4358 BB_AV_LEVEL (to) = BB_AV_LEVEL (from);
4359 BB_AV_LEVEL (from) = to_av_level;
4360 }
4361 }
4362
4363 /* Exchange data sets of TO and FROM. */
4364 void
4365 exchange_data_sets (basic_block to, basic_block from)
4366 {
4367 exchange_lv_sets (to, from);
4368 exchange_av_sets (to, from);
4369 }
4370
4371 /* Copy data sets of FROM to TO. */
4372 void
4373 copy_data_sets (basic_block to, basic_block from)
4374 {
4375 gcc_assert (!BB_LV_SET_VALID_P (to) && !BB_AV_SET_VALID_P (to));
4376 gcc_assert (BB_AV_SET (to) == NULL);
4377
4378 BB_AV_LEVEL (to) = BB_AV_LEVEL (from);
4379 BB_LV_SET_VALID_P (to) = BB_LV_SET_VALID_P (from);
4380
4381 if (BB_AV_SET_VALID_P (from))
4382 {
4383 BB_AV_SET (to) = av_set_copy (BB_AV_SET (from));
4384 }
4385 if (BB_LV_SET_VALID_P (from))
4386 {
4387 gcc_assert (BB_LV_SET (to) != NULL);
4388 COPY_REG_SET (BB_LV_SET (to), BB_LV_SET (from));
4389 }
4390 }
4391
4392 /* Return an av set for INSN, if any. */
4393 av_set_t
4394 get_av_set (insn_t insn)
4395 {
4396 av_set_t av_set;
4397
4398 gcc_assert (AV_SET_VALID_P (insn));
4399
4400 if (sel_bb_head_p (insn))
4401 av_set = BB_AV_SET (BLOCK_FOR_INSN (insn));
4402 else
4403 av_set = NULL;
4404
4405 return av_set;
4406 }
4407
4408 /* Implementation of AV_LEVEL () macro. Return AV_LEVEL () of INSN. */
4409 int
4410 get_av_level (insn_t insn)
4411 {
4412 int av_level;
4413
4414 gcc_assert (INSN_P (insn));
4415
4416 if (sel_bb_head_p (insn))
4417 av_level = BB_AV_LEVEL (BLOCK_FOR_INSN (insn));
4418 else
4419 av_level = INSN_WS_LEVEL (insn);
4420
4421 return av_level;
4422 }
4423
4424 \f
4425
4426 /* Variables to work with control-flow graph. */
4427
4428 /* The basic blocks that have already been processed by sched_data_update (),
4429 but haven't been passed to sel_add_bb () yet. */
4430 static VEC (basic_block, heap) *last_added_blocks = NULL;
4431
4432 /* A pool for allocating successor infos. */
4433 static struct
4434 {
4435 /* A stack for saving succs_info structures. */
4436 struct succs_info *stack;
4437
4438 /* Its size. */
4439 int size;
4440
4441 /* Top of the stack. */
4442 int top;
4443
4444 /* Maximal value of the top. */
4445 int max_top;
4446 } succs_info_pool;
4447
4448 /* Functions to work with control-flow graph. */
4449
4450 /* Return the head insn of BB (the first real insn), or NULL_RTX if BB has no real insns. */
4451 insn_t
4452 sel_bb_head (basic_block bb)
4453 {
4454 insn_t head;
4455
4456 if (bb == EXIT_BLOCK_PTR)
4457 {
4458 gcc_assert (exit_insn != NULL_RTX);
4459 head = exit_insn;
4460 }
4461 else
4462 {
4463 insn_t note;
4464
4465 note = bb_note (bb);
4466 head = next_nonnote_insn (note);
4467
4468 if (head && (BARRIER_P (head) || BLOCK_FOR_INSN (head) != bb))
4469 head = NULL_RTX;
4470 }
4471
4472 return head;
4473 }
4474
4475 /* Return true if INSN is a basic block header. */
4476 bool
4477 sel_bb_head_p (insn_t insn)
4478 {
4479 return sel_bb_head (BLOCK_FOR_INSN (insn)) == insn;
4480 }
4481
4482 /* Return last insn of BB. */
4483 insn_t
4484 sel_bb_end (basic_block bb)
4485 {
4486 if (sel_bb_empty_p (bb))
4487 return NULL_RTX;
4488
4489 gcc_assert (bb != EXIT_BLOCK_PTR);
4490
4491 return BB_END (bb);
4492 }
4493
4494 /* Return true if INSN is the last insn in its basic block. */
4495 bool
4496 sel_bb_end_p (insn_t insn)
4497 {
4498 return insn == sel_bb_end (BLOCK_FOR_INSN (insn));
4499 }
4500
4501 /* Return true if BB consists of a single NOTE_INSN_BASIC_BLOCK. */
4502 bool
4503 sel_bb_empty_p (basic_block bb)
4504 {
4505 return sel_bb_head (bb) == NULL;
4506 }
4507
4508 /* True when BB belongs to the current scheduling region. */
4509 bool
4510 in_current_region_p (basic_block bb)
4511 {
4512 if (bb->index < NUM_FIXED_BLOCKS)
4513 return false;
4514
4515 return CONTAINING_RGN (bb->index) == CONTAINING_RGN (BB_TO_BLOCK (0));
4516 }
4517
4518 /* Return the block which is a fallthru bb of a conditional jump JUMP. */
4519 basic_block
4520 fallthru_bb_of_jump (rtx jump)
4521 {
4522 if (!JUMP_P (jump))
4523 return NULL;
4524
4525 if (!any_condjump_p (jump))
4526 return NULL;
4527
4528 /* A basic block that ends with a conditional jump may still have one successor
4529 (and be followed by a barrier); we are not interested in that case. */
4530 if (single_succ_p (BLOCK_FOR_INSN (jump)))
4531 return NULL;
4532
4533 return FALLTHRU_EDGE (BLOCK_FOR_INSN (jump))->dest;
4534 }
4535
4536 /* Remove all notes from BB. */
4537 static void
4538 init_bb (basic_block bb)
4539 {
4540 remove_notes (bb_note (bb), BB_END (bb));
4541 BB_NOTE_LIST (bb) = note_list;
4542 }
4543
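/* Initialize per-bb data structures for the basic blocks in BBS: strip their
   notes and record them in the per-bb note lists. */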
4544 void
4545 sel_init_bbs (bb_vec_t bbs)
4546 {
4547 const struct sched_scan_info_def ssi =
4548 {
4549 extend_bb_info, /* extend_bb */
4550 init_bb, /* init_bb */
4551 NULL, /* extend_insn */
4552 NULL /* init_insn */
4553 };
4554
4555 sched_scan (&ssi, bbs);
4556 }
4557
4558 /* Restore notes for the whole region. */
4559 static void
4560 sel_restore_notes (void)
4561 {
4562 int bb;
4563 insn_t insn;
4564
4565 for (bb = 0; bb < current_nr_blocks; bb++)
4566 {
4567 basic_block first, last;
4568
4569 first = EBB_FIRST_BB (bb);
4570 last = EBB_LAST_BB (bb)->next_bb;
4571
4572 do
4573 {
4574 note_list = BB_NOTE_LIST (first);
4575 restore_other_notes (NULL, first);
4576 BB_NOTE_LIST (first) = NULL_RTX;
4577
4578 FOR_BB_INSNS (first, insn)
4579 if (NONDEBUG_INSN_P (insn))
4580 reemit_notes (insn);
4581
4582 first = first->next_bb;
4583 }
4584 while (first != last);
4585 }
4586 }
4587
4588 /* Free per-bb data structures. */
4589 void
4590 sel_finish_bbs (void)
4591 {
4592 sel_restore_notes ();
4593
4594 /* Remove current loop preheader from this loop. */
4595 if (current_loop_nest)
4596 sel_remove_loop_preheader ();
4597
4598 finish_region_bb_info ();
4599 }
4600
4601 /* Return true if INSN has a single successor of type FLAGS. */
4602 bool
4603 sel_insn_has_single_succ_p (insn_t insn, int flags)
4604 {
4605 insn_t succ;
4606 succ_iterator si;
4607 bool first_p = true;
4608
4609 FOR_EACH_SUCC_1 (succ, si, insn, flags)
4610 {
4611 if (first_p)
4612 first_p = false;
4613 else
4614 return false;
4615 }
4616
4617 return true;
4618 }
4619
4620 /* Allocate successor's info. */
4621 static struct succs_info *
4622 alloc_succs_info (void)
4623 {
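  /* Stack slots are allocated lazily: the first time a given depth is
     reached, create fresh vectors for it; afterwards the slot is reused.  */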
4624 if (succs_info_pool.top == succs_info_pool.max_top)
4625 {
4626 int i;
4627
4628 if (++succs_info_pool.max_top >= succs_info_pool.size)
4629 gcc_unreachable ();
4630
4631 i = ++succs_info_pool.top;
4632 succs_info_pool.stack[i].succs_ok = VEC_alloc (rtx, heap, 10);
4633 succs_info_pool.stack[i].succs_other = VEC_alloc (rtx, heap, 10);
4634 succs_info_pool.stack[i].probs_ok = VEC_alloc (int, heap, 10);
4635 }
4636 else
4637 succs_info_pool.top++;
4638
4639 return &succs_info_pool.stack[succs_info_pool.top];
4640 }
4641
4642 /* Free successor's info. */
4643 void
4644 free_succs_info (struct succs_info * sinfo)
4645 {
4646 gcc_assert (succs_info_pool.top >= 0
4647 && &succs_info_pool.stack[succs_info_pool.top] == sinfo);
4648 succs_info_pool.top--;
4649
4650 /* Clear stale info. */
4651 VEC_block_remove (rtx, sinfo->succs_ok,
4652 0, VEC_length (rtx, sinfo->succs_ok));
4653 VEC_block_remove (rtx, sinfo->succs_other,
4654 0, VEC_length (rtx, sinfo->succs_other));
4655 VEC_block_remove (int, sinfo->probs_ok,
4656 0, VEC_length (int, sinfo->probs_ok));
4657 sinfo->all_prob = 0;
4658 sinfo->succs_ok_n = 0;
4659 sinfo->all_succs_n = 0;
4660 }
4661
4662 /* Compute successor info for INSN. FLAGS are the flags passed
4663 to the FOR_EACH_SUCC_1 iterator. */
4664 struct succs_info *
4665 compute_succs_info (insn_t insn, short flags)
4666 {
4667 succ_iterator si;
4668 insn_t succ;
4669 struct succs_info *sinfo = alloc_succs_info ();
4670
4671 /* Traverse *all* successors and decide what to do with each. */
4672 FOR_EACH_SUCC_1 (succ, si, insn, SUCCS_ALL)
4673 {
4674 /* FIXME: this doesn't work for skipping to loop exits, as we don't
4675 perform code motion through inner loops. */
4676 short current_flags = si.current_flags & ~SUCCS_SKIP_TO_LOOP_EXITS;
4677
4678 if (current_flags & flags)
4679 {
4680 VEC_safe_push (rtx, heap, sinfo->succs_ok, succ);
4681 VEC_safe_push (int, heap, sinfo->probs_ok,
4682 /* FIXME: Improve calculation when skipping
4683 inner loop to exits. */
4684 (si.bb_end
4685 ? si.e1->probability
4686 : REG_BR_PROB_BASE));
4687 sinfo->succs_ok_n++;
4688 }
4689 else
4690 VEC_safe_push (rtx, heap, sinfo->succs_other, succ);
4691
4692 /* Compute all_prob. */
4693 if (!si.bb_end)
4694 sinfo->all_prob = REG_BR_PROB_BASE;
4695 else
4696 sinfo->all_prob += si.e1->probability;
4697
4698 sinfo->all_succs_n++;
4699 }
4700
4701 return sinfo;
4702 }
4703
4704 /* Return the predecessors of BB in PREDS and their number in N.
4705 Empty blocks are skipped. SIZE is used to allocate PREDS. */
4706 static void
4707 cfg_preds_1 (basic_block bb, insn_t **preds, int *n, int *size)
4708 {
4709 edge e;
4710 edge_iterator ei;
4711
4712 gcc_assert (BLOCK_TO_BB (bb->index) != 0);
4713
4714 FOR_EACH_EDGE (e, ei, bb->preds)
4715 {
4716 basic_block pred_bb = e->src;
4717 insn_t bb_end = BB_END (pred_bb);
4718
4719 if (!in_current_region_p (pred_bb))
4720 {
4721 gcc_assert (flag_sel_sched_pipelining_outer_loops
4722 && current_loop_nest);
4723 continue;
4724 }
4725
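      /* An empty predecessor does not count by itself; recurse to collect
         its own predecessors instead.  */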
4726 if (sel_bb_empty_p (pred_bb))
4727 cfg_preds_1 (pred_bb, preds, n, size);
4728 else
4729 {
4730 if (*n == *size)
4731 *preds = XRESIZEVEC (insn_t, *preds,
4732 (*size = 2 * *size + 1));
4733 (*preds)[(*n)++] = bb_end;
4734 }
4735 }
4736
4737 gcc_assert (*n != 0
4738 || (flag_sel_sched_pipelining_outer_loops
4739 && current_loop_nest));
4740 }
4741
4742 /* Find all predecessors of BB and record them in PREDS and their number
4743 in N. Empty blocks are skipped, and only normal (forward in-region)
4744 edges are processed. */
4745 static void
4746 cfg_preds (basic_block bb, insn_t **preds, int *n)
4747 {
4748 int size = 0;
4749
4750 *preds = NULL;
4751 *n = 0;
4752 cfg_preds_1 (bb, preds, n, &size);
4753 }
4754
4755 /* Returns true if we are moving INSN through a join point. */
4756 bool
4757 sel_num_cfg_preds_gt_1 (insn_t insn)
4758 {
4759 basic_block bb;
4760
4761 if (!sel_bb_head_p (insn) || INSN_BB (insn) == 0)
4762 return false;
4763
4764 bb = BLOCK_FOR_INSN (insn);
4765
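  /* Walk up the chain of empty single-pred blocks; a join point anywhere
     on this chain means INSN is moved through a join.  */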
4766 while (1)
4767 {
4768 if (EDGE_COUNT (bb->preds) > 1)
4769 return true;
4770
4771 gcc_assert (EDGE_PRED (bb, 0)->dest == bb);
4772 bb = EDGE_PRED (bb, 0)->src;
4773
4774 if (!sel_bb_empty_p (bb))
4775 break;
4776 }
4777
4778 return false;
4779 }
4780
4781 /* Returns true when BB should be the end of an ebb. Adapted from the
4782 code in sched-ebb.c. */
4783 bool
4784 bb_ends_ebb_p (basic_block bb)
4785 {
4786 basic_block next_bb = bb_next_bb (bb);
4787 edge e;
4788
4789 if (next_bb == EXIT_BLOCK_PTR
4790 || bitmap_bit_p (forced_ebb_heads, next_bb->index)
4791 || (LABEL_P (BB_HEAD (next_bb))
4792 /* NB: LABEL_NUSES () is not maintained outside of jump.c.
4793 Work around that. */
4794 && !single_pred_p (next_bb)))
4795 return true;
4796
4797 if (!in_current_region_p (next_bb))
4798 return true;
4799
4800 e = find_fallthru_edge (bb->succs);
4801 if (e)
4802 {
4803 gcc_assert (e->dest == next_bb);
4804
4805 return false;
4806 }
4807
4808 return true;
4809 }
4810
4811 /* Returns true when INSN and SUCC are in the same EBB, given that SUCC is a
4812 successor of INSN. */
4813 bool
4814 in_same_ebb_p (insn_t insn, insn_t succ)
4815 {
4816 basic_block ptr = BLOCK_FOR_INSN (insn);
4817
4818 for (;;)
4819 {
4820 if (ptr == BLOCK_FOR_INSN (succ))
4821 return true;
4822
4823 if (bb_ends_ebb_p (ptr))
4824 return false;
4825
4826 ptr = bb_next_bb (ptr);
4827 }
4828
4829 gcc_unreachable ();
4830 return false;
4831 }
4832
4833 /* Recomputes the reverse topological order for the function and
4834 saves it in REV_TOP_ORDER_INDEX. REV_TOP_ORDER_INDEX_LEN is also
4835 modified appropriately. */
4836 static void
4837 recompute_rev_top_order (void)
4838 {
4839 int *postorder;
4840 int n_blocks, i;
4841
4842 if (!rev_top_order_index || rev_top_order_index_len < last_basic_block)
4843 {
4844 rev_top_order_index_len = last_basic_block;
4845 rev_top_order_index = XRESIZEVEC (int, rev_top_order_index,
4846 rev_top_order_index_len);
4847 }
4848
4849 postorder = XNEWVEC (int, n_basic_blocks);
4850
4851 n_blocks = post_order_compute (postorder, true, false);
4852 gcc_assert (n_basic_blocks == n_blocks);
4853
4854 /* Build the reverse function: for each basic block with BB->INDEX == K
4855 rev_top_order_index[K] is its reverse topological sort number. */
4856 for (i = 0; i < n_blocks; i++)
4857 {
4858 gcc_assert (postorder[i] < rev_top_order_index_len);
4859 rev_top_order_index[postorder[i]] = i;
4860 }
4861
4862 free (postorder);
4863 }
4864
4865 /* Clear all flags from insns in BB that could spoil its rescheduling. */
4866 void
4867 clear_outdated_rtx_info (basic_block bb)
4868 {
4869 rtx insn;
4870
4871 FOR_BB_INSNS (bb, insn)
4872 if (INSN_P (insn))
4873 {
4874 SCHED_GROUP_P (insn) = 0;
4875 INSN_AFTER_STALL_P (insn) = 0;
4876 INSN_SCHED_TIMES (insn) = 0;
4877 EXPR_PRIORITY_ADJ (INSN_EXPR (insn)) = 0;
4878
4879 /* We cannot use the changed caches, as previously we could ignore
4880 the LHS dependence due to enabled renaming and transform
4881 the expression, and currently we'll be unable to do this. */
4882 htab_empty (INSN_TRANSFORMED_INSNS (insn));
4883 }
4884 }
4885
4886 /* Add the note of BB to the pool of available basic block notes. */
4887 static void
4888 return_bb_to_pool (basic_block bb)
4889 {
4890 rtx note = bb_note (bb);
4891
4892 gcc_assert (NOTE_BASIC_BLOCK (note) == bb
4893 && bb->aux == NULL);
4894
4895 /* It turns out that current cfg infrastructure does not support
4896 reuse of basic blocks. Don't bother for now. */
4897 /*VEC_safe_push (rtx, heap, bb_note_pool, note);*/
4898 }
4899
4900 /* Get a bb_note from pool or return NULL_RTX if pool is empty. */
4901 static rtx
4902 get_bb_note_from_pool (void)
4903 {
4904 if (VEC_empty (rtx, bb_note_pool))
4905 return NULL_RTX;
4906 else
4907 {
4908 rtx note = VEC_pop (rtx, bb_note_pool);
4909
4910 PREV_INSN (note) = NULL_RTX;
4911 NEXT_INSN (note) = NULL_RTX;
4912
4913 return note;
4914 }
4915 }
4916
4917 /* Free bb_note_pool. */
4918 void
4919 free_bb_note_pool (void)
4920 {
4921 VEC_free (rtx, heap, bb_note_pool);
4922 }
4923
4924 /* Setup scheduler pool and successor structure. */
4925 void
4926 alloc_sched_pools (void)
4927 {
4928 int succs_size;
4929
4930 succs_size = MAX_WS + 1;
4931 succs_info_pool.stack = XCNEWVEC (struct succs_info, succs_size);
4932 succs_info_pool.size = succs_size;
4933 succs_info_pool.top = -1;
4934 succs_info_pool.max_top = -1;
4935
4936 sched_lists_pool = create_alloc_pool ("sel-sched-lists",
4937 sizeof (struct _list_node), 500);
4938 }
4939
4940 /* Free the pools. */
4941 void
4942 free_sched_pools (void)
4943 {
4944 int i;
4945
4946 free_alloc_pool (sched_lists_pool);
4947 gcc_assert (succs_info_pool.top == -1);
4948 for (i = 0; i <= succs_info_pool.max_top; i++)
4949 {
4950 VEC_free (rtx, heap, succs_info_pool.stack[i].succs_ok);
4951 VEC_free (rtx, heap, succs_info_pool.stack[i].succs_other);
4952 VEC_free (int, heap, succs_info_pool.stack[i].probs_ok);
4953 }
4954 free (succs_info_pool.stack);
4955 }
4956 \f
4957
4958 /* Returns a position in RGN where BB can be inserted retaining
4959 topological order. */
4960 static int
4961 find_place_to_insert_bb (basic_block bb, int rgn)
4962 {
4963 bool has_preds_outside_rgn = false;
4964 edge e;
4965 edge_iterator ei;
4966
4967 /* Find whether we have preds outside the region. */
4968 FOR_EACH_EDGE (e, ei, bb->preds)
4969 if (!in_current_region_p (e->src))
4970 {
4971 has_preds_outside_rgn = true;
4972 break;
4973 }
4974
4975 /* Recompute the top order -- needed when we have > 1 pred
4976 and in case we don't have preds outside. */
4977 if (flag_sel_sched_pipelining_outer_loops
4978 && (has_preds_outside_rgn || EDGE_COUNT (bb->preds) > 1))
4979 {
4980 int i, bbi = bb->index, cur_bbi;
4981
4982 recompute_rev_top_order ();
4983 for (i = RGN_NR_BLOCKS (rgn) - 1; i >= 0; i--)
4984 {
4985 cur_bbi = BB_TO_BLOCK (i);
4986 if (rev_top_order_index[bbi]
4987 < rev_top_order_index[cur_bbi])
4988 break;
4989 }
4990
4991 /* We skipped the right block, so we increase i to insert after it;
4992 the caller will add one by itself, so we decrease i back here. */
4993 return (i + 1) - 1;
4994 }
4995 else if (has_preds_outside_rgn)
4996 {
4997 /* This is the case when we generate an extra empty block
4998 to serve as region head during pipelining. */
4999 e = EDGE_SUCC (bb, 0);
5000 gcc_assert (EDGE_COUNT (bb->succs) == 1
5001 && in_current_region_p (EDGE_SUCC (bb, 0)->dest)
5002 && (BLOCK_TO_BB (e->dest->index) == 0));
5003 return -1;
5004 }
5005
5006 /* We don't have preds outside the region. We should have
5007 the only pred, because the multiple preds case comes from
5008 the pipelining of outer loops, and that is handled above.
5009 Just take the bbi of this single pred. */
5010 if (EDGE_COUNT (bb->succs) > 0)
5011 {
5012 int pred_bbi;
5013
5014 gcc_assert (EDGE_COUNT (bb->preds) == 1);
5015
5016 pred_bbi = EDGE_PRED (bb, 0)->src->index;
5017 return BLOCK_TO_BB (pred_bbi);
5018 }
5019 else
5020 /* BB has no successors. It is safe to put it in the end. */
5021 return current_nr_blocks - 1;
5022 }
5023
5024 /* Deletes an empty basic block freeing its data. */
5025 static void
5026 delete_and_free_basic_block (basic_block bb)
5027 {
5028 gcc_assert (sel_bb_empty_p (bb));
5029
5030 if (BB_LV_SET (bb))
5031 free_lv_set (bb);
5032
5033 bitmap_clear_bit (blocks_to_reschedule, bb->index);
5034
5035 /* Can't assert av_set properties because we use sel_remove_bb
5036 when removing loop preheader from the region. At the point of
5037 removing the preheader we already have deallocated sel_region_bb_info. */
5038 gcc_assert (BB_LV_SET (bb) == NULL
5039 && !BB_LV_SET_VALID_P (bb)
5040 && BB_AV_LEVEL (bb) == 0
5041 && BB_AV_SET (bb) == NULL);
5042
5043 delete_basic_block (bb);
5044 }
5045
5046 /* Add BB to the current region and update the region data. */
5047 static void
5048 add_block_to_current_region (basic_block bb)
5049 {
5050 int i, pos, bbi = -2, rgn;
5051
5052 rgn = CONTAINING_RGN (BB_TO_BLOCK (0));
5053 bbi = find_place_to_insert_bb (bb, rgn);
5054 bbi += 1;
5055 pos = RGN_BLOCKS (rgn) + bbi;
5056
5057 gcc_assert (RGN_HAS_REAL_EBB (rgn) == 0
5058 && ebb_head[bbi] == pos);
5059
5060 /* Make a place for the new block. */
5061 extend_regions ();
5062
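  /* Blocks of this region at or after POS shift one slot up; bump their
     ordinal numbers before moving rgn_bb_table itself.  */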
5063 for (i = RGN_BLOCKS (rgn + 1) - 1; i >= pos; i--)
5064 BLOCK_TO_BB (rgn_bb_table[i])++;
5065
5066 memmove (rgn_bb_table + pos + 1,
5067 rgn_bb_table + pos,
5068 (RGN_BLOCKS (nr_regions) - pos) * sizeof (*rgn_bb_table));
5069
5070 /* Initialize data for BB. */
5071 rgn_bb_table[pos] = bb->index;
5072 BLOCK_TO_BB (bb->index) = bbi;
5073 CONTAINING_RGN (bb->index) = rgn;
5074
5075 RGN_NR_BLOCKS (rgn)++;
5076
5077 for (i = rgn + 1; i <= nr_regions; i++)
5078 RGN_BLOCKS (i)++;
5079 }
5080
5081 /* Remove BB from the current region and update the region data. */
5082 static void
5083 remove_bb_from_region (basic_block bb)
5084 {
5085 int i, pos, bbi = -2, rgn;
5086
5087 rgn = CONTAINING_RGN (BB_TO_BLOCK (0));
5088 bbi = BLOCK_TO_BB (bb->index);
5089 pos = RGN_BLOCKS (rgn) + bbi;
5090
5091 gcc_assert (RGN_HAS_REAL_EBB (rgn) == 0
5092 && ebb_head[bbi] == pos);
5093
5094 for (i = RGN_BLOCKS (rgn + 1) - 1; i >= pos; i--)
5095 BLOCK_TO_BB (rgn_bb_table[i])--;
5096
5097 memmove (rgn_bb_table + pos,
5098 rgn_bb_table + pos + 1,
5099 (RGN_BLOCKS (nr_regions) - pos) * sizeof (*rgn_bb_table));
5100
5101 RGN_NR_BLOCKS (rgn)--;
5102 for (i = rgn + 1; i <= nr_regions; i++)
5103 RGN_BLOCKS (i)--;
5104 }
5105
5106 /* Add BB to the current region and update all data. If BB is NULL, add all
5107 blocks from last_added_blocks vector. */
5108 static void
5109 sel_add_bb (basic_block bb)
5110 {
5111 /* Extend luids so that new notes will receive zero luids. */
5112 sched_extend_luids ();
5113 sched_init_bbs ();
5114 sel_init_bbs (last_added_blocks);
5115
5116 /* When bb is passed explicitly, the vector should contain
5117 the single element equal to bb; in any case, the vector
5118 must not be NULL. */
5119 gcc_assert (last_added_blocks != NULL);
5120
5121 if (bb != NULL)
5122 {
5123 gcc_assert (VEC_length (basic_block, last_added_blocks) == 1
5124 && VEC_index (basic_block,
5125 last_added_blocks, 0) == bb);
5126 add_block_to_current_region (bb);
5127
5128 /* We associate creating/deleting data sets with the first insn
5129 appearing / disappearing in the bb. */
5130 if (!sel_bb_empty_p (bb) && BB_LV_SET (bb) == NULL)
5131 create_initial_data_sets (bb);
5132
5133 VEC_free (basic_block, heap, last_added_blocks);
5134 }
5135 else
5136 /* BB is NULL - process LAST_ADDED_BLOCKS instead. */
5137 {
5138 int i;
5139 basic_block temp_bb = NULL;
5140
5141 for (i = 0;
5142 VEC_iterate (basic_block, last_added_blocks, i, bb); i++)
5143 {
5144 add_block_to_current_region (bb);
5145 temp_bb = bb;
5146 }
5147
5148 /* We need to fetch at least one bb so we know the region
5149 to update. */
5150 gcc_assert (temp_bb != NULL);
5151 bb = temp_bb;
5152
5153 VEC_free (basic_block, heap, last_added_blocks);
5154 }
5155
5156 rgn_setup_region (CONTAINING_RGN (bb->index));
5157 }
5158
5159 /* Remove BB from the current region and update all data.
5160 If REMOVE_FROM_CFG_P is true, also remove the block from the CFG. */
5161 static void
5162 sel_remove_bb (basic_block bb, bool remove_from_cfg_p)
5163 {
5164 unsigned idx = bb->index;
5165
5166 gcc_assert (bb != NULL && BB_NOTE_LIST (bb) == NULL_RTX);
5167
5168 remove_bb_from_region (bb);
5169 return_bb_to_pool (bb);
5170 bitmap_clear_bit (blocks_to_reschedule, idx);
5171
5172 if (remove_from_cfg_p)
5173 {
5174 basic_block succ = single_succ (bb);
5175 delete_and_free_basic_block (bb);
5176 set_immediate_dominator (CDI_DOMINATORS, succ,
5177 recompute_dominator (CDI_DOMINATORS, succ));
5178 }
5179
5180 rgn_setup_region (CONTAINING_RGN (idx));
5181 }
5182
5183 /* Concatenate info of EMPTY_BB to info of MERGE_BB. */
5184 static void
5185 move_bb_info (basic_block merge_bb, basic_block empty_bb)
5186 {
5187 gcc_assert (in_current_region_p (merge_bb));
5188
5189 concat_note_lists (BB_NOTE_LIST (empty_bb),
5190 &BB_NOTE_LIST (merge_bb));
5191 BB_NOTE_LIST (empty_bb) = NULL_RTX;
5192
5193 }
5194
5195 /* Remove EMPTY_BB. If REMOVE_FROM_CFG_P is false, remove EMPTY_BB from
5196 region, but keep it in CFG. */
5197 static void
5198 remove_empty_bb (basic_block empty_bb, bool remove_from_cfg_p)
5199 {
5200 /* The block should contain just a note or a label.
5201 We try to check whether it is unused below. */
5202 gcc_assert (BB_HEAD (empty_bb) == BB_END (empty_bb)
5203 || LABEL_P (BB_HEAD (empty_bb)));
5204
5205 /* If basic block has predecessors or successors, redirect them. */
5206 if (remove_from_cfg_p
5207 && (EDGE_COUNT (empty_bb->preds) > 0
5208 || EDGE_COUNT (empty_bb->succs) > 0))
5209 {
5210 basic_block pred;
5211 basic_block succ;
5212
5213 /* We need to init PRED and SUCC before redirecting edges. */
5214 if (EDGE_COUNT (empty_bb->preds) > 0)
5215 {
5216 edge e;
5217
5218 gcc_assert (EDGE_COUNT (empty_bb->preds) == 1);
5219
5220 e = EDGE_PRED (empty_bb, 0);
5221 gcc_assert (e->src == empty_bb->prev_bb
5222 && (e->flags & EDGE_FALLTHRU));
5223
5224 pred = empty_bb->prev_bb;
5225 }
5226 else
5227 pred = NULL;
5228
5229 if (EDGE_COUNT (empty_bb->succs) > 0)
5230 {
5231 /* We do not check fallthruness here as above, because
5232 after removing a jump the edge may actually not be fallthru. */
5233 gcc_assert (EDGE_COUNT (empty_bb->succs) == 1);
5234 succ = EDGE_SUCC (empty_bb, 0)->dest;
5235 }
5236 else
5237 succ = NULL;
5238
5239 if (EDGE_COUNT (empty_bb->preds) > 0 && succ != NULL)
5240 {
5241 edge e = EDGE_PRED (empty_bb, 0);
5242
5243 if (e->flags & EDGE_FALLTHRU)
5244 redirect_edge_succ_nodup (e, succ);
5245 else
5246 sel_redirect_edge_and_branch (EDGE_PRED (empty_bb, 0), succ);
5247 }
5248
5249 if (EDGE_COUNT (empty_bb->succs) > 0 && pred != NULL)
5250 {
5251 edge e = EDGE_SUCC (empty_bb, 0);
5252
5253 if (find_edge (pred, e->dest) == NULL)
5254 redirect_edge_pred (e, pred);
5255 }
5256 }
5257
5258 /* Finish removing. */
5259 sel_remove_bb (empty_bb, remove_from_cfg_p);
5260 }
5261
5262 /* An implementation of create_basic_block hook, which additionally updates
5263 per-bb data structures. */
5264 static basic_block
5265 sel_create_basic_block (void *headp, void *endp, basic_block after)
5266 {
5267 basic_block new_bb;
5268 insn_t new_bb_note;
5269
5270 gcc_assert (flag_sel_sched_pipelining_outer_loops
5271 || last_added_blocks == NULL);
5272
5273 new_bb_note = get_bb_note_from_pool ();
5274
5275 if (new_bb_note == NULL_RTX)
5276 new_bb = orig_cfg_hooks.create_basic_block (headp, endp, after);
5277 else
5278 {
5279 new_bb = create_basic_block_structure ((rtx) headp, (rtx) endp,
5280 new_bb_note, after);
5281 new_bb->aux = NULL;
5282 }
5283
5284 VEC_safe_push (basic_block, heap, last_added_blocks, new_bb);
5285
5286 return new_bb;
5287 }
5288
5289 /* Implement sched_init_only_bb (). */
5290 static void
5291 sel_init_only_bb (basic_block bb, basic_block after)
5292 {
5293 gcc_assert (after == NULL);
5294
5295 extend_regions ();
5296 rgn_make_new_region_out_of_new_block (bb);
5297 }
5298
5299 /* Update the latch when we've split or merged it from FROM block to TO.
5300 This should be checked for all outer loops, too. */
5301 static void
5302 change_loops_latches (basic_block from, basic_block to)
5303 {
5304 gcc_assert (from != to);
5305
5306 if (current_loop_nest)
5307 {
5308 struct loop *loop;
5309
5310 for (loop = current_loop_nest; loop; loop = loop_outer (loop))
5311 if (considered_for_pipelining_p (loop) && loop->latch == from)
5312 {
5313 gcc_assert (loop == current_loop_nest);
5314 loop->latch = to;
5315 gcc_assert (loop_latch_edge (loop));
5316 }
5317 }
5318 }
5319
5320 /* Splits BB into two basic blocks, adding the new one to the region and
5321 extending per-bb data structures. Returns the newly created bb. */
5322 static basic_block
5323 sel_split_block (basic_block bb, rtx after)
5324 {
5325 basic_block new_bb;
5326 insn_t insn;
5327
5328 new_bb = sched_split_block_1 (bb, after);
5329 sel_add_bb (new_bb);
5330
5331 /* This should be called after sel_add_bb, because this uses
5332 CONTAINING_RGN for the new block, which is not yet initialized.
5333 FIXME: this function may be a no-op now. */
5334 change_loops_latches (bb, new_bb);
5335
5336 /* Update ORIG_BB_INDEX for insns moved into the new block. */
5337 FOR_BB_INSNS (new_bb, insn)
5338 if (INSN_P (insn))
5339 EXPR_ORIG_BB_INDEX (INSN_EXPR (insn)) = new_bb->index;
5340
5341 if (sel_bb_empty_p (bb))
5342 {
5343 gcc_assert (!sel_bb_empty_p (new_bb));
5344
5345 /* NEW_BB has data sets that need to be updated and BB holds
5346 data sets that should be removed. Exchange these data sets
5347 so that we won't lose BB's valid data sets. */
5348 exchange_data_sets (new_bb, bb);
5349 free_data_sets (bb);
5350 }
5351
5352 if (!sel_bb_empty_p (new_bb)
5353 && bitmap_bit_p (blocks_to_reschedule, bb->index))
5354 bitmap_set_bit (blocks_to_reschedule, new_bb->index);
5355
5356 return new_bb;
5357 }
5358
5359 /* If BB ends with a jump insn whose UID is at least PREV_MAX_UID, return it.
5360 Otherwise return NULL. */
5361 static rtx
5362 check_for_new_jump (basic_block bb, int prev_max_uid)
5363 {
5364 rtx end;
5365
5366 end = sel_bb_end (bb);
5367 if (end && INSN_UID (end) >= prev_max_uid)
5368 return end;
5369 return NULL;
5370 }
5371
5372 /* Look for a new jump either in the FROM block or in the newly created JUMP_BB block.
5373 New means having a UID at least equal to PREV_MAX_UID. */
5374 static rtx
5375 find_new_jump (basic_block from, basic_block jump_bb, int prev_max_uid)
5376 {
5377 rtx jump;
5378
5379 /* Return immediately if no new insns were emitted. */
5380 if (get_max_uid () == prev_max_uid)
5381 return NULL;
5382
5383 /* Now check both blocks for new jumps. There will only ever be one. */
5384 if ((jump = check_for_new_jump (from, prev_max_uid)))
5385 return jump;
5386
5387 if (jump_bb != NULL
5388 && (jump = check_for_new_jump (jump_bb, prev_max_uid)))
5389 return jump;
5390 return NULL;
5391 }
5392
5393 /* Splits E and adds the newly created basic block to the current region.
5394 Returns this basic block. */
5395 basic_block
5396 sel_split_edge (edge e)
5397 {
5398 basic_block new_bb, src, other_bb = NULL;
5399 int prev_max_uid;
5400 rtx jump;
5401
5402 src = e->src;
5403 prev_max_uid = get_max_uid ();
5404 new_bb = split_edge (e);
5405
5406 if (flag_sel_sched_pipelining_outer_loops
5407 && current_loop_nest)
5408 {
5409 int i;
5410 basic_block bb;
5411
5412 /* Some of the basic blocks might not have been added to the loop.
5413 Add them here, until this is fixed in force_fallthru. */
5414 for (i = 0;
5415 VEC_iterate (basic_block, last_added_blocks, i, bb); i++)
5416 if (!bb->loop_father)
5417 {
5418 add_bb_to_loop (bb, e->dest->loop_father);
5419
5420 gcc_assert (!other_bb && (new_bb->index != bb->index));
5421 other_bb = bb;
5422 }
5423 }
5424
5425 /* Add all last_added_blocks to the region. */
5426 sel_add_bb (NULL);
5427
5428 jump = find_new_jump (src, new_bb, prev_max_uid);
5429 if (jump)
5430 sel_init_new_insn (jump, INSN_INIT_TODO_LUID | INSN_INIT_TODO_SIMPLEJUMP);
5431
5432 /* Put the correct lv set on this block. */
5433 if (other_bb && !sel_bb_empty_p (other_bb))
5434 compute_live (sel_bb_head (other_bb));
5435
5436 return new_bb;
5437 }
5438
5439 /* Implement sched_create_empty_bb (). */
5440 static basic_block
5441 sel_create_empty_bb (basic_block after)
5442 {
5443 basic_block new_bb;
5444
5445 new_bb = sched_create_empty_bb_1 (after);
5446
5447 /* We'll explicitly initialize NEW_BB via sel_init_only_bb () a bit
5448 later. */
5449 gcc_assert (VEC_length (basic_block, last_added_blocks) == 1
5450 && VEC_index (basic_block, last_added_blocks, 0) == new_bb);
5451
5452 VEC_free (basic_block, heap, last_added_blocks);
5453 return new_bb;
5454 }
5455
5456 /* Implement sched_create_recovery_block. ORIG_INSN is where the block
5457 will be split to insert a check. */
5458 basic_block
5459 sel_create_recovery_block (insn_t orig_insn)
5460 {
5461 basic_block first_bb, second_bb, recovery_block;
5462 basic_block before_recovery = NULL;
5463 rtx jump;
5464
5465 first_bb = BLOCK_FOR_INSN (orig_insn);
5466 if (sel_bb_end_p (orig_insn))
5467 {
5468 /* Avoid introducing an empty block while splitting. */
5469 gcc_assert (single_succ_p (first_bb));
5470 second_bb = single_succ (first_bb);
5471 }
5472 else
5473 second_bb = sched_split_block (first_bb, orig_insn);
5474
5475 recovery_block = sched_create_recovery_block (&before_recovery);
5476 if (before_recovery)
5477 copy_lv_set_from (before_recovery, EXIT_BLOCK_PTR);
5478
5479 gcc_assert (sel_bb_empty_p (recovery_block));
5480 sched_create_recovery_edges (first_bb, recovery_block, second_bb);
5481 if (current_loops != NULL)
5482 add_bb_to_loop (recovery_block, first_bb->loop_father);
5483
5484 sel_add_bb (recovery_block);
5485
5486 jump = BB_END (recovery_block);
5487 gcc_assert (sel_bb_head (recovery_block) == jump);
5488 sel_init_new_insn (jump, INSN_INIT_TODO_LUID | INSN_INIT_TODO_SIMPLEJUMP);
5489
5490 return recovery_block;
5491 }
5492
5493 /* Merge basic block B into basic block A. */
5494 static void
5495 sel_merge_blocks (basic_block a, basic_block b)
5496 {
5497 gcc_assert (sel_bb_empty_p (b)
5498 && EDGE_COUNT (b->preds) == 1
5499 && EDGE_PRED (b, 0)->src == b->prev_bb);
5500
5501 move_bb_info (b->prev_bb, b);
5502 remove_empty_bb (b, false);
5503 merge_blocks (a, b);
5504 change_loops_latches (b, a);
5505 }
5506
5507 /* A wrapper for redirect_edge_and_branch_force, which also initializes
5508 data structures for the possibly created bb and insns. Unlike
5509 sel_redirect_edge_and_branch, this function does not return a value. */
5510 void
5511 sel_redirect_edge_and_branch_force (edge e, basic_block to)
5512 {
5513 basic_block jump_bb, src, orig_dest = e->dest;
5514 int prev_max_uid;
5515 rtx jump;
5516
5517 /* This function is now used only for bookkeeping code creation, where
5518 we'll never get the single pred of orig_dest block and thus will not
5519 hit unreachable blocks when updating dominator info. */
5520 gcc_assert (!sel_bb_empty_p (e->src)
5521 && !single_pred_p (orig_dest));
5522 src = e->src;
5523 prev_max_uid = get_max_uid ();
5524 jump_bb = redirect_edge_and_branch_force (e, to);
5525
5526 if (jump_bb != NULL)
5527 sel_add_bb (jump_bb);
5528
5529 /* As used now, this function cannot spoil the loop structure, so we do
5530 not need to update anything here. But check it to be sure. */
5531 if (current_loop_nest
5532 && pipelining_p)
5533 gcc_assert (loop_latch_edge (current_loop_nest));
5534
5535 jump = find_new_jump (src, jump_bb, prev_max_uid);
5536 if (jump)
5537 sel_init_new_insn (jump, INSN_INIT_TODO_LUID | INSN_INIT_TODO_SIMPLEJUMP);
5538 set_immediate_dominator (CDI_DOMINATORS, to,
5539 recompute_dominator (CDI_DOMINATORS, to));
5540 set_immediate_dominator (CDI_DOMINATORS, orig_dest,
5541 recompute_dominator (CDI_DOMINATORS, orig_dest));
5542 }
5543
5544 /* A wrapper for redirect_edge_and_branch. Return TRUE if blocks connected by
5545 redirected edge are in reverse topological order. */
5546 bool
5547 sel_redirect_edge_and_branch (edge e, basic_block to)
5548 {
5549 bool latch_edge_p;
5550 basic_block src, orig_dest = e->dest;
5551 int prev_max_uid;
5552 rtx jump;
5553 edge redirected;
5554 bool recompute_toporder_p = false;
5555 bool maybe_unreachable = single_pred_p (orig_dest);
5556
5557 latch_edge_p = (pipelining_p
5558 && current_loop_nest
5559 && e == loop_latch_edge (current_loop_nest));
5560
5561 src = e->src;
5562 prev_max_uid = get_max_uid ();
5563
5564 redirected = redirect_edge_and_branch (e, to);
5565
5566 gcc_assert (redirected && last_added_blocks == NULL);
5567
5568 /* When we've redirected a latch edge, update the header. */
5569 if (latch_edge_p)
5570 {
5571 current_loop_nest->header = to;
5572 gcc_assert (loop_latch_edge (current_loop_nest));
5573 }
5574
5575 /* In rare situations, the topological relation between the blocks connected
5576 by the redirected edge can change (see PR42245 for an example). Update
5577 block_to_bb/bb_to_block. */
5578 if (CONTAINING_RGN (e->src->index) == CONTAINING_RGN (to->index)
5579 && BLOCK_TO_BB (e->src->index) > BLOCK_TO_BB (to->index))
5580 recompute_toporder_p = true;
5581
5582 jump = find_new_jump (src, NULL, prev_max_uid);
5583 if (jump)
5584 sel_init_new_insn (jump, INSN_INIT_TODO_LUID | INSN_INIT_TODO_SIMPLEJUMP);
5585
5586 /* Only update dominator info when we don't have unreachable blocks.
5587 Otherwise we'll update in maybe_tidy_empty_bb. */
5588 if (!maybe_unreachable)
5589 {
5590 set_immediate_dominator (CDI_DOMINATORS, to,
5591 recompute_dominator (CDI_DOMINATORS, to));
5592 set_immediate_dominator (CDI_DOMINATORS, orig_dest,
5593 recompute_dominator (CDI_DOMINATORS, orig_dest));
5594 }
5595 return recompute_toporder_p;
5596 }
5597
5598 /* This variable holds the cfg hooks used by the selective scheduler. */
5599 static struct cfg_hooks sel_cfg_hooks;
5600
5601 /* Register sel-sched cfg hooks. */
5602 void
5603 sel_register_cfg_hooks (void)
5604 {
5605 sched_split_block = sel_split_block;
5606
5607 orig_cfg_hooks = get_cfg_hooks ();
5608 sel_cfg_hooks = orig_cfg_hooks;
5609
5610 sel_cfg_hooks.create_basic_block = sel_create_basic_block;
5611
5612 set_cfg_hooks (sel_cfg_hooks);
5613
5614 sched_init_only_bb = sel_init_only_bb;
5615 sched_split_block = sel_split_block;
5616 sched_create_empty_bb = sel_create_empty_bb;
5617 }
5618
5619 /* Unregister sel-sched cfg hooks. */
5620 void
5621 sel_unregister_cfg_hooks (void)
5622 {
5623 sched_create_empty_bb = NULL;
5624 sched_split_block = NULL;
5625 sched_init_only_bb = NULL;
5626
5627 set_cfg_hooks (orig_cfg_hooks);
5628 }
5629 \f
5630
5631 /* Emit an insn rtx based on PATTERN. If a jump insn is wanted,
5632 LABEL is where this jump should be directed. */
5633 rtx
5634 create_insn_rtx_from_pattern (rtx pattern, rtx label)
5635 {
5636 rtx insn_rtx;
5637
5638 gcc_assert (!INSN_P (pattern));
5639
5640 start_sequence ();
5641
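  /* LABEL also acts as a mode selector: NULL_RTX means an ordinary insn,
     a debug insn means we are copying a debug insn (see
     create_copy_of_insn_rtx), and anything else is the target of a jump.  */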
5642 if (label == NULL_RTX)
5643 insn_rtx = emit_insn (pattern);
5644 else if (DEBUG_INSN_P (label))
5645 insn_rtx = emit_debug_insn (pattern);
5646 else
5647 {
5648 insn_rtx = emit_jump_insn (pattern);
5649 JUMP_LABEL (insn_rtx) = label;
5650 ++LABEL_NUSES (label);
5651 }
5652
5653 end_sequence ();
5654
5655 sched_extend_luids ();
5656 sched_extend_target ();
5657 sched_deps_init (false);
5658
5659 /* Initialize INSN_CODE now. */
5660 recog_memoized (insn_rtx);
5661 return insn_rtx;
5662 }
5663
5664 /* Create a new vinsn for INSN_RTX. FORCE_UNIQUE_P is true when the vinsn
5665 must not be clonable. */
5666 vinsn_t
5667 create_vinsn_from_insn_rtx (rtx insn_rtx, bool force_unique_p)
5668 {
5669 gcc_assert (INSN_P (insn_rtx) && !INSN_IN_STREAM_P (insn_rtx));
5670
5671 /* If VINSN_TYPE is not USE, retain its uniqueness. */
5672 return vinsn_create (insn_rtx, force_unique_p);
5673 }
5674
5675 /* Create a copy of INSN_RTX. */
5676 rtx
5677 create_copy_of_insn_rtx (rtx insn_rtx)
5678 {
5679 rtx res;
5680
5681 if (DEBUG_INSN_P (insn_rtx))
5682 return create_insn_rtx_from_pattern (copy_rtx (PATTERN (insn_rtx)),
5683 insn_rtx);
5684
5685 gcc_assert (NONJUMP_INSN_P (insn_rtx));
5686
5687 res = create_insn_rtx_from_pattern (copy_rtx (PATTERN (insn_rtx)),
5688 NULL_RTX);
5689 return res;
5690 }
5691
5692 /* Change vinsn field of EXPR to hold NEW_VINSN. */
5693 void
5694 change_vinsn_in_expr (expr_t expr, vinsn_t new_vinsn)
5695 {
5696 vinsn_detach (EXPR_VINSN (expr));
5697
5698 EXPR_VINSN (expr) = new_vinsn;
5699 vinsn_attach (new_vinsn);
5700 }
5701
5702 /* Helpers for global init. */
5703 /* This structure is used to be able to call existing bundling mechanism
5704 and calculate insn priorities. */
5705 static struct haifa_sched_info sched_sel_haifa_sched_info =
5706 {
5707 NULL, /* init_ready_list */
5708 NULL, /* can_schedule_ready_p */
5709 NULL, /* schedule_more_p */
5710 NULL, /* new_ready */
5711 NULL, /* rgn_rank */
5712 sel_print_insn, /* rgn_print_insn */
5713 contributes_to_priority,
5714 NULL, /* insn_finishes_block_p */
5715
5716 NULL, NULL,
5717 NULL, NULL,
5718 0, 0,
5719
5720 NULL, /* add_remove_insn */
5721 NULL, /* begin_schedule_ready */
5722 NULL, /* begin_move_insn */
5723 NULL, /* advance_target_bb */
5724
5725 NULL,
5726 NULL,
5727
5728 SEL_SCHED | NEW_BBS
5729 };
5730
5731 /* Setup special insns used in the scheduler. */
5732 void
5733 setup_nop_and_exit_insns (void)
5734 {
5735 gcc_assert (nop_pattern == NULL_RTX
5736 && exit_insn == NULL_RTX);
5737
5738 nop_pattern = constm1_rtx;
5739
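  /* EXIT_INSN reuses the nop pattern; it is attached to EXIT_BLOCK_PTR and
     serves as the head insn of the exit block (see sel_bb_head).  */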
5740 start_sequence ();
5741 emit_insn (nop_pattern);
5742 exit_insn = get_insns ();
5743 end_sequence ();
5744 set_block_for_insn (exit_insn, EXIT_BLOCK_PTR);
5745 }
5746
5747 /* Free special insns used in the scheduler. */
5748 void
5749 free_nop_and_exit_insns (void)
5750 {
5751 exit_insn = NULL_RTX;
5752 nop_pattern = NULL_RTX;
5753 }
5754
5755 /* Setup a special vinsn used in new insns initialization. */
5756 void
5757 setup_nop_vinsn (void)
5758 {
5759 nop_vinsn = vinsn_create (exit_insn, false);
5760 vinsn_attach (nop_vinsn);
5761 }
5762
5763 /* Free a special vinsn used in new insns initialization. */
5764 void
5765 free_nop_vinsn (void)
5766 {
5767 gcc_assert (VINSN_COUNT (nop_vinsn) == 1);
5768 vinsn_detach (nop_vinsn);
5769 nop_vinsn = NULL;
5770 }
5771
5772 /* Call a set_sched_flags hook. */
5773 void
5774 sel_set_sched_flags (void)
5775 {
5776 /* ??? This means that set_sched_flags was called, and we decided to
5777 support speculation. However, set_sched_flags also modifies flags
5778 on current_sched_info, doing this only at global init. And we
5779 sometimes change c_s_i later. So put the correct flags again. */
5780 if (spec_info && targetm.sched.set_sched_flags)
5781 targetm.sched.set_sched_flags (spec_info);
5782 }
5783
5784 /* Setup pointers to global sched info structures. */
5785 void
5786 sel_setup_sched_infos (void)
5787 {
5788 rgn_setup_common_sched_info ();
5789
5790 memcpy (&sel_common_sched_info, common_sched_info,
5791 sizeof (sel_common_sched_info));
5792
5793 sel_common_sched_info.fix_recovery_cfg = NULL;
5794 sel_common_sched_info.add_block = NULL;
5795 sel_common_sched_info.estimate_number_of_insns
5796 = sel_estimate_number_of_insns;
5797 sel_common_sched_info.luid_for_non_insn = sel_luid_for_non_insn;
5798 sel_common_sched_info.sched_pass_id = SCHED_SEL_PASS;
5799
5800 common_sched_info = &sel_common_sched_info;
5801
5802 current_sched_info = &sched_sel_haifa_sched_info;
5803 current_sched_info->sched_max_insns_priority =
5804 get_rgn_sched_max_insns_priority ();
5805
5806 sel_set_sched_flags ();
5807 }
5808 \f
5809
5810 /* Adds basic block BB to region RGN at the position *BB_ORD_INDEX;
5811 *BB_ORD_INDEX is increased afterwards. */
5812 static void
5813 sel_add_block_to_region (basic_block bb, int *bb_ord_index, int rgn)
5814 {
5815 RGN_NR_BLOCKS (rgn) += 1;
5816 RGN_DONT_CALC_DEPS (rgn) = 0;
5817 RGN_HAS_REAL_EBB (rgn) = 0;
5818 CONTAINING_RGN (bb->index) = rgn;
5819 BLOCK_TO_BB (bb->index) = *bb_ord_index;
5820 rgn_bb_table[RGN_BLOCKS (rgn) + *bb_ord_index] = bb->index;
5821 (*bb_ord_index)++;
5822
5823 /* FIXME: it is true only when not scheduling ebbs. */
5824 RGN_BLOCKS (rgn + 1) = RGN_BLOCKS (rgn) + RGN_NR_BLOCKS (rgn);
5825 }
5826
5827 /* Functions to support pipelining of outer loops. */
5828
5829 /* Creates a new empty region and returns its number. */
5830 static int
5831 sel_create_new_region (void)
5832 {
5833 int new_rgn_number = nr_regions;
5834
5835 RGN_NR_BLOCKS (new_rgn_number) = 0;
5836
5837 /* FIXME: This will work only when EBBs are not created. */
5838 if (new_rgn_number != 0)
5839 RGN_BLOCKS (new_rgn_number) = RGN_BLOCKS (new_rgn_number - 1) +
5840 RGN_NR_BLOCKS (new_rgn_number - 1);
5841 else
5842 RGN_BLOCKS (new_rgn_number) = 0;
5843
5844 /* Set the blocks of the next region so the other functions may
5845 calculate the number of blocks in the region. */
5846 RGN_BLOCKS (new_rgn_number + 1) = RGN_BLOCKS (new_rgn_number) +
5847 RGN_NR_BLOCKS (new_rgn_number);
5848
5849 nr_regions++;
5850
5851 return new_rgn_number;
5852 }
5853
5854 /* If X has a smaller topological sort number than Y, returns -1;
5855 if greater, returns 1. */
5856 static int
5857 bb_top_order_comparator (const void *x, const void *y)
5858 {
5859 basic_block bb1 = *(const basic_block *) x;
5860 basic_block bb2 = *(const basic_block *) y;
5861
5862 gcc_assert (bb1 == bb2
5863 || rev_top_order_index[bb1->index]
5864 != rev_top_order_index[bb2->index]);
5865
5866 /* It's a reverse topological order in REV_TOP_ORDER_INDEX, so
5867 bbs with greater number should go earlier. */
5868 if (rev_top_order_index[bb1->index] > rev_top_order_index[bb2->index])
5869 return -1;
5870 else
5871 return 1;
5872 }
5873
5874 /* Create a region for LOOP and return its number. If we don't want
5875 to pipeline LOOP, return -1. */
5876 static int
5877 make_region_from_loop (struct loop *loop)
5878 {
5879 unsigned int i;
5880 int new_rgn_number = -1;
5881 struct loop *inner;
5882
5883 /* Basic block index, to be assigned to BLOCK_TO_BB. */
5884 int bb_ord_index = 0;
5885 basic_block *loop_blocks;
5886 basic_block preheader_block;
5887
5888 if (loop->num_nodes
5889 > (unsigned) PARAM_VALUE (PARAM_MAX_PIPELINE_REGION_BLOCKS))
5890 return -1;
5891
5892 /* Don't pipeline loops whose latch belongs to some of its inner loops. */
5893 for (inner = loop->inner; inner; inner = inner->inner)
5894 if (flow_bb_inside_loop_p (inner, loop->latch))
5895 return -1;
5896
5897 loop->ninsns = num_loop_insns (loop);
5898 if ((int) loop->ninsns > PARAM_VALUE (PARAM_MAX_PIPELINE_REGION_INSNS))
5899 return -1;
5900
5901 loop_blocks = get_loop_body_in_custom_order (loop, bb_top_order_comparator);
5902
5903 for (i = 0; i < loop->num_nodes; i++)
5904 if (loop_blocks[i]->flags & BB_IRREDUCIBLE_LOOP)
5905 {
5906 free (loop_blocks);
5907 return -1;
5908 }
5909
5910 preheader_block = loop_preheader_edge (loop)->src;
5911 gcc_assert (preheader_block);
5912 gcc_assert (loop_blocks[0] == loop->header);
5913
5914 new_rgn_number = sel_create_new_region ();
5915
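  /* The region starts with the loop preheader, followed by the loop blocks
     in the topological order computed above.  */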
5916 sel_add_block_to_region (preheader_block, &bb_ord_index, new_rgn_number);
5917 SET_BIT (bbs_in_loop_rgns, preheader_block->index);
5918
5919 for (i = 0; i < loop->num_nodes; i++)
5920 {
5921 /* Add only those blocks that haven't been scheduled in the inner loop.
5922 The exception is the basic blocks with bookkeeping code - they should
5923 be added to the region (and they actually don't belong to the loop
5924 body, but to the region containing that loop body). */
5925
5926 gcc_assert (new_rgn_number >= 0);
5927
5928 if (! TEST_BIT (bbs_in_loop_rgns, loop_blocks[i]->index))
5929 {
5930 sel_add_block_to_region (loop_blocks[i], &bb_ord_index,
5931 new_rgn_number);
5932 SET_BIT (bbs_in_loop_rgns, loop_blocks[i]->index);
5933 }
5934 }
5935
5936 free (loop_blocks);
5937 MARK_LOOP_FOR_PIPELINING (loop);
5938
5939 return new_rgn_number;
5940 }
5941
5942 /* Create a new region from preheader blocks LOOP_BLOCKS. */
5943 void
5944 make_region_from_loop_preheader (VEC(basic_block, heap) **loop_blocks)
5945 {
5946 unsigned int i;
5947 int new_rgn_number = -1;
5948 basic_block bb;
5949
5950 /* Basic block index, to be assigned to BLOCK_TO_BB. */
5951 int bb_ord_index = 0;
5952
5953 new_rgn_number = sel_create_new_region ();
5954
5955 FOR_EACH_VEC_ELT (basic_block, *loop_blocks, i, bb)
5956 {
5957 gcc_assert (new_rgn_number >= 0);
5958
5959 sel_add_block_to_region (bb, &bb_ord_index, new_rgn_number);
5960 }
5961
5962 VEC_free (basic_block, heap, *loop_blocks);
5963 gcc_assert (*loop_blocks == NULL);
5964 }
5965
5966
5967 /* Create region(s) from loop nest LOOP, such that inner loops will be
5968 pipelined before outer loops. Returns true when a region for LOOP
5969 is created. */
5970 static bool
5971 make_regions_from_loop_nest (struct loop *loop)
5972 {
5973 struct loop *cur_loop;
5974 int rgn_number;
5975
5976 /* Bail out if some inner loop has not been placed into a region yet.  */
5977 for (cur_loop = loop->inner; cur_loop; cur_loop = cur_loop->next)
5978 if (! TEST_BIT (bbs_in_loop_rgns, cur_loop->header->index))
5979 return false;
5980
5981 /* At this moment all regular inner loops should have been pipelined.
5982 Try to create a region from this loop. */
5983 rgn_number = make_region_from_loop (loop);
5984
5985 if (rgn_number < 0)
5986 return false;
5987
5988 VEC_safe_push (loop_p, heap, loop_nests, loop);
5989 return true;
5990 }
5991
5992 /* Initialize the data structures needed for pipelining.  */
5993 void
5994 sel_init_pipelining (void)
5995 {
5996 /* Collect loop information to be used in outer-loop pipelining.  */
5997 loop_optimizer_init (LOOPS_HAVE_PREHEADERS
5998 | LOOPS_HAVE_FALLTHRU_PREHEADERS
5999 | LOOPS_HAVE_RECORDED_EXITS
6000 | LOOPS_HAVE_MARKED_IRREDUCIBLE_REGIONS);
6001 current_loop_nest = NULL;
6002
6003 bbs_in_loop_rgns = sbitmap_alloc (last_basic_block);
6004 sbitmap_zero (bbs_in_loop_rgns);
6005
6006 recompute_rev_top_order ();
6007 }
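/* bbs_in_loop_rgns allocated above follows the usual sbitmap lifecycle.
   A self-contained sketch of that pattern (hypothetical bitmap, for
   illustration only):  */
#if 0
static void
example_sbitmap_lifecycle (void)
{
  sbitmap visited = sbitmap_alloc (last_basic_block);
  basic_block bb;

  sbitmap_zero (visited);
  FOR_EACH_BB (bb)
    if (!TEST_BIT (visited, bb->index))
      SET_BIT (visited, bb->index);
  sbitmap_free (visited);
}
#endif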
6008
6009 /* Returns the loop nest for region RGN, or NULL if there is none.  */
6010 loop_p
6011 get_loop_nest_for_rgn (unsigned int rgn)
6012 {
6013 /* Regions created with extend_rgns don't have corresponding loop nests,
6014 because they don't represent loops. */
6015 if (rgn < VEC_length (loop_p, loop_nests))
6016 return VEC_index (loop_p, loop_nests, rgn);
6017 else
6018 return NULL;
6019 }
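/* A sketch of the intended consumer pattern (hypothetical function; the
   scheduler looks up the current region's loop nest in a similar way when
   pipelining is enabled).  Regions built by extend_rgns yield NULL here and
   are scheduled without pipelining.  */
#if 0
static void
example_enter_region (int rgn)
{
  loop_p nest = get_loop_nest_for_rgn (rgn);

  if (nest != NULL)
    current_loop_nest = nest;   /* Region was created from a loop.  */
  else
    current_loop_nest = NULL;   /* Region came from extend_rgns.  */
}
#endif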
6020
6021 /* True when LOOP was included in a pipelining region.  */
6022 bool
6023 considered_for_pipelining_p (struct loop *loop)
6024 {
6025 if (loop_depth (loop) == 0)
6026 return false;
6027
6028 /* Now, the loop could be too large or irreducible.  Check whether its
6029 region is recorded in LOOP_NESTS.
6030 We determine the region number of LOOP from its latch: the header
6031 can't be used here, because it could be a just-removed preheader,
6032 which would give us the wrong region number.  The latch could in
6033 principle lie in an inner loop, but such loops are never pipelined. */
6034 if (LOOP_MARKED_FOR_PIPELINING_P (loop))
6035 {
6036 int rgn = CONTAINING_RGN (loop->latch->index);
6037
6038 gcc_assert ((unsigned) rgn < VEC_length (loop_p, loop_nests));
6039 return true;
6040 }
6041
6042 return false;
6043 }
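/* An illustrative (hypothetical) helper built on top of
   considered_for_pipelining_p: true if any loop containing BB was selected
   for pipelining.  */
#if 0
static bool
example_enclosing_loop_pipelined_p (basic_block bb)
{
  struct loop *loop;

  for (loop = bb->loop_father; loop; loop = loop_outer (loop))
    if (considered_for_pipelining_p (loop))
      return true;

  return false;
}
#endif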
6044
6045 /* Makes regions from the rest of the blocks, after loops are chosen
6046 for pipelining. */
6047 static void
6048 make_regions_from_the_rest (void)
6049 {
6050 int cur_rgn_blocks;
6051 int *loop_hdr;
6052 int i;
6053
6054 basic_block bb;
6055 edge e;
6056 edge_iterator ei;
6057 int *degree;
6058
6059 /* Index in rgn_bb_table at which to start allocating new regions.  */
6060 cur_rgn_blocks = nr_regions ? RGN_BLOCKS (nr_regions) : 0;
6061
6062 /* Make regions from all the remaining basic blocks - those that don't
6063 belong to any loop or belong to irreducible loops.  Prepare the data
6064 structures for extend_rgns.  */
6065
6066 /* LOOP_HDR[I] == -1 if I-th bb doesn't belong to any loop,
6067 LOOP_HDR[I] == LOOP_HDR[J] iff basic blocks I and J reside within the same
6068 loop. */
6069 loop_hdr = XNEWVEC (int, last_basic_block);
6070 degree = XCNEWVEC (int, last_basic_block);
6071
6072
6073 /* For each basic block that belongs to some loop, record the number
6074 of the innermost loop containing it.  */
6075 for (i = 0; i < last_basic_block; i++)
6076 loop_hdr[i] = -1;
6077
6078 FOR_EACH_BB (bb)
6079 {
6080 if (bb->loop_father && bb->loop_father->num != 0
6081 && !(bb->flags & BB_IRREDUCIBLE_LOOP))
6082 loop_hdr[bb->index] = bb->loop_father->num;
6083 }
6084
6085 /* For each basic block, the degree is the number of incoming edges
6086 from basic blocks that are not yet scheduled.  Blocks already placed
6087 into loop regions get a degree of -1 so extend_rgns will skip them.  */
6088 FOR_EACH_BB (bb)
6089 {
6090 degree[bb->index] = 0;
6091
6092 if (!TEST_BIT (bbs_in_loop_rgns, bb->index))
6093 {
6094 FOR_EACH_EDGE (e, ei, bb->preds)
6095 if (!TEST_BIT (bbs_in_loop_rgns, e->src->index))
6096 degree[bb->index]++;
6097 }
6098 else
6099 degree[bb->index] = -1;
6100 }
6101
6102 extend_rgns (degree, &cur_rgn_blocks, bbs_in_loop_rgns, loop_hdr);
6103
6104 /* Any block that did not end up in a region is placed into a region
6105 by itself. */
6106 FOR_EACH_BB (bb)
6107 if (degree[bb->index] >= 0)
6108 {
6109 rgn_bb_table[cur_rgn_blocks] = bb->index;
6110 RGN_NR_BLOCKS (nr_regions) = 1;
6111 RGN_BLOCKS (nr_regions) = cur_rgn_blocks++;
6112 RGN_DONT_CALC_DEPS (nr_regions) = 0;
6113 RGN_HAS_REAL_EBB (nr_regions) = 0;
6114 CONTAINING_RGN (bb->index) = nr_regions++;
6115 BLOCK_TO_BB (bb->index) = 0;
6116 }
6117
6118 free (degree);
6119 free (loop_hdr);
6120 }
6121
6122 /* Free data structures used in pipelining of loops. */
6123 void sel_finish_pipelining (void)
6124 {
6125 loop_iterator li;
6126 struct loop *loop;
6127
6128 /* Release aux fields so we don't free them later by mistake. */
6129 FOR_EACH_LOOP (li, loop, 0)
6130 loop->aux = NULL;
6131
6132 loop_optimizer_finalize ();
6133
6134 VEC_free (loop_p, heap, loop_nests);
6135
6136 free (rev_top_order_index);
6137 rev_top_order_index = NULL;
6138 }
6139
6140 /* This function replaces find_rgns when
6141 FLAG_SEL_SCHED_PIPELINING_OUTER_LOOPS is set.  */
6142 void
6143 sel_find_rgns (void)
6144 {
6145 sel_init_pipelining ();
6146 extend_regions ();
6147
6148 if (current_loops)
6149 {
6150 loop_p loop;
6151 loop_iterator li;
6152
6153 FOR_EACH_LOOP (li, loop, (flag_sel_sched_pipelining_outer_loops
6154 ? LI_FROM_INNERMOST
6155 : LI_ONLY_INNERMOST))
6156 make_regions_from_loop_nest (loop);
6157 }
6158
6159 /* Make regions from all the remaining basic blocks and schedule them.
6160 These are the blocks that don't belong to any loop or belong to
6161 irreducible loops.  */
6162 make_regions_from_the_rest ();
6163
6164 /* We don't need bbs_in_loop_rgns anymore. */
6165 sbitmap_free (bbs_in_loop_rgns);
6166 bbs_in_loop_rgns = NULL;
6167 }
6168
6169 /* Add the preheader blocks from the previous loop to the current region,
6170 taking them from LOOP_PREHEADER_BLOCKS (current_loop_nest), and record them
6171 in *BBS.  This function is only used with -fsel-sched-pipelining-outer-loops.  */
6172 void
6173 sel_add_loop_preheaders (bb_vec_t *bbs)
6174 {
6175 int i;
6176 basic_block bb;
6177 VEC(basic_block, heap) *preheader_blocks
6178 = LOOP_PREHEADER_BLOCKS (current_loop_nest);
6179
6180 for (i = 0;
6181 VEC_iterate (basic_block, preheader_blocks, i, bb);
6182 i++)
6183 {
6184 VEC_safe_push (basic_block, heap, *bbs, bb);
6185 VEC_safe_push (basic_block, heap, last_added_blocks, bb);
6186 sel_add_bb (bb);
6187 }
6188
6189 VEC_free (basic_block, heap, preheader_blocks);
6190 }
6191
6192 /* While pipelining outer loops, returns TRUE if BB is a loop preheader.
6193 Note that the function should also work when pipelining_p is false,
6194 because it is used when deciding whether we should or should not
6195 reschedule pipelined code.  */
6196 bool
6197 sel_is_loop_preheader_p (basic_block bb)
6198 {
6199 if (current_loop_nest)
6200 {
6201 struct loop *outer;
6202
6203 if (preheader_removed)
6204 return false;
6205
6206 /* Preheader is the first block in the region. */
6207 if (BLOCK_TO_BB (bb->index) == 0)
6208 return true;
6209
6210 /* We used to find a preheader with the topological information.
6211 Check that the above code is equivalent to what we did before. */
6212
6213 if (in_current_region_p (current_loop_nest->header))
6214 gcc_assert (!(BLOCK_TO_BB (bb->index)
6215 < BLOCK_TO_BB (current_loop_nest->header->index)));
6216
6217 /* The latch block of an outer loop that was chosen for pipelining
6218 must never show up here.  */
6219 for (outer = loop_outer (current_loop_nest);
6220 outer;
6221 outer = loop_outer (outer))
6222 if (considered_for_pipelining_p (outer) && outer->latch == bb)
6223 gcc_unreachable ();
6224 }
6225
6226 return false;
6227 }
6228
6229 /* Check whether JUMP_BB ends with a jump insn that leads only to DEST_BB and
6230 can be removed, making the corresponding edge fallthrough (assuming that
6231 all basic blocks between JUMP_BB and DEST_BB are empty). */
6232 static bool
6233 bb_has_removable_jump_to_p (basic_block jump_bb, basic_block dest_bb)
6234 {
6235 if (!onlyjump_p (BB_END (jump_bb))
6236 || tablejump_p (BB_END (jump_bb), NULL, NULL))
6237 return false;
6238
6239 /* Bail out if there are several outgoing edges, an abnormal or
6240 crossing edge, or the jump destination is not DEST_BB.  */
6241 if (EDGE_COUNT (jump_bb->succs) != 1
6242 || EDGE_SUCC (jump_bb, 0)->flags & (EDGE_ABNORMAL | EDGE_CROSSING)
6243 || EDGE_SUCC (jump_bb, 0)->dest != dest_bb)
6244 return false;
6245
6246 /* None of the above, so the jump is removable.  */
6247 return true;
6248 }
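/* Illustrative pairing (hypothetical snippet; it mirrors the real use in
   sel_remove_loop_preheader below): when the check succeeds, retargeting
   the jump turns the edge into a fallthrough one.  */
#if 0
  if (bb_has_removable_jump_to_p (prev_bb, next_bb))
    redirect_edge_and_branch (EDGE_SUCC (prev_bb, 0), next_bb);
#endif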
6249
6250 /* Remove the loop preheader blocks from the current region and save them
6251 in PREHEADER_BLOCKS of the father loop, so they can be added later to
6252 the region that represents the outer loop.  */
6253 static void
6254 sel_remove_loop_preheader (void)
6255 {
6256 int i, old_len;
6257 int cur_rgn = CONTAINING_RGN (BB_TO_BLOCK (0));
6258 basic_block bb;
6259 bool all_empty_p = true;
6260 VEC(basic_block, heap) *preheader_blocks
6261 = LOOP_PREHEADER_BLOCKS (loop_outer (current_loop_nest));
6262
6263 gcc_assert (current_loop_nest);
6264 old_len = VEC_length (basic_block, preheader_blocks);
6265
6266 /* Add blocks that aren't within the current loop to PREHEADER_BLOCKS. */
6267 for (i = 0; i < RGN_NR_BLOCKS (cur_rgn); i++)
6268 {
6269 bb = BASIC_BLOCK (BB_TO_BLOCK (i));
6270
6271 /* If the basic block belongs to the region but doesn't belong to the
6272 corresponding loop, then it should be a preheader.  */
6273 if (sel_is_loop_preheader_p (bb))
6274 {
6275 VEC_safe_push (basic_block, heap, preheader_blocks, bb);
6276 if (BB_END (bb) != bb_note (bb))
6277 all_empty_p = false;
6278 }
6279 }
6280
6281 /* Remove these blocks only after iterating over the whole region. */
6282 for (i = VEC_length (basic_block, preheader_blocks) - 1;
6283 i >= old_len;
6284 i--)
6285 {
6286 bb = VEC_index (basic_block, preheader_blocks, i);
6287 sel_remove_bb (bb, false);
6288 }
6289
6290 if (!considered_for_pipelining_p (loop_outer (current_loop_nest)))
6291 {
6292 if (!all_empty_p)
6293 /* Immediately create a new region from the preheader.  */
6294 make_region_from_loop_preheader (&preheader_blocks);
6295 else
6296 {
6297 /* If all preheader blocks are empty, don't create a new empty
6298 region.  Instead, remove them completely.  */
6299 FOR_EACH_VEC_ELT (basic_block, preheader_blocks, i, bb)
6300 {
6301 edge e;
6302 edge_iterator ei;
6303 basic_block prev_bb = bb->prev_bb, next_bb = bb->next_bb;
6304
6305 /* Redirect all incoming edges to the next basic block.  */
6306 for (ei = ei_start (bb->preds); (e = ei_safe_edge (ei)); )
6307 {
6308 if (! (e->flags & EDGE_FALLTHRU))
6309 redirect_edge_and_branch (e, bb->next_bb);
6310 else
6311 redirect_edge_succ (e, bb->next_bb);
6312 }
6313 gcc_assert (BB_NOTE_LIST (bb) == NULL);
6314 delete_and_free_basic_block (bb);
6315
6316 /* Check whether, after deleting the preheader, there is an
6317 unconditional jump in PREV_BB that leads to the next basic block
6318 NEXT_BB.  If so, delete this jump and clear the data sets of its
6319 basic block if it becomes empty.  */
6320 if (next_bb->prev_bb == prev_bb
6321 && prev_bb != ENTRY_BLOCK_PTR
6322 && bb_has_removable_jump_to_p (prev_bb, next_bb))
6323 {
6324 redirect_edge_and_branch (EDGE_SUCC (prev_bb, 0), next_bb);
6325 if (BB_END (prev_bb) == bb_note (prev_bb))
6326 free_data_sets (prev_bb);
6327 }
6328
6329 set_immediate_dominator (CDI_DOMINATORS, next_bb,
6330 recompute_dominator (CDI_DOMINATORS,
6331 next_bb));
6332 }
6333 }
6334 VEC_free (basic_block, heap, preheader_blocks);
6335 }
6336 else
6337 /* Store preheader within the father's loop structure. */
6338 SET_LOOP_PREHEADER_BLOCKS (loop_outer (current_loop_nest),
6339 preheader_blocks);
6340 }
6341 #endif