gcc/cfgexpand.c
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2021 Free Software Foundation, Inc.
3
4 This file is part of GCC.
5
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
19
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
76 #include "opts.h"
77
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
85
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
89
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
93
94 static rtx expand_debug_expr (tree);
95
96 static bool defer_stack_allocation (tree, bool);
97
98 static void record_alignment_for_reg_var (unsigned int);
99
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
102
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
105 {
106 tree t;
107 switch (gimple_assign_rhs_class (stmt))
108 {
109 case GIMPLE_TERNARY_RHS:
110 t = build3 (gimple_assign_rhs_code (stmt),
111 TREE_TYPE (gimple_assign_lhs (stmt)),
112 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
113 gimple_assign_rhs3 (stmt));
114 break;
115 case GIMPLE_BINARY_RHS:
116 t = build2 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
119 break;
120 case GIMPLE_UNARY_RHS:
121 t = build1 (gimple_assign_rhs_code (stmt),
122 TREE_TYPE (gimple_assign_lhs (stmt)),
123 gimple_assign_rhs1 (stmt));
124 break;
125 case GIMPLE_SINGLE_RHS:
126 {
127 t = gimple_assign_rhs1 (stmt);
128 /* Avoid modifying this tree in place below. */
129 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
130 && gimple_location (stmt) != EXPR_LOCATION (t))
131 || (gimple_block (stmt) && currently_expanding_to_rtl
132 && EXPR_P (t)))
133 t = copy_node (t);
134 break;
135 }
136 default:
137 gcc_unreachable ();
138 }
139
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
142
143 return t;
144 }
145
146
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
150
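/* For an SSA_NAME, yield its underlying variable (SSA_NAME_VAR, which may be NULL for anonymous SSA names); for any other tree, yield the tree itself. */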
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
152
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce the ambiguity
155 arising from the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
157
158 static tree
159 leader_merge (tree cur, tree next)
160 {
161 if (cur == NULL || cur == next)
162 return next;
163
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
166
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
169
170 return cur;
171 }
172
173 /* Associate declaration T with storage space X. If T is not an
174 SSA name, this is exactly SET_DECL_RTL; otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
178 {
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESULT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
217
218 if (x)
219 {
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
223
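/* Strip SUBREG, CONCAT and PARALLEL wrappers so that we can inspect the MEM_EXPR or REG_EXPR of the underlying storage. */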
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
230 {
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
234 }
235 else if (GET_CODE (xm) == CONCAT)
236 {
237 xm = XEXP (xm, 0);
238 goto retry;
239 }
240 else if (GET_CODE (xm) == PARALLEL)
241 {
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
246 }
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
251
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
253
254 if (cur != next)
255 {
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
263 }
264 }
265
266 if (TREE_CODE (t) == SSA_NAME)
267 {
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
270 {
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
275 }
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
283 {
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
291 ;
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly choose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
300 }
301 }
302 else
303 SET_DECL_RTL (t, x);
304 }
305
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 class stack_var
309 {
310 public:
311 /* The Variable. */
312 tree decl;
313
314 /* Initially, the size of the variable. Later, the size of the partition,
315 if this variable becomes its partition's representative. */
316 poly_uint64 size;
317
318 /* The *byte* alignment required for this variable. Or, as with the
319 size, the alignment of this partition. */
320 unsigned int alignb;
321
322 /* The partition representative. */
323 size_t representative;
324
325 /* The next stack variable in the partition, or EOC. */
326 size_t next;
327
328 /* The numbers of conflicting stack variables. */
329 bitmap conflicts;
330 };
331
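/* End-of-chain marker for the NEXT field above; terminates the list of stack variables making up a partition. */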
332 #define EOC ((size_t)-1)
333
334 /* We have an array of such objects while deciding allocation. */
335 static class stack_var *stack_vars;
336 static size_t stack_vars_alloc;
337 static size_t stack_vars_num;
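/* Maps a decl to its index in the STACK_VARS array above. */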
338 static hash_map<tree, size_t> *decl_to_stack_part;
339
340 /* Conflict bitmaps go on this obstack. This allows us to destroy
341 all of them in one big sweep. */
342 static bitmap_obstack stack_var_bitmap_obstack;
343
344 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
345 is non-decreasing. */
346 static size_t *stack_vars_sorted;
347
348 /* The phase of the stack frame. This is the known misalignment of
349 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
350 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
351 static int frame_phase;
352
353 /* Used during expand_used_vars to remember if we saw any decls for
354 which we'd like to enable stack smashing protection. */
355 static bool has_protected_decls;
356
357 /* Used during expand_used_vars. Remember if we saw a character buffer
358 smaller than our cutoff threshold. Used for -Wstack-protector. */
359 static bool has_short_buffer;
360
361 /* Compute the byte alignment to use for DECL. Ignore any alignment
362 we can't satisfy given the expected alignment of the stack boundary. */
363
364 static unsigned int
365 align_local_variable (tree decl, bool really_expand)
366 {
367 unsigned int align;
368
369 if (TREE_CODE (decl) == SSA_NAME)
370 {
371 tree type = TREE_TYPE (decl);
372 machine_mode mode = TYPE_MODE (type);
373
374 align = TYPE_ALIGN (type);
375 if (mode != BLKmode
376 && align < GET_MODE_ALIGNMENT (mode))
377 align = GET_MODE_ALIGNMENT (mode);
378 }
379 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
381
382 if (hwasan_sanitize_stack_p ())
383 align = MAX (align, (unsigned) HWASAN_TAG_GRANULE_SIZE * BITS_PER_UNIT);
384
385 if (TREE_CODE (decl) != SSA_NAME && really_expand)
386 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
387 That is done before IPA and could bump alignment based on host
388 backend even for offloaded code which wants different
389 LOCAL_DECL_ALIGNMENT. */
390 SET_DECL_ALIGN (decl, align);
391
392 return align / BITS_PER_UNIT;
393 }
394
395 /* Align given offset BASE with ALIGN. Round up if ALIGN_UP is true,
396 down otherwise. Return the aligned BASE value. */
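/* For example, align_base (13, 8, true) yields 16, while align_base (13, 8, false) yields 8. */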
397
398 static inline unsigned HOST_WIDE_INT
399 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
400 {
401 return align_up ? (base + align - 1) & -align : base & -align;
402 }
403
404 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
405 Return the frame offset. */
406
407 static poly_int64
408 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
409 {
410 poly_int64 offset, new_frame_offset;
411
412 if (FRAME_GROWS_DOWNWARD)
413 {
414 new_frame_offset
415 = aligned_lower_bound (frame_offset - frame_phase - size,
416 align) + frame_phase;
417 offset = new_frame_offset;
418 }
419 else
420 {
421 new_frame_offset
422 = aligned_upper_bound (frame_offset - frame_phase,
423 align) + frame_phase;
424 offset = new_frame_offset;
425 new_frame_offset += size;
426 }
427 frame_offset = new_frame_offset;
428
429 if (frame_offset_overflow (frame_offset, cfun->decl))
430 frame_offset = offset = 0;
431
432 return offset;
433 }
434
435 /* Ensure that the stack is aligned to ALIGN bytes.
436 Return the new frame offset. */
437 static poly_int64
438 align_frame_offset (unsigned HOST_WIDE_INT align)
439 {
440 return alloc_stack_frame_space (0, align);
441 }
442
443 /* Accumulate DECL into STACK_VARS. */
444
445 static void
446 add_stack_var (tree decl, bool really_expand)
447 {
448 class stack_var *v;
449
450 if (stack_vars_num >= stack_vars_alloc)
451 {
452 if (stack_vars_alloc)
453 stack_vars_alloc = stack_vars_alloc * 3 / 2;
454 else
455 stack_vars_alloc = 32;
456 stack_vars
457 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
458 }
459 if (!decl_to_stack_part)
460 decl_to_stack_part = new hash_map<tree, size_t>;
461
462 v = &stack_vars[stack_vars_num];
463 decl_to_stack_part->put (decl, stack_vars_num);
464
465 v->decl = decl;
466 tree size = TREE_CODE (decl) == SSA_NAME
467 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
468 : DECL_SIZE_UNIT (decl);
469 v->size = tree_to_poly_uint64 (size);
470 /* Ensure that all variables have size, so that &a != &b for any two
471 variables that are simultaneously live. */
472 if (known_eq (v->size, 0U))
473 v->size = 1;
474 v->alignb = align_local_variable (decl, really_expand);
475 /* An alignment of zero can mightily confuse us later. */
476 gcc_assert (v->alignb != 0);
477
478 /* All variables are initially in their own partition. */
479 v->representative = stack_vars_num;
480 v->next = EOC;
481
482 /* All variables initially conflict with no other. */
483 v->conflicts = NULL;
484
485 /* Ensure that this decl doesn't get put onto the list twice. */
486 set_rtl (decl, pc_rtx);
487
488 stack_vars_num++;
489 }
490
491 /* Make the decls associated with luid's X and Y conflict. */
492
493 static void
494 add_stack_var_conflict (size_t x, size_t y)
495 {
496 class stack_var *a = &stack_vars[x];
497 class stack_var *b = &stack_vars[y];
498 if (x == y)
499 return;
500 if (!a->conflicts)
501 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
502 if (!b->conflicts)
503 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
504 bitmap_set_bit (a->conflicts, y);
505 bitmap_set_bit (b->conflicts, x);
506 }
507
508 /* Check whether the decls associated with luid's X and Y conflict. */
509
510 static bool
511 stack_var_conflict_p (size_t x, size_t y)
512 {
513 class stack_var *a = &stack_vars[x];
514 class stack_var *b = &stack_vars[y];
515 if (x == y)
516 return false;
517 /* Partitions containing an SSA name result from gimple registers
518 with things like unsupported modes. They are top-level and
519 hence conflict with everything else. */
520 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
521 return true;
522
523 if (!a->conflicts || !b->conflicts)
524 return false;
525 return bitmap_bit_p (a->conflicts, y);
526 }
527
528 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
529 enter its partition number into bitmap DATA. */
530
531 static bool
532 visit_op (gimple *, tree op, tree, void *data)
533 {
534 bitmap active = (bitmap)data;
535 op = get_base_address (op);
536 if (op
537 && DECL_P (op)
538 && DECL_RTL_IF_SET (op) == pc_rtx)
539 {
540 size_t *v = decl_to_stack_part->get (op);
541 if (v)
542 bitmap_set_bit (active, *v);
543 }
544 return false;
545 }
546
547 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
548 record conflicts between it and all currently active other partitions
549 from bitmap DATA. */
550
551 static bool
552 visit_conflict (gimple *, tree op, tree, void *data)
553 {
554 bitmap active = (bitmap)data;
555 op = get_base_address (op);
556 if (op
557 && DECL_P (op)
558 && DECL_RTL_IF_SET (op) == pc_rtx)
559 {
560 size_t *v = decl_to_stack_part->get (op);
561 if (v && bitmap_set_bit (active, *v))
562 {
563 size_t num = *v;
564 bitmap_iterator bi;
565 unsigned i;
566 gcc_assert (num < stack_vars_num);
567 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
568 add_stack_var_conflict (num, i);
569 }
570 }
571 return false;
572 }
573
574 /* Helper routine for add_scope_conflicts, calculating the active partitions
575 at the end of BB, leaving the result in WORK. We're called to generate
576 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
577 liveness. */
578
579 static void
580 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
581 {
582 edge e;
583 edge_iterator ei;
584 gimple_stmt_iterator gsi;
585 walk_stmt_load_store_addr_fn visit;
586
587 bitmap_clear (work);
588 FOR_EACH_EDGE (e, ei, bb->preds)
589 bitmap_ior_into (work, (bitmap)e->src->aux);
590
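/* Start by merely tracking liveness with VISIT_OP; when FOR_CONFLICT is set we switch to VISIT_CONFLICT at the first real statement below. */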
591 visit = visit_op;
592
593 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
594 {
595 gimple *stmt = gsi_stmt (gsi);
596 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
597 }
598 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
599 {
600 gimple *stmt = gsi_stmt (gsi);
601
602 if (gimple_clobber_p (stmt))
603 {
604 tree lhs = gimple_assign_lhs (stmt);
605 size_t *v;
606 /* Nested function lowering might introduce LHSs
607 that are COMPONENT_REFs. */
608 if (!VAR_P (lhs))
609 continue;
610 if (DECL_RTL_IF_SET (lhs) == pc_rtx
611 && (v = decl_to_stack_part->get (lhs)))
612 bitmap_clear_bit (work, *v);
613 }
614 else if (!is_gimple_debug (stmt))
615 {
616 if (for_conflict
617 && visit == visit_op)
618 {
619 /* If this is the first real instruction in this BB we need
620 to add conflicts for everything live at this point now.
621 Unlike classical liveness for named objects we can't
622 rely on seeing a def/use of the names we're interested in.
623 There might merely be indirect loads/stores. We'd not add any
624 conflicts for such partitions. */
625 bitmap_iterator bi;
626 unsigned i;
627 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
628 {
629 class stack_var *a = &stack_vars[i];
630 if (!a->conflicts)
631 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
632 bitmap_ior_into (a->conflicts, work);
633 }
634 visit = visit_conflict;
635 }
636 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
637 }
638 }
639 }
640
641 /* Generate stack partition conflicts between all partitions that are
642 simultaneously live. */
643
644 static void
645 add_scope_conflicts (void)
646 {
647 basic_block bb;
648 bool changed;
649 bitmap work = BITMAP_ALLOC (NULL);
650 int *rpo;
651 int n_bbs;
652
653 /* We approximate the live range of a stack variable by taking the first
654 mention of its name as starting point(s), and by the end-of-scope
655 death clobber added by gimplify as ending point(s) of the range.
656 This overapproximates in the case where we, for instance, moved an
657 address-taken operation upward without also moving a dereference to it upwards.
658 But it's conservatively correct as a variable never can hold values
659 before its name is mentioned at least once.
660
661 We then do a mostly classical bitmap liveness algorithm. */
662
663 FOR_ALL_BB_FN (bb, cfun)
664 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
665
666 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
667 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
668
669 changed = true;
670 while (changed)
671 {
672 int i;
673 changed = false;
674 for (i = 0; i < n_bbs; i++)
675 {
676 bitmap active;
677 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
678 active = (bitmap)bb->aux;
679 add_scope_conflicts_1 (bb, work, false);
680 if (bitmap_ior_into (active, work))
681 changed = true;
682 }
683 }
684
685 FOR_EACH_BB_FN (bb, cfun)
686 add_scope_conflicts_1 (bb, work, true);
687
688 free (rpo);
689 BITMAP_FREE (work);
690 FOR_ALL_BB_FN (bb, cfun)
691 BITMAP_FREE (bb->aux);
692 }
693
694 /* A subroutine of partition_stack_vars. A comparison function for qsort,
695 sorting an array of indices by the properties of the object. */
696
697 static int
698 stack_var_cmp (const void *a, const void *b)
699 {
700 size_t ia = *(const size_t *)a;
701 size_t ib = *(const size_t *)b;
702 unsigned int aligna = stack_vars[ia].alignb;
703 unsigned int alignb = stack_vars[ib].alignb;
704 poly_int64 sizea = stack_vars[ia].size;
705 poly_int64 sizeb = stack_vars[ib].size;
706 tree decla = stack_vars[ia].decl;
707 tree declb = stack_vars[ib].decl;
708 bool largea, largeb;
709 unsigned int uida, uidb;
710
711 /* Primary compare on "large" alignment. Large comes first. */
712 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
713 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
714 if (largea != largeb)
715 return (int)largeb - (int)largea;
716
717 /* Secondary compare on size, decreasing */
718 int diff = compare_sizes_for_sort (sizeb, sizea);
719 if (diff != 0)
720 return diff;
721
722 /* Tertiary compare on true alignment, decreasing. */
723 if (aligna < alignb)
724 return -1;
725 if (aligna > alignb)
726 return 1;
727
728 /* Final compare on ID for sort stability, increasing.
729 Two SSA names are compared by their version, SSA names come before
730 non-SSA names, and two normal decls are compared by their DECL_UID. */
731 if (TREE_CODE (decla) == SSA_NAME)
732 {
733 if (TREE_CODE (declb) == SSA_NAME)
734 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
735 else
736 return -1;
737 }
738 else if (TREE_CODE (declb) == SSA_NAME)
739 return 1;
740 else
741 uida = DECL_UID (decla), uidb = DECL_UID (declb);
742 if (uida < uidb)
743 return 1;
744 if (uida > uidb)
745 return -1;
746 return 0;
747 }
748
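/* Maps the DECL_PT_UID of a partitioned variable to the bitmap of DECL_PT_UIDs of all members of its partition; filled in by update_alias_info_with_stack_vars below. */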
749 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
750 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
751
752 /* If the points-to solution *PT points to variables that are in a partition
753 together with other variables, add all partition members to the pointed-to
754 variables bitmap. */
755
756 static void
757 add_partitioned_vars_to_ptset (struct pt_solution *pt,
758 part_hashmap *decls_to_partitions,
759 hash_set<bitmap> *visited, bitmap temp)
760 {
761 bitmap_iterator bi;
762 unsigned i;
763 bitmap *part;
764
765 if (pt->anything
766 || pt->vars == NULL
767 /* The pointed-to vars bitmap is shared, it is enough to
768 visit it once. */
769 || visited->add (pt->vars))
770 return;
771
772 bitmap_clear (temp);
773
774 /* By using a temporary bitmap to store all members of the partitions
775 we have to add we make sure to visit each of the partitions only
776 once. */
777 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
778 if ((!temp
779 || !bitmap_bit_p (temp, i))
780 && (part = decls_to_partitions->get (i)))
781 bitmap_ior_into (temp, *part);
782 if (!bitmap_empty_p (temp))
783 bitmap_ior_into (pt->vars, temp);
784 }
785
786 /* Update points-to sets based on partition info, so we can use them on RTL.
787 The bitmaps representing stack partitions will be saved until expand,
788 where partitioned decls used as bases in memory expressions will be
789 rewritten. */
790
791 static void
792 update_alias_info_with_stack_vars (void)
793 {
794 part_hashmap *decls_to_partitions = NULL;
795 size_t i, j;
796 tree var = NULL_TREE;
797
798 for (i = 0; i < stack_vars_num; i++)
799 {
800 bitmap part = NULL;
801 tree name;
802 struct ptr_info_def *pi;
803
804 /* Not interested in partitions with a single variable. */
805 if (stack_vars[i].representative != i
806 || stack_vars[i].next == EOC)
807 continue;
808
809 if (!decls_to_partitions)
810 {
811 decls_to_partitions = new part_hashmap;
812 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
813 }
814
815 /* Create an SSA_NAME that points to the partition for use
816 as base during alias-oracle queries on RTL for bases that
817 have been partitioned. */
818 if (var == NULL_TREE)
819 var = create_tmp_var (ptr_type_node);
820 name = make_ssa_name (var);
821
822 /* Create bitmaps representing partitions. They will be used for
823 points-to sets later, so use GGC alloc. */
824 part = BITMAP_GGC_ALLOC ();
825 for (j = i; j != EOC; j = stack_vars[j].next)
826 {
827 tree decl = stack_vars[j].decl;
828 unsigned int uid = DECL_PT_UID (decl);
829 bitmap_set_bit (part, uid);
830 decls_to_partitions->put (uid, part);
831 cfun->gimple_df->decls_to_pointers->put (decl, name);
832 if (TREE_ADDRESSABLE (decl))
833 TREE_ADDRESSABLE (name) = 1;
834 }
835
836 /* Make the SSA name point to all partition members. */
837 pi = get_ptr_info (name);
838 pt_solution_set (&pi->pt, part, false);
839 }
840
841 /* Make all points-to sets that contain one member of a partition
842 contain all members of the partition. */
843 if (decls_to_partitions)
844 {
845 unsigned i;
846 tree name;
847 hash_set<bitmap> visited;
848 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
849
850 FOR_EACH_SSA_NAME (i, name, cfun)
851 {
852 struct ptr_info_def *pi;
853
854 if (POINTER_TYPE_P (TREE_TYPE (name))
855 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
856 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
857 &visited, temp);
858 }
859
860 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
861 decls_to_partitions, &visited, temp);
862
863 delete decls_to_partitions;
864 BITMAP_FREE (temp);
865 }
866 }
867
868 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
869 partitioning algorithm. Partitions A and B are known to be non-conflicting.
870 Merge them into a single partition A. */
871
872 static void
873 union_stack_vars (size_t a, size_t b)
874 {
875 class stack_var *vb = &stack_vars[b];
876 bitmap_iterator bi;
877 unsigned u;
878
879 gcc_assert (stack_vars[b].next == EOC);
880 /* Add B to A's partition. */
881 stack_vars[b].next = stack_vars[a].next;
882 stack_vars[b].representative = a;
883 stack_vars[a].next = b;
884
885 /* Make sure A is big enough to hold B. */
886 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
887
888 /* Update the required alignment of partition A to account for B. */
889 if (stack_vars[a].alignb < stack_vars[b].alignb)
890 stack_vars[a].alignb = stack_vars[b].alignb;
891
892 /* Update the interference graph and merge the conflicts. */
893 if (vb->conflicts)
894 {
895 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
896 add_stack_var_conflict (a, stack_vars[u].representative);
897 BITMAP_FREE (vb->conflicts);
898 }
899 }
900
901 /* A subroutine of expand_used_vars. Binpack the variables into
902 partitions constrained by the interference graph. The overall
903 algorithm used is as follows:
904
905 Sort the objects by size in descending order.
906 For each object A {
907 S = size(A)
908 O = 0
909 loop {
910 Look for the largest non-conflicting object B with size <= S.
911 UNION (A, B)
912 }
913 }
914 */
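/* In partition_stack_vars below this amounts to walking the size-sorted array and, for each partition representative A, merging every later non-conflicting object of the same "large"/"small" alignment class into A's partition. */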
915
916 static void
917 partition_stack_vars (void)
918 {
919 size_t si, sj, n = stack_vars_num;
920
921 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
922 for (si = 0; si < n; ++si)
923 stack_vars_sorted[si] = si;
924
925 if (n == 1)
926 return;
927
928 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
929
930 for (si = 0; si < n; ++si)
931 {
932 size_t i = stack_vars_sorted[si];
933 unsigned int ialign = stack_vars[i].alignb;
934 poly_int64 isize = stack_vars[i].size;
935
936 /* Ignore objects that aren't partition representatives. If we
937 see a var that is not a partition representative, it must
938 have been merged earlier. */
939 if (stack_vars[i].representative != i)
940 continue;
941
942 for (sj = si + 1; sj < n; ++sj)
943 {
944 size_t j = stack_vars_sorted[sj];
945 unsigned int jalign = stack_vars[j].alignb;
946 poly_int64 jsize = stack_vars[j].size;
947
948 /* Ignore objects that aren't partition representatives. */
949 if (stack_vars[j].representative != j)
950 continue;
951
952 /* Do not mix objects of "small" (supported) alignment
953 and "large" (unsupported) alignment. */
954 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
955 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
956 break;
957
958 /* For Address Sanitizer do not mix objects with different
959 sizes, as the shorter vars wouldn't be adequately protected.
960 Don't do that for "large" (unsupported) alignment objects,
961 those aren't protected anyway. */
962 if (asan_sanitize_stack_p ()
963 && maybe_ne (isize, jsize)
964 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
965 break;
966
967 /* Ignore conflicting objects. */
968 if (stack_var_conflict_p (i, j))
969 continue;
970
971 /* UNION the objects, placing J at OFFSET. */
972 union_stack_vars (i, j);
973 }
974 }
975
976 update_alias_info_with_stack_vars ();
977 }
978
979 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
980
981 static void
982 dump_stack_var_partition (void)
983 {
984 size_t si, i, j, n = stack_vars_num;
985
986 for (si = 0; si < n; ++si)
987 {
988 i = stack_vars_sorted[si];
989
990 /* Skip variables that aren't partition representatives, for now. */
991 if (stack_vars[i].representative != i)
992 continue;
993
994 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
995 print_dec (stack_vars[i].size, dump_file);
996 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
997
998 for (j = i; j != EOC; j = stack_vars[j].next)
999 {
1000 fputc ('\t', dump_file);
1001 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
1002 }
1003 fputc ('\n', dump_file);
1004 }
1005 }
1006
1007 /* Assign rtl to DECL at BASE + OFFSET. */
1008
1009 static void
1010 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1011 poly_int64 offset)
1012 {
1013 unsigned align;
1014 rtx x;
1015
1016 /* If this fails, we've overflowed the stack frame. Error nicely? */
1017 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1018
1019 if (hwasan_sanitize_stack_p ())
1020 x = targetm.memtag.add_tag (base, offset,
1021 hwasan_current_frame_tag ());
1022 else
1023 x = plus_constant (Pmode, base, offset);
1024
1025 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1026 ? TYPE_MODE (TREE_TYPE (decl))
1027 : DECL_MODE (decl), x);
1028
1029 /* Set the alignment we actually gave this decl if it isn't an SSA name.
1030 If it is, we generate stack slots only accidentally, so it isn't as
1031 important; we'll simply set the alignment directly on the MEM. */
1032
1033 if (stack_vars_base_reg_p (base))
1034 offset -= frame_phase;
1035 align = known_alignment (offset);
1036 align *= BITS_PER_UNIT;
1037 if (align == 0 || align > base_align)
1038 align = base_align;
1039
1040 if (TREE_CODE (decl) != SSA_NAME)
1041 {
1042 /* One would think that we could assert that we're not decreasing
1043 alignment here, but (at least) the i386 port does exactly this
1044 via the MINIMUM_ALIGNMENT hook. */
1045
1046 SET_DECL_ALIGN (decl, align);
1047 DECL_USER_ALIGN (decl) = 0;
1048 }
1049
1050 set_rtl (decl, x);
1051
1052 set_mem_align (x, align);
1053 }
1054
1055 class stack_vars_data
1056 {
1057 public:
1058 /* Vector of offset pairs, always end of some padding followed
1059 by start of the padding that needs Address Sanitizer protection.
1060 The vector is in reversed order; highest offset pairs come first. */
1061 auto_vec<HOST_WIDE_INT> asan_vec;
1062
1063 /* Vector of partition representative decls in between the paddings. */
1064 auto_vec<tree> asan_decl_vec;
1065
1066 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1067 rtx asan_base;
1068
1069 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1070 unsigned int asan_alignb;
1071 };
1072
1073 /* A subroutine of expand_used_vars. Give each partition representative
1074 a unique location within the stack frame. Update each partition member
1075 with that location. */
1076 static void
1077 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1078 {
1079 size_t si, i, j, n = stack_vars_num;
1080 poly_uint64 large_size = 0, large_alloc = 0;
1081 rtx large_base = NULL;
1082 rtx large_untagged_base = NULL;
1083 unsigned large_align = 0;
1084 bool large_allocation_done = false;
1085 tree decl;
1086
1087 /* Determine if there are any variables requiring "large" alignment.
1088 Since these are dynamically allocated, we only process these if
1089 no predicate is involved. */
1090 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1091 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1092 {
1093 /* Find the total size of these variables. */
1094 for (si = 0; si < n; ++si)
1095 {
1096 unsigned alignb;
1097
1098 i = stack_vars_sorted[si];
1099 alignb = stack_vars[i].alignb;
1100
1101 /* All "large" alignment decls come before all "small" alignment
1102 decls, but "large" alignment decls are not sorted based on
1103 their alignment. Increase large_align to track the largest
1104 required alignment. */
1105 if ((alignb * BITS_PER_UNIT) > large_align)
1106 large_align = alignb * BITS_PER_UNIT;
1107
1108 /* Stop when we get to the first decl with "small" alignment. */
1109 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1110 break;
1111
1112 /* Skip variables that aren't partition representatives. */
1113 if (stack_vars[i].representative != i)
1114 continue;
1115
1116 /* Skip variables that have already had rtl assigned. See also
1117 add_stack_var where we perpetrate this pc_rtx hack. */
1118 decl = stack_vars[i].decl;
1119 if (TREE_CODE (decl) == SSA_NAME
1120 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1121 : DECL_RTL (decl) != pc_rtx)
1122 continue;
1123
1124 large_size = aligned_upper_bound (large_size, alignb);
1125 large_size += stack_vars[i].size;
1126 }
1127 }
1128
1129 for (si = 0; si < n; ++si)
1130 {
1131 rtx base;
1132 unsigned base_align, alignb;
1133 poly_int64 offset = 0;
1134
1135 i = stack_vars_sorted[si];
1136
1137 /* Skip variables that aren't partition representatives, for now. */
1138 if (stack_vars[i].representative != i)
1139 continue;
1140
1141 /* Skip variables that have already had rtl assigned. See also
1142 add_stack_var where we perpetrate this pc_rtx hack. */
1143 decl = stack_vars[i].decl;
1144 if (TREE_CODE (decl) == SSA_NAME
1145 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1146 : DECL_RTL (decl) != pc_rtx)
1147 continue;
1148
1149 /* Check the predicate to see whether this variable should be
1150 allocated in this pass. */
1151 if (pred && !pred (i))
1152 continue;
1153
1154 base = (hwasan_sanitize_stack_p ()
1155 ? hwasan_frame_base ()
1156 : virtual_stack_vars_rtx);
1157 alignb = stack_vars[i].alignb;
1158 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1159 {
1160 poly_int64 hwasan_orig_offset;
1161 if (hwasan_sanitize_stack_p ())
1162 {
1163 /* There must be no tag granule "shared" between different
1164 objects. This means that no HWASAN_TAG_GRANULE_SIZE byte
1165 chunk can have more than one object in it.
1166
1167 We ensure this by forcing the end of the last bit of data to
1168 be aligned to HWASAN_TAG_GRANULE_SIZE bytes here, and setting
1169 the start of each variable to be aligned to
1170 HWASAN_TAG_GRANULE_SIZE bytes in `align_local_variable`.
1171
1172 We can't align just one of the start or end, since there are
1173 untagged things stored on the stack which we do not align to
1174 HWASAN_TAG_GRANULE_SIZE bytes. If we only aligned the start
1175 or the end of tagged objects then untagged objects could end
1176 up sharing the first granule of a tagged object or sharing the
1177 last granule of a tagged object respectively. */
1178 hwasan_orig_offset = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1179 gcc_assert (stack_vars[i].alignb >= HWASAN_TAG_GRANULE_SIZE);
1180 }
1181 /* ASAN description strings don't yet have a syntax for expressing
1182 polynomial offsets. */
1183 HOST_WIDE_INT prev_offset;
1184 if (asan_sanitize_stack_p ()
1185 && pred
1186 && frame_offset.is_constant (&prev_offset)
1187 && stack_vars[i].size.is_constant ())
1188 {
1189 if (data->asan_vec.is_empty ())
1190 {
1191 align_frame_offset (ASAN_RED_ZONE_SIZE);
1192 prev_offset = frame_offset.to_constant ();
1193 }
1194 prev_offset = align_base (prev_offset,
1195 ASAN_MIN_RED_ZONE_SIZE,
1196 !FRAME_GROWS_DOWNWARD);
1197 tree repr_decl = NULL_TREE;
1198 unsigned HOST_WIDE_INT size
1199 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1200 if (data->asan_vec.is_empty ())
1201 size = MAX (size, ASAN_RED_ZONE_SIZE);
1202
1203 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1204 ASAN_MIN_RED_ZONE_SIZE);
1205 offset = alloc_stack_frame_space (size, alignment);
1206
1207 data->asan_vec.safe_push (prev_offset);
1208 /* Allocating a constant amount of space from a constant
1209 starting offset must give a constant result. */
1210 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1211 .to_constant ());
1212 /* Find best representative of the partition.
1213 Prefer those with DECL_NAME, even better
1214 satisfying asan_protect_stack_decl predicate. */
1215 for (j = i; j != EOC; j = stack_vars[j].next)
1216 if (asan_protect_stack_decl (stack_vars[j].decl)
1217 && DECL_NAME (stack_vars[j].decl))
1218 {
1219 repr_decl = stack_vars[j].decl;
1220 break;
1221 }
1222 else if (repr_decl == NULL_TREE
1223 && DECL_P (stack_vars[j].decl)
1224 && DECL_NAME (stack_vars[j].decl))
1225 repr_decl = stack_vars[j].decl;
1226 if (repr_decl == NULL_TREE)
1227 repr_decl = stack_vars[i].decl;
1228 data->asan_decl_vec.safe_push (repr_decl);
1229
1230 /* Make sure a representative is unpoisoned if another
1231 variable in the partition is handled by
1232 use-after-scope sanitization. */
1233 if (asan_handled_variables != NULL
1234 && !asan_handled_variables->contains (repr_decl))
1235 {
1236 for (j = i; j != EOC; j = stack_vars[j].next)
1237 if (asan_handled_variables->contains (stack_vars[j].decl))
1238 break;
1239 if (j != EOC)
1240 asan_handled_variables->add (repr_decl);
1241 }
1242
1243 data->asan_alignb = MAX (data->asan_alignb, alignb);
1244 if (data->asan_base == NULL)
1245 data->asan_base = gen_reg_rtx (Pmode);
1246 base = data->asan_base;
1247
1248 if (!STRICT_ALIGNMENT)
1249 base_align = crtl->max_used_stack_slot_alignment;
1250 else
1251 base_align = MAX (crtl->max_used_stack_slot_alignment,
1252 GET_MODE_ALIGNMENT (SImode)
1253 << ASAN_SHADOW_SHIFT);
1254 }
1255 else
1256 {
1257 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1258 base_align = crtl->max_used_stack_slot_alignment;
1259
1260 if (hwasan_sanitize_stack_p ())
1261 {
1262 /* Align again since the point of this alignment is to handle
1263 the "end" of the object (i.e. smallest address after the
1264 stack object). For FRAME_GROWS_DOWNWARD that requires
1265 aligning the stack before allocating, but for a frame that
1266 grows upwards that requires aligning the stack after
1267 allocation.
1268
1269 Use `frame_offset` to record the offset value rather than
1270 `offset` since the `frame_offset` describes the extent
1271 allocated for this particular variable while `offset`
1272 describes the address that this variable starts at. */
1273 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1274 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1275 hwasan_orig_offset, frame_offset);
1276 }
1277 }
1278 }
1279 else
1280 {
1281 /* Large alignment is only processed in the last pass. */
1282 if (pred)
1283 continue;
1284
1285 /* If there were any variables requiring "large" alignment, allocate
1286 space. */
1287 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1288 {
1289 poly_int64 loffset;
1290 rtx large_allocsize;
1291
1292 large_allocsize = gen_int_mode (large_size, Pmode);
1293 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1294 loffset = alloc_stack_frame_space
1295 (rtx_to_poly_int64 (large_allocsize),
1296 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1297 large_base = get_dynamic_stack_base (loffset, large_align, base);
1298 large_allocation_done = true;
1299 }
1300
1301 gcc_assert (large_base != NULL);
1302 large_alloc = aligned_upper_bound (large_alloc, alignb);
1303 offset = large_alloc;
1304 large_alloc += stack_vars[i].size;
1305 if (hwasan_sanitize_stack_p ())
1306 {
1307 /* An object with a large alignment requirement means that the
1308 alignment requirement is greater than the required alignment
1309 for tags. */
1310 if (!large_untagged_base)
1311 large_untagged_base
1312 = targetm.memtag.untagged_pointer (large_base, NULL_RTX);
1313 /* Ensure the end of the variable is also aligned correctly. */
1314 poly_int64 align_again
1315 = aligned_upper_bound (large_alloc, HWASAN_TAG_GRANULE_SIZE);
1316 /* For large allocations we always allocate a chunk of space
1317 (which is addressed by large_untagged_base/large_base) and
1318 then use positive offsets from that. Hence the farthest
1319 offset is `align_again` and the nearest offset from the base
1320 is `offset`. */
1321 hwasan_record_stack_var (large_untagged_base, large_base,
1322 offset, align_again);
1323 }
1324
1325 base = large_base;
1326 base_align = large_align;
1327 }
1328
1329 /* Create rtl for each variable based on their location within the
1330 partition. */
1331 for (j = i; j != EOC; j = stack_vars[j].next)
1332 {
1333 expand_one_stack_var_at (stack_vars[j].decl,
1334 base, base_align, offset);
1335 }
1336 if (hwasan_sanitize_stack_p ())
1337 hwasan_increment_frame_tag ();
1338 }
1339
1340 gcc_assert (known_eq (large_alloc, large_size));
1341 }
1342
1343 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1344 static poly_uint64
1345 account_stack_vars (void)
1346 {
1347 size_t si, j, i, n = stack_vars_num;
1348 poly_uint64 size = 0;
1349
1350 for (si = 0; si < n; ++si)
1351 {
1352 i = stack_vars_sorted[si];
1353
1354 /* Skip variables that aren't partition representatives, for now. */
1355 if (stack_vars[i].representative != i)
1356 continue;
1357
1358 size += stack_vars[i].size;
1359 for (j = i; j != EOC; j = stack_vars[j].next)
1360 set_rtl (stack_vars[j].decl, NULL);
1361 }
1362 return size;
1363 }
1364
1365 /* Record the RTL assignment X for the default def of PARM. */
1366
1367 extern void
1368 set_parm_rtl (tree parm, rtx x)
1369 {
1370 gcc_assert (TREE_CODE (parm) == PARM_DECL
1371 || TREE_CODE (parm) == RESULT_DECL);
1372
1373 if (x && !MEM_P (x))
1374 {
1375 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1376 TYPE_MODE (TREE_TYPE (parm)),
1377 TYPE_ALIGN (TREE_TYPE (parm)));
1378
1379 /* If the variable alignment is very large we'll dynamically
1380 allocate it, which means that the in-frame portion is just a
1381 pointer. ??? We've got a pseudo for sure here, do we
1382 actually dynamically allocate its spilling area if needed?
1383 ??? Isn't it a problem when Pmode alignment also exceeds
1384 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1385 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1386 align = GET_MODE_ALIGNMENT (Pmode);
1387
1388 record_alignment_for_reg_var (align);
1389 }
1390
1391 tree ssa = ssa_default_def (cfun, parm);
1392 if (!ssa)
1393 return set_rtl (parm, x);
1394
1395 int part = var_to_partition (SA.map, ssa);
1396 gcc_assert (part != NO_PARTITION);
1397
1398 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1399 gcc_assert (changed);
1400
1401 set_rtl (ssa, x);
1402 gcc_assert (DECL_RTL (parm) == x);
1403 }
1404
1405 /* A subroutine of expand_one_var. Called to immediately assign rtl
1406 to a variable to be allocated in the stack frame. */
1407
1408 static void
1409 expand_one_stack_var_1 (tree var)
1410 {
1411 poly_uint64 size;
1412 poly_int64 offset;
1413 unsigned byte_align;
1414
1415 if (TREE_CODE (var) == SSA_NAME)
1416 {
1417 tree type = TREE_TYPE (var);
1418 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1419 }
1420 else
1421 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1422
1423 byte_align = align_local_variable (var, true);
1424
1425 /* We handle highly aligned variables in expand_stack_vars. */
1426 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1427
1428 rtx base;
1429 if (hwasan_sanitize_stack_p ())
1430 {
1431 /* Allocate zero bytes to align the stack. */
1432 poly_int64 hwasan_orig_offset
1433 = align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1434 offset = alloc_stack_frame_space (size, byte_align);
1435 align_frame_offset (HWASAN_TAG_GRANULE_SIZE);
1436 base = hwasan_frame_base ();
1437 /* Use `frame_offset` to automatically account for machines where the
1438 frame grows upwards.
1439
1440 `offset` will always point to the "start" of the stack object, which
1441 will be the smallest address; for ! FRAME_GROWS_DOWNWARD this is *not*
1442 the "furthest" offset from the base delimiting the current stack
1443 object. `frame_offset` always delimits the furthest extent of the frame allocated so far.
1444 */
1445 hwasan_record_stack_var (virtual_stack_vars_rtx, base,
1446 hwasan_orig_offset, frame_offset);
1447 }
1448 else
1449 {
1450 offset = alloc_stack_frame_space (size, byte_align);
1451 base = virtual_stack_vars_rtx;
1452 }
1453
1454 expand_one_stack_var_at (var, base,
1455 crtl->max_used_stack_slot_alignment, offset);
1456
1457 if (hwasan_sanitize_stack_p ())
1458 hwasan_increment_frame_tag ();
1459 }
1460
1461 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1462 already assigned some MEM. */
1463
1464 static void
1465 expand_one_stack_var (tree var)
1466 {
1467 if (TREE_CODE (var) == SSA_NAME)
1468 {
1469 int part = var_to_partition (SA.map, var);
1470 if (part != NO_PARTITION)
1471 {
1472 rtx x = SA.partition_to_pseudo[part];
1473 gcc_assert (x);
1474 gcc_assert (MEM_P (x));
1475 return;
1476 }
1477 }
1478
1479 return expand_one_stack_var_1 (var);
1480 }
1481
1482 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1483 that will reside in a hard register. */
1484
1485 static void
1486 expand_one_hard_reg_var (tree var)
1487 {
1488 rest_of_decl_compilation (var, 0, 0);
1489 }
1490
1491 /* Record the alignment requirements of some variable assigned to a
1492 pseudo. */
1493
1494 static void
1495 record_alignment_for_reg_var (unsigned int align)
1496 {
1497 if (SUPPORTS_STACK_ALIGNMENT
1498 && crtl->stack_alignment_estimated < align)
1499 {
1500 /* stack_alignment_estimated shouldn't change after the stack
1501 realign decision has been made. */
1502 gcc_assert (!crtl->stack_realign_processed);
1503 crtl->stack_alignment_estimated = align;
1504 }
1505
1506 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1507 So here we only make sure stack_alignment_needed >= align. */
1508 if (crtl->stack_alignment_needed < align)
1509 crtl->stack_alignment_needed = align;
1510 if (crtl->max_used_stack_slot_alignment < align)
1511 crtl->max_used_stack_slot_alignment = align;
1512 }
1513
1514 /* Create RTL for an SSA partition. */
1515
1516 static void
1517 expand_one_ssa_partition (tree var)
1518 {
1519 int part = var_to_partition (SA.map, var);
1520 gcc_assert (part != NO_PARTITION);
1521
1522 if (SA.partition_to_pseudo[part])
1523 return;
1524
1525 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1526 TYPE_MODE (TREE_TYPE (var)),
1527 TYPE_ALIGN (TREE_TYPE (var)));
1528
1529 /* If the variable alignment is very large we'll dynamically allocate
1530 it, which means that the in-frame portion is just a pointer. */
1531 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1532 align = GET_MODE_ALIGNMENT (Pmode);
1533
1534 record_alignment_for_reg_var (align);
1535
1536 if (!use_register_for_decl (var))
1537 {
1538 if (defer_stack_allocation (var, true))
1539 add_stack_var (var, true);
1540 else
1541 expand_one_stack_var_1 (var);
1542 return;
1543 }
1544
1545 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1546 rtx x = gen_reg_rtx (reg_mode);
1547
1548 set_rtl (var, x);
1549
1550 /* For a promoted variable, X will not be used directly but wrapped in a
1551 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1552 will assume that its upper bits can be inferred from its lower bits.
1553 Therefore, if X isn't initialized on every path from the entry, then
1554 we must do it manually in order to fulfill the above assumption. */
1555 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1556 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1557 emit_move_insn (x, CONST0_RTX (reg_mode));
1558 }
1559
1560 /* Record the association between the RTL generated for partition PART
1561 and the underlying variable of the SSA_NAME VAR. */
1562
1563 static void
1564 adjust_one_expanded_partition_var (tree var)
1565 {
1566 if (!var)
1567 return;
1568
1569 tree decl = SSA_NAME_VAR (var);
1570
1571 int part = var_to_partition (SA.map, var);
1572 if (part == NO_PARTITION)
1573 return;
1574
1575 rtx x = SA.partition_to_pseudo[part];
1576
1577 gcc_assert (x);
1578
1579 set_rtl (var, x);
1580
1581 if (!REG_P (x))
1582 return;
1583
1584 /* Note if the object is a user variable. */
1585 if (decl && !DECL_ARTIFICIAL (decl))
1586 mark_user_reg (x);
1587
1588 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1589 mark_reg_pointer (x, get_pointer_alignment (var));
1590 }
1591
1592 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1593 that will reside in a pseudo register. */
1594
1595 static void
1596 expand_one_register_var (tree var)
1597 {
1598 if (TREE_CODE (var) == SSA_NAME)
1599 {
1600 int part = var_to_partition (SA.map, var);
1601 if (part != NO_PARTITION)
1602 {
1603 rtx x = SA.partition_to_pseudo[part];
1604 gcc_assert (x);
1605 gcc_assert (REG_P (x));
1606 return;
1607 }
1608 gcc_unreachable ();
1609 }
1610
1611 tree decl = var;
1612 tree type = TREE_TYPE (decl);
1613 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1614 rtx x = gen_reg_rtx (reg_mode);
1615
1616 set_rtl (var, x);
1617
1618 /* Note if the object is a user variable. */
1619 if (!DECL_ARTIFICIAL (decl))
1620 mark_user_reg (x);
1621
1622 if (POINTER_TYPE_P (type))
1623 mark_reg_pointer (x, get_pointer_alignment (var));
1624 }
1625
1626 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1627 has some associated error, e.g. its type is error-mark. We just need
1628 to pick something that won't crash the rest of the compiler. */
1629
1630 static void
1631 expand_one_error_var (tree var)
1632 {
1633 machine_mode mode = DECL_MODE (var);
1634 rtx x;
1635
1636 if (mode == BLKmode)
1637 x = gen_rtx_MEM (BLKmode, const0_rtx);
1638 else if (mode == VOIDmode)
1639 x = const0_rtx;
1640 else
1641 x = gen_reg_rtx (mode);
1642
1643 SET_DECL_RTL (var, x);
1644 }
1645
1646 /* A subroutine of expand_one_var. VAR is a variable that will be
1647 allocated to the local stack frame. Return true if we wish to
1648 add VAR to STACK_VARS so that it will be coalesced with other
1649 variables. Return false to allocate VAR immediately.
1650
1651 This function is used to reduce the number of variables considered
1652 for coalescing, which reduces the size of the quadratic problem. */
1653
1654 static bool
1655 defer_stack_allocation (tree var, bool toplevel)
1656 {
1657 tree size_unit = TREE_CODE (var) == SSA_NAME
1658 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1659 : DECL_SIZE_UNIT (var);
1660 poly_uint64 size;
1661
1662 /* Whether the variable is small enough for immediate allocation not to be
1663 a problem with regard to the frame size. */
1664 bool smallish
1665 = (poly_int_tree_p (size_unit, &size)
1666 && (estimated_poly_value (size)
1667 < param_min_size_for_stack_sharing));
1668
1669 /* If stack protection is enabled, *all* stack variables must be deferred,
1670 so that we can re-order the strings to the top of the frame.
1671 Similarly for Address Sanitizer. */
1672 if (flag_stack_protect || asan_sanitize_stack_p ())
1673 return true;
1674
1675 unsigned int align = TREE_CODE (var) == SSA_NAME
1676 ? TYPE_ALIGN (TREE_TYPE (var))
1677 : DECL_ALIGN (var);
1678
1679 /* We handle "large" alignment via dynamic allocation. We want to handle
1680 this extra complication in only one place, so defer them. */
1681 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1682 return true;
1683
1684 bool ignored = TREE_CODE (var) == SSA_NAME
1685 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1686 : DECL_IGNORED_P (var);
1687
1688 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1689 might be detached from their block and appear at toplevel when we reach
1690 here. We want to coalesce them with variables from other blocks when
1691 the immediate contribution to the frame size would be noticeable. */
1692 if (toplevel && optimize > 0 && ignored && !smallish)
1693 return true;
1694
1695 /* Variables declared in the outermost scope automatically conflict
1696 with every other variable. The only reason to want to defer them
1697 at all is that, after sorting, we can more efficiently pack
1698 small variables in the stack frame. Continue to defer at -O2. */
1699 if (toplevel && optimize < 2)
1700 return false;
1701
1702 /* Without optimization, *most* variables are allocated from the
1703 stack, which makes the quadratic problem large exactly when we
1704 want compilation to proceed as quickly as possible. On the
1705 other hand, we don't want the function's stack frame size to
1706 get completely out of hand. So we avoid adding scalars and
1707 "small" aggregates to the list at all. */
1708 if (optimize == 0 && smallish)
1709 return false;
1710
1711 return true;
1712 }
1713
1714 /* A subroutine of expand_used_vars. Expand one variable according to
1715 its flavor. Variables to be placed on the stack are not actually
1716 expanded yet, merely recorded.
1717 When REALLY_EXPAND is false, only add stack values to be allocated.
1718 Return stack usage this variable is supposed to take.
1719 */
1720
1721 static poly_uint64
1722 expand_one_var (tree var, bool toplevel, bool really_expand,
1723 bitmap forced_stack_var = NULL)
1724 {
1725 unsigned int align = BITS_PER_UNIT;
1726 tree origvar = var;
1727
1728 var = SSAVAR (var);
1729
1730 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1731 {
1732 if (is_global_var (var))
1733 return 0;
1734
1735 /* Because we don't know if VAR will be in register or on stack,
1736 we conservatively assume it will be on stack even if VAR is
1737 eventually put into register after RA pass. For non-automatic
1738 variables, which won't be on stack, we collect alignment of
1739 type and ignore user specified alignment. Similarly for
1740 SSA_NAMEs for which use_register_for_decl returns true. */
1741 if (TREE_STATIC (var)
1742 || DECL_EXTERNAL (var)
1743 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1744 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1745 TYPE_MODE (TREE_TYPE (var)),
1746 TYPE_ALIGN (TREE_TYPE (var)));
1747 else if (DECL_HAS_VALUE_EXPR_P (var)
1748 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1749 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1750 or variables which were assigned a stack slot already by
1751 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1752 changed from the offset chosen to it. */
1753 align = crtl->stack_alignment_estimated;
1754 else
1755 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1756
1757 /* If the variable alignment is very large we'll dynamically allocate
1758 it, which means that the in-frame portion is just a pointer. */
1759 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1760 align = GET_MODE_ALIGNMENT (Pmode);
1761 }
1762
1763 record_alignment_for_reg_var (align);
1764
1765 poly_uint64 size;
1766 if (TREE_CODE (origvar) == SSA_NAME)
1767 {
1768 gcc_assert (!VAR_P (var)
1769 || (!DECL_EXTERNAL (var)
1770 && !DECL_HAS_VALUE_EXPR_P (var)
1771 && !TREE_STATIC (var)
1772 && TREE_TYPE (var) != error_mark_node
1773 && !DECL_HARD_REGISTER (var)
1774 && really_expand));
1775 }
1776 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1777 ;
1778 else if (DECL_EXTERNAL (var))
1779 ;
1780 else if (DECL_HAS_VALUE_EXPR_P (var))
1781 ;
1782 else if (TREE_STATIC (var))
1783 ;
1784 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1785 ;
1786 else if (TREE_TYPE (var) == error_mark_node)
1787 {
1788 if (really_expand)
1789 expand_one_error_var (var);
1790 }
1791 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1792 {
1793 if (really_expand)
1794 {
1795 expand_one_hard_reg_var (var);
1796 if (!DECL_HARD_REGISTER (var))
1797 /* Invalid register specification. */
1798 expand_one_error_var (var);
1799 }
1800 }
1801 else if (use_register_for_decl (var)
1802 && (!forced_stack_var
1803 || !bitmap_bit_p (forced_stack_var, DECL_UID (var))))
1804 {
1805 if (really_expand)
1806 expand_one_register_var (origvar);
1807 }
1808 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1809 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1810 {
1811 /* Reject variables which cover more than half of the address-space. */
1812 if (really_expand)
1813 {
1814 if (DECL_NONLOCAL_FRAME (var))
1815 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1816 "total size of local objects is too large");
1817 else
1818 error_at (DECL_SOURCE_LOCATION (var),
1819 "size of variable %q+D is too large", var);
1820 expand_one_error_var (var);
1821 }
1822 }
1823 else if (defer_stack_allocation (var, toplevel))
1824 add_stack_var (origvar, really_expand);
1825 else
1826 {
1827 if (really_expand)
1828 {
1829 if (lookup_attribute ("naked",
1830 DECL_ATTRIBUTES (current_function_decl)))
1831 error ("cannot allocate stack for variable %q+D, naked function",
1832 var);
1833
1834 expand_one_stack_var (origvar);
1835 }
1836 return size;
1837 }
1838 return 0;
1839 }
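
/* Illustration only (hypothetical user code): a local whose requested
   alignment cannot be supported on the stack is handled by the
   dynamic-allocation path noted above, so only a pointer-sized slot is
   accounted for in the frame, e.g.

     void g (void)
     {
       int x __attribute__ ((aligned (1 << 20)));   // over-aligned local
     }

   on targets where such an alignment exceeds MAX_SUPPORTED_STACK_ALIGNMENT.  */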
1840
1841 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1842 expanding variables. Those variables that can be put into registers
1843 are allocated pseudos; those that can't are put on the stack.
1844
1845 TOPLEVEL is true if this is the outermost BLOCK. */
1846
1847 static void
1848 expand_used_vars_for_block (tree block, bool toplevel, bitmap forced_stack_vars)
1849 {
1850 tree t;
1851
1852 /* Expand all variables at this level. */
1853 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1854 if (TREE_USED (t)
1855 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1856 || !DECL_NONSHAREABLE (t)))
1857 expand_one_var (t, toplevel, true, forced_stack_vars);
1858
1859 /* Expand all variables at containing levels. */
1860 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1861 expand_used_vars_for_block (t, false, forced_stack_vars);
1862 }
1863
1864 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1865 and clear TREE_USED on all local variables. */
1866
1867 static void
1868 clear_tree_used (tree block)
1869 {
1870 tree t;
1871
1872 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1873 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1874 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1875 || !DECL_NONSHAREABLE (t))
1876 TREE_USED (t) = 0;
1877
1878 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1879 clear_tree_used (t);
1880 }
1881
1882 /* Examine TYPE and determine a bit mask of the following features. */
1883
1884 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1885 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1886 #define SPCT_HAS_ARRAY 4
1887 #define SPCT_HAS_AGGREGATE 8
1888
1889 static unsigned int
1890 stack_protect_classify_type (tree type)
1891 {
1892 unsigned int ret = 0;
1893 tree t;
1894
1895 switch (TREE_CODE (type))
1896 {
1897 case ARRAY_TYPE:
1898 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1899 if (t == char_type_node
1900 || t == signed_char_type_node
1901 || t == unsigned_char_type_node)
1902 {
1903 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1904 unsigned HOST_WIDE_INT len;
1905
1906 if (!TYPE_SIZE_UNIT (type)
1907 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1908 len = max;
1909 else
1910 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1911
1912 if (len < max)
1913 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1914 else
1915 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1916 }
1917 else
1918 ret = SPCT_HAS_ARRAY;
1919 break;
1920
1921 case UNION_TYPE:
1922 case QUAL_UNION_TYPE:
1923 case RECORD_TYPE:
1924 ret = SPCT_HAS_AGGREGATE;
1925 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1926 if (TREE_CODE (t) == FIELD_DECL)
1927 ret |= stack_protect_classify_type (TREE_TYPE (t));
1928 break;
1929
1930 default:
1931 break;
1932 }
1933
1934 return ret;
1935 }
1936
1937 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1938 part of the local stack frame. Remember if we ever return nonzero for
1939 any variable in this function. The return value is the phase number in
1940 which the variable should be allocated. */
1941
1942 static int
1943 stack_protect_decl_phase (tree decl)
1944 {
1945 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1946 int ret = 0;
1947
1948 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1949 has_short_buffer = true;
1950
1951 tree attribs = DECL_ATTRIBUTES (current_function_decl);
1952 if (!lookup_attribute ("no_stack_protector", attribs)
1953 && (flag_stack_protect == SPCT_FLAG_ALL
1954 || flag_stack_protect == SPCT_FLAG_STRONG
1955 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1956 && lookup_attribute ("stack_protect", attribs))))
1957 {
1958 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1959 && !(bits & SPCT_HAS_AGGREGATE))
1960 ret = 1;
1961 else if (bits & SPCT_HAS_ARRAY)
1962 ret = 2;
1963 }
1964 else
1965 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1966
1967 if (ret)
1968 has_protected_decls = true;
1969
1970 return ret;
1971 }
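
/* Illustration only (hypothetical locals): under -fstack-protector-strong
   and the default --param ssp-buffer-size=8, the classification above
   gives

     char small[4];    // SPCT_HAS_SMALL_CHAR_ARRAY -> phase 1
     char big[64];     // SPCT_HAS_LARGE_CHAR_ARRAY -> phase 1
     int  other[16];   // SPCT_HAS_ARRAY only       -> phase 2
     int  scalar;      // no array bits             -> phase 0

   Phase 1 variables are expanded first, into the vulnerable upper part of
   the frame next to the guard, then phase 2, then everything else.  */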
1972
1973 /* Two helper routines that check for phase 1 and phase 2. These are used
1974 as callbacks for expand_stack_vars. */
1975
1976 static bool
1977 stack_protect_decl_phase_1 (size_t i)
1978 {
1979 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1980 }
1981
1982 static bool
1983 stack_protect_decl_phase_2 (size_t i)
1984 {
1985 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1986 }
1987
1988 /* A helper function that checks for the asan phase (with stack protector
1989    it is phase 3).  This is used as a callback for expand_stack_vars.
1990    Returns true if any of the vars in the partition need to be protected.  */
1991
1992 static bool
1993 asan_decl_phase_3 (size_t i)
1994 {
1995 while (i != EOC)
1996 {
1997 if (asan_protect_stack_decl (stack_vars[i].decl))
1998 return true;
1999 i = stack_vars[i].next;
2000 }
2001 return false;
2002 }
2003
2004 /* Ensure that variables in different stack protection phases conflict
2005    so that they are not merged into the same stack slot.
2006    Return true if there are any address-taken variables.  */
2007
2008 static bool
2009 add_stack_protection_conflicts (void)
2010 {
2011 size_t i, j, n = stack_vars_num;
2012 unsigned char *phase;
2013 bool ret = false;
2014
2015 phase = XNEWVEC (unsigned char, n);
2016 for (i = 0; i < n; ++i)
2017 {
2018 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
2019 if (TREE_ADDRESSABLE (stack_vars[i].decl))
2020 ret = true;
2021 }
2022
2023 for (i = 0; i < n; ++i)
2024 {
2025 unsigned char ph_i = phase[i];
2026 for (j = i + 1; j < n; ++j)
2027 if (ph_i != phase[j])
2028 add_stack_var_conflict (i, j);
2029 }
2030
2031 XDELETEVEC (phase);
2032 return ret;
2033 }
2034
2035 /* Create a decl for the guard at the top of the stack frame. */
2036
2037 static void
2038 create_stack_guard (void)
2039 {
2040 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
2041 VAR_DECL, NULL, ptr_type_node);
2042 TREE_THIS_VOLATILE (guard) = 1;
2043 TREE_USED (guard) = 1;
2044 expand_one_stack_var (guard);
2045 crtl->stack_protect_guard = guard;
2046 }
2047
2048 /* Prepare for expanding variables. */
2049 static void
2050 init_vars_expansion (void)
2051 {
2052 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
2053 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
2054
2055 /* A map from decl to stack partition. */
2056 decl_to_stack_part = new hash_map<tree, size_t>;
2057
2058 /* Initialize local stack smashing state. */
2059 has_protected_decls = false;
2060 has_short_buffer = false;
2061 if (hwasan_sanitize_stack_p ())
2062 hwasan_record_frame_init ();
2063 }
2064
2065 /* Free up stack variable graph data. */
2066 static void
2067 fini_vars_expansion (void)
2068 {
2069 bitmap_obstack_release (&stack_var_bitmap_obstack);
2070 if (stack_vars)
2071 XDELETEVEC (stack_vars);
2072 if (stack_vars_sorted)
2073 XDELETEVEC (stack_vars_sorted);
2074 stack_vars = NULL;
2075 stack_vars_sorted = NULL;
2076 stack_vars_alloc = stack_vars_num = 0;
2077 delete decl_to_stack_part;
2078 decl_to_stack_part = NULL;
2079 }
2080
2081 /* Make a fair guess for the size of the stack frame of the function
2082 in NODE. This doesn't have to be exact, the result is only used in
2083 the inline heuristics. So we don't want to run the full stack var
2084 packing algorithm (which is quadratic in the number of stack vars).
2085 Instead, we calculate the total size of all stack vars. This turns
2086 out to be a pretty fair estimate -- packing of stack vars doesn't
2087 happen very often. */
2088
2089 HOST_WIDE_INT
2090 estimated_stack_frame_size (struct cgraph_node *node)
2091 {
2092 poly_int64 size = 0;
2093 size_t i;
2094 tree var;
2095 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2096
2097 push_cfun (fn);
2098
2099 init_vars_expansion ();
2100
2101 FOR_EACH_LOCAL_DECL (fn, i, var)
2102 if (auto_var_in_fn_p (var, fn->decl))
2103 size += expand_one_var (var, true, false);
2104
2105 if (stack_vars_num > 0)
2106 {
2107 /* Fake sorting the stack vars for account_stack_vars (). */
2108 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
2109 for (i = 0; i < stack_vars_num; ++i)
2110 stack_vars_sorted[i] = i;
2111 size += account_stack_vars ();
2112 }
2113
2114 fini_vars_expansion ();
2115 pop_cfun ();
2116 return estimated_poly_value (size);
2117 }
2118
2119 /* Check if the current function has calls that use a return slot. */
2120
2121 static bool
2122 stack_protect_return_slot_p ()
2123 {
2124 basic_block bb;
2125
2126 FOR_ALL_BB_FN (bb, cfun)
2127 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2128 !gsi_end_p (gsi); gsi_next (&gsi))
2129 {
2130 gimple *stmt = gsi_stmt (gsi);
2131 /* This assumes that calls to internal-only functions never
2132 use a return slot. */
2133 if (is_gimple_call (stmt)
2134 && !gimple_call_internal_p (stmt)
2135 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2136 gimple_call_fndecl (stmt)))
2137 return true;
2138 }
2139 return false;
2140 }
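
/* Illustration only (hypothetical caller): a call whose aggregate return
   value needs a return slot, e.g.

     struct big { char bytes[128]; };
     struct big make_big (void);

     struct big b = make_big ();   // aggregate_value_p -> return slot

   makes the predicate above return true, which under
   -fstack-protector-strong forces a stack guard for the caller.  */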
2141
2142 /* Expand all variables used in the function. */
2143
2144 static rtx_insn *
2145 expand_used_vars (bitmap forced_stack_vars)
2146 {
2147 tree var, outer_block = DECL_INITIAL (current_function_decl);
2148 auto_vec<tree> maybe_local_decls;
2149 rtx_insn *var_end_seq = NULL;
2150 unsigned i;
2151 unsigned len;
2152 bool gen_stack_protect_signal = false;
2153
2154 /* Compute the phase of the stack frame for this function. */
2155 {
2156 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2157 int off = targetm.starting_frame_offset () % align;
2158 frame_phase = off ? align - off : 0;
2159 }
2160
2161 /* Set TREE_USED on all variables in the local_decls. */
2162 FOR_EACH_LOCAL_DECL (cfun, i, var)
2163 TREE_USED (var) = 1;
2164 /* Clear TREE_USED on all variables associated with a block scope. */
2165 clear_tree_used (DECL_INITIAL (current_function_decl));
2166
2167 init_vars_expansion ();
2168
2169 if (targetm.use_pseudo_pic_reg ())
2170 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2171
2172 for (i = 0; i < SA.map->num_partitions; i++)
2173 {
2174 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2175 continue;
2176
2177 tree var = partition_to_var (SA.map, i);
2178
2179 gcc_assert (!virtual_operand_p (var));
2180
2181 expand_one_ssa_partition (var);
2182 }
2183
2184 if (flag_stack_protect == SPCT_FLAG_STRONG)
2185 gen_stack_protect_signal = stack_protect_return_slot_p ();
2186
2187 /* At this point all variables on the local_decls with TREE_USED
2188 set are not associated with any block scope. Lay them out. */
2189
2190 len = vec_safe_length (cfun->local_decls);
2191 FOR_EACH_LOCAL_DECL (cfun, i, var)
2192 {
2193 bool expand_now = false;
2194
2195 /* Expanded above already. */
2196 if (is_gimple_reg (var))
2197 {
2198 TREE_USED (var) = 0;
2199 goto next;
2200 }
2201 /* We didn't set a block for static or extern because it's hard
2202 to tell the difference between a global variable (re)declared
2203 in a local scope, and one that's really declared there to
2204 begin with. And it doesn't really matter much, since we're
2205 not giving them stack space. Expand them now. */
2206 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2207 expand_now = true;
2208
2209 /* Expand variables not associated with any block now. Those created by
2210 the optimizers could be live anywhere in the function. Those that
2211 could possibly have been scoped originally and detached from their
2212 block will have their allocation deferred so we coalesce them with
2213 others when optimization is enabled. */
2214 else if (TREE_USED (var))
2215 expand_now = true;
2216
2217 /* Finally, mark all variables on the list as used. We'll use
2218 this in a moment when we expand those associated with scopes. */
2219 TREE_USED (var) = 1;
2220
2221 if (expand_now)
2222 expand_one_var (var, true, true, forced_stack_vars);
2223
2224 next:
2225 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2226 {
2227 rtx rtl = DECL_RTL_IF_SET (var);
2228
2229 /* Keep artificial non-ignored vars in cfun->local_decls
2230 chain until instantiate_decls. */
2231 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2232 add_local_decl (cfun, var);
2233 else if (rtl == NULL_RTX)
2234 /* If rtl isn't set yet, which can happen e.g. with
2235 -fstack-protector, retry before returning from this
2236 function. */
2237 maybe_local_decls.safe_push (var);
2238 }
2239 }
2240
2241 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2242
2243 +-----------------+-----------------+
2244 | ...processed... | ...duplicates...|
2245 +-----------------+-----------------+
2246 ^
2247 +-- LEN points here.
2248
2249 We just want the duplicates, as those are the artificial
2250 non-ignored vars that we want to keep until instantiate_decls.
2251 Move them down and truncate the array. */
2252 if (!vec_safe_is_empty (cfun->local_decls))
2253 cfun->local_decls->block_remove (0, len);
2254
2255 /* At this point, all variables within the block tree with TREE_USED
2256 set are actually used by the optimized function. Lay them out. */
2257 expand_used_vars_for_block (outer_block, true, forced_stack_vars);
2258
2259 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2260 if (stack_vars_num > 0)
2261 {
2262 bool has_addressable_vars = false;
2263
2264 add_scope_conflicts ();
2265
2266 /* If stack protection is enabled, we don't share space between
2267 vulnerable data and non-vulnerable data. */
2268 if (flag_stack_protect != 0
2269 && !lookup_attribute ("no_stack_protector", attribs)
2270 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2271 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2272 && lookup_attribute ("stack_protect", attribs))))
2273 has_addressable_vars = add_stack_protection_conflicts ();
2274
2275 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2276 gen_stack_protect_signal = true;
2277
2278 /* Now that we have collected all stack variables, and have computed a
2279 minimal interference graph, attempt to save some stack space. */
2280 partition_stack_vars ();
2281 if (dump_file)
2282 dump_stack_var_partition ();
2283 }
2284
2285
2286 if (!lookup_attribute ("no_stack_protector", attribs))
2287 switch (flag_stack_protect)
2288 {
2289 case SPCT_FLAG_ALL:
2290 create_stack_guard ();
2291 break;
2292
2293 case SPCT_FLAG_STRONG:
2294 if (gen_stack_protect_signal
2295 || cfun->calls_alloca
2296 || has_protected_decls
2297 || lookup_attribute ("stack_protect", attribs))
2298 create_stack_guard ();
2299 break;
2300
2301 case SPCT_FLAG_DEFAULT:
2302 if (cfun->calls_alloca
2303 || has_protected_decls
2304 || lookup_attribute ("stack_protect", attribs))
2305 create_stack_guard ();
2306 break;
2307
2308 case SPCT_FLAG_EXPLICIT:
2309 if (lookup_attribute ("stack_protect", attribs))
2310 create_stack_guard ();
2311 break;
2312
2313 default:
2314 break;
2315 }
2316
2317 /* Assign rtl to each variable based on these partitions. */
2318 if (stack_vars_num > 0)
2319 {
2320 class stack_vars_data data;
2321
2322 data.asan_base = NULL_RTX;
2323 data.asan_alignb = 0;
2324
2325 /* Reorder decls to be protected by iterating over the variables
2326 array multiple times, and allocating out of each phase in turn. */
2327 /* ??? We could probably integrate this into the qsort we did
2328 earlier, such that we naturally see these variables first,
2329 and thus naturally allocate things in the right order. */
2330 if (has_protected_decls)
2331 {
2332 /* Phase 1 contains only character arrays. */
2333 expand_stack_vars (stack_protect_decl_phase_1, &data);
2334
2335 /* Phase 2 contains other kinds of arrays. */
2336 if (!lookup_attribute ("no_stack_protector", attribs)
2337 && (flag_stack_protect == SPCT_FLAG_ALL
2338 || flag_stack_protect == SPCT_FLAG_STRONG
2339 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2340 && lookup_attribute ("stack_protect", attribs))))
2341 expand_stack_vars (stack_protect_decl_phase_2, &data);
2342 }
2343
2344 if (asan_sanitize_stack_p ())
2345 /* Phase 3, any partitions that need asan protection
2346 in addition to phase 1 and 2. */
2347 expand_stack_vars (asan_decl_phase_3, &data);
2348
2349 /* ASAN description strings don't yet have a syntax for expressing
2350 polynomial offsets. */
2351 HOST_WIDE_INT prev_offset;
2352 if (!data.asan_vec.is_empty ()
2353 && frame_offset.is_constant (&prev_offset))
2354 {
2355 HOST_WIDE_INT offset, sz, redzonesz;
2356 redzonesz = ASAN_RED_ZONE_SIZE;
2357 sz = data.asan_vec[0] - prev_offset;
2358 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2359 && data.asan_alignb <= 4096
2360 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2361 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2362 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2363 /* Allocating a constant amount of space from a constant
2364 starting offset must give a constant result. */
2365 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2366 .to_constant ());
2367 data.asan_vec.safe_push (prev_offset);
2368 data.asan_vec.safe_push (offset);
2369 /* Leave space for alignment if STRICT_ALIGNMENT. */
2370 if (STRICT_ALIGNMENT)
2371 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2372 << ASAN_SHADOW_SHIFT)
2373 / BITS_PER_UNIT, 1);
2374
2375 var_end_seq
2376 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2377 data.asan_base,
2378 data.asan_alignb,
2379 data.asan_vec.address (),
2380 data.asan_decl_vec.address (),
2381 data.asan_vec.length ());
2382 }
2383
2384 expand_stack_vars (NULL, &data);
2385 }
2386
2387 if (hwasan_sanitize_stack_p ())
2388 hwasan_emit_prologue ();
2389 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2390 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2391 virtual_stack_vars_rtx,
2392 var_end_seq);
2393 else if (hwasan_sanitize_allocas_p () && cfun->calls_alloca)
2394     /* When using out-of-line instrumentation we only want to emit one function
2395        call for clearing the tags in a region of shadow stack.  When there are
2396        alloca calls in this frame we want to emit a call using
2397        virtual_stack_dynamic_rtx, but when there are none we use the
2398        hwasan_frame_extent rtx we created in expand_stack_vars.  */
2399 var_end_seq = hwasan_emit_untag_frame (virtual_stack_dynamic_rtx,
2400 virtual_stack_vars_rtx);
2401 else if (hwasan_sanitize_stack_p ())
2402 /* If no variables were stored on the stack, `hwasan_get_frame_extent`
2403 will return NULL_RTX and hence `hwasan_emit_untag_frame` will return
2404 NULL (i.e. an empty sequence). */
2405 var_end_seq = hwasan_emit_untag_frame (hwasan_get_frame_extent (),
2406 virtual_stack_vars_rtx);
2407
2408 fini_vars_expansion ();
2409
2410   /* If there were any artificial non-ignored vars without rtl
2411      found earlier, check whether deferred stack allocation has
2412      assigned rtl to them by now.  */
2413 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2414 {
2415 rtx rtl = DECL_RTL_IF_SET (var);
2416
2417 /* Keep artificial non-ignored vars in cfun->local_decls
2418 chain until instantiate_decls. */
2419 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2420 add_local_decl (cfun, var);
2421 }
2422
2423 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2424 if (STACK_ALIGNMENT_NEEDED)
2425 {
2426 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2427 if (FRAME_GROWS_DOWNWARD)
2428 frame_offset = aligned_lower_bound (frame_offset, align);
2429 else
2430 frame_offset = aligned_upper_bound (frame_offset, align);
2431 }
2432
2433 return var_end_seq;
2434 }
2435
2436
2437 /* If we need to produce a detailed dump, print the tree representation
2438 for STMT to the dump file. SINCE is the last RTX after which the RTL
2439 generated for STMT should have been appended. */
2440
2441 static void
2442 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2443 {
2444 if (dump_file && (dump_flags & TDF_DETAILS))
2445 {
2446 fprintf (dump_file, "\n;; ");
2447 print_gimple_stmt (dump_file, stmt, 0,
2448 TDF_SLIM | (dump_flags & TDF_LINENO));
2449 fprintf (dump_file, "\n");
2450
2451 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2452 }
2453 }
2454
2455 /* Maps the blocks that do not contain tree labels to rtx labels. */
2456
2457 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2458
2459 /* Returns the label_rtx expression for a label starting basic block BB. */
2460
2461 static rtx_code_label *
2462 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2463 {
2464 gimple_stmt_iterator gsi;
2465 tree lab;
2466
2467 if (bb->flags & BB_RTL)
2468 return block_label (bb);
2469
2470 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2471 if (elt)
2472 return *elt;
2473
2474 /* Find the tree label if it is present. */
2475
2476 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2477 {
2478 glabel *lab_stmt;
2479
2480 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2481 if (!lab_stmt)
2482 break;
2483
2484 lab = gimple_label_label (lab_stmt);
2485 if (DECL_NONLOCAL (lab))
2486 break;
2487
2488 return jump_target_rtx (lab);
2489 }
2490
2491 rtx_code_label *l = gen_label_rtx ();
2492 lab_rtx_for_bb->put (bb, l);
2493 return l;
2494 }
2495
2496
2497 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2498 of a basic block where we just expanded the conditional at the end,
2499 possibly clean up the CFG and instruction sequence. LAST is the
2500 last instruction before the just emitted jump sequence. */
2501
2502 static void
2503 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2504 {
2505 /* Special case: when jumpif decides that the condition is
2506 trivial it emits an unconditional jump (and the necessary
2507 barrier). But we still have two edges, the fallthru one is
2508 wrong. purge_dead_edges would clean this up later. Unfortunately
2509 we have to insert insns (and split edges) before
2510 find_many_sub_basic_blocks and hence before purge_dead_edges.
2511 But splitting edges might create new blocks which depend on the
2512 fact that if there are two edges there's no barrier. So the
2513 barrier would get lost and verify_flow_info would ICE. Instead
2514 of auditing all edge splitters to care for the barrier (which
2515 normally isn't there in a cleaned CFG), fix it here. */
2516 if (BARRIER_P (get_last_insn ()))
2517 {
2518 rtx_insn *insn;
2519 remove_edge (e);
2520       /* Now we have a single successor block.  If we have insns to
2521 	 insert on the remaining edge, we will potentially insert
2522 	 them at the end of this block (if the dest block isn't feasible)
2523 	 in order to avoid splitting the edge.  This insertion will take
2524 	 place in front of the last jump.  But we might have emitted
2525 	 multiple jumps (conditional and one unconditional) to the
2526 	 same destination.  Inserting in front of the last one then
2527 	 is a problem.  See PR 40021.  We fix this by deleting all
2528 	 jumps except the last unconditional one.  */
2529 insn = PREV_INSN (get_last_insn ());
2530 /* Make sure we have an unconditional jump. Otherwise we're
2531 confused. */
2532 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2533 for (insn = PREV_INSN (insn); insn != last;)
2534 {
2535 insn = PREV_INSN (insn);
2536 if (JUMP_P (NEXT_INSN (insn)))
2537 {
2538 if (!any_condjump_p (NEXT_INSN (insn)))
2539 {
2540 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2541 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2542 }
2543 delete_insn (NEXT_INSN (insn));
2544 }
2545 }
2546 }
2547 }
2548
2549 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2550 Returns a new basic block if we've terminated the current basic
2551 block and created a new one. */
2552
2553 static basic_block
2554 expand_gimple_cond (basic_block bb, gcond *stmt)
2555 {
2556 basic_block new_bb, dest;
2557 edge true_edge;
2558 edge false_edge;
2559 rtx_insn *last2, *last;
2560 enum tree_code code;
2561 tree op0, op1;
2562
2563 code = gimple_cond_code (stmt);
2564 op0 = gimple_cond_lhs (stmt);
2565 op1 = gimple_cond_rhs (stmt);
2566 /* We're sometimes presented with such code:
2567 D.123_1 = x < y;
2568 if (D.123_1 != 0)
2569 ...
2570 This would expand to two comparisons which then later might
2571 be cleaned up by combine. But some pattern matchers like if-conversion
2572 work better when there's only one compare, so make up for this
2573 here as special exception if TER would have made the same change. */
2574 if (SA.values
2575 && TREE_CODE (op0) == SSA_NAME
2576 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2577 && TREE_CODE (op1) == INTEGER_CST
2578 && ((gimple_cond_code (stmt) == NE_EXPR
2579 && integer_zerop (op1))
2580 || (gimple_cond_code (stmt) == EQ_EXPR
2581 && integer_onep (op1)))
2582 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2583 {
2584 gimple *second = SSA_NAME_DEF_STMT (op0);
2585 if (gimple_code (second) == GIMPLE_ASSIGN)
2586 {
2587 enum tree_code code2 = gimple_assign_rhs_code (second);
2588 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2589 {
2590 code = code2;
2591 op0 = gimple_assign_rhs1 (second);
2592 op1 = gimple_assign_rhs2 (second);
2593 }
2594 /* If jumps are cheap and the target does not support conditional
2595 compare, turn some more codes into jumpy sequences. */
2596 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2597 && targetm.gen_ccmp_first == NULL)
2598 {
2599 if ((code2 == BIT_AND_EXPR
2600 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2601 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2602 || code2 == TRUTH_AND_EXPR)
2603 {
2604 code = TRUTH_ANDIF_EXPR;
2605 op0 = gimple_assign_rhs1 (second);
2606 op1 = gimple_assign_rhs2 (second);
2607 }
2608 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2609 {
2610 code = TRUTH_ORIF_EXPR;
2611 op0 = gimple_assign_rhs1 (second);
2612 op1 = gimple_assign_rhs2 (second);
2613 }
2614 }
2615 }
2616 }
2617
2618 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2619 into (x - C2) * C3 < C4. */
2620 if ((code == EQ_EXPR || code == NE_EXPR)
2621 && TREE_CODE (op0) == SSA_NAME
2622 && TREE_CODE (op1) == INTEGER_CST)
2623 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2624
2625 /* Optimize (x - y) < 0 into x < y if x - y has undefined overflow. */
2626 if (!TYPE_UNSIGNED (TREE_TYPE (op0))
2627 && (code == LT_EXPR || code == LE_EXPR
2628 || code == GT_EXPR || code == GE_EXPR)
2629 && integer_zerop (op1)
2630 && TREE_CODE (op0) == SSA_NAME)
2631 maybe_optimize_sub_cmp_0 (code, &op0, &op1);
2632
2633 last2 = last = get_last_insn ();
2634
2635 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2636 set_curr_insn_location (gimple_location (stmt));
2637
2638 /* These flags have no purpose in RTL land. */
2639 true_edge->flags &= ~EDGE_TRUE_VALUE;
2640 false_edge->flags &= ~EDGE_FALSE_VALUE;
2641
2642 /* We can either have a pure conditional jump with one fallthru edge or
2643 two-way jump that needs to be decomposed into two basic blocks. */
2644 if (false_edge->dest == bb->next_bb)
2645 {
2646 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2647 true_edge->probability);
2648 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2649 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2650 set_curr_insn_location (true_edge->goto_locus);
2651 false_edge->flags |= EDGE_FALLTHRU;
2652 maybe_cleanup_end_of_block (false_edge, last);
2653 return NULL;
2654 }
2655 if (true_edge->dest == bb->next_bb)
2656 {
2657 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2658 false_edge->probability);
2659 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2660 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2661 set_curr_insn_location (false_edge->goto_locus);
2662 true_edge->flags |= EDGE_FALLTHRU;
2663 maybe_cleanup_end_of_block (true_edge, last);
2664 return NULL;
2665 }
2666
2667 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2668 true_edge->probability);
2669 last = get_last_insn ();
2670 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2671 set_curr_insn_location (false_edge->goto_locus);
2672 emit_jump (label_rtx_for_bb (false_edge->dest));
2673
2674 BB_END (bb) = last;
2675 if (BARRIER_P (BB_END (bb)))
2676 BB_END (bb) = PREV_INSN (BB_END (bb));
2677 update_bb_for_insn (bb);
2678
2679 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2680 dest = false_edge->dest;
2681 redirect_edge_succ (false_edge, new_bb);
2682 false_edge->flags |= EDGE_FALLTHRU;
2683 new_bb->count = false_edge->count ();
2684 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2685 add_bb_to_loop (new_bb, loop);
2686 if (loop->latch == bb
2687 && loop->header == dest)
2688 loop->latch = new_bb;
2689 make_single_succ_edge (new_bb, dest, 0);
2690 if (BARRIER_P (BB_END (new_bb)))
2691 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2692 update_bb_for_insn (new_bb);
2693
2694 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2695
2696 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2697 {
2698 set_curr_insn_location (true_edge->goto_locus);
2699 true_edge->goto_locus = curr_insn_location ();
2700 }
2701
2702 return new_bb;
2703 }
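
/* Illustration only: the single-compare special case above fires for
   GIMPLE of the form

     _1 = a_2(D) < b_3(D);
     if (_1 != 0) goto <bb 3>; else goto <bb 4>;

   where TER would have substituted the comparison anyway, so we emit one
   compare-and-branch instead of materializing _1 first.  Likewise a test
   such as (x % 3) == 0 may be rewritten by maybe_optimize_mod_cmp before
   expansion when that is cheaper than computing the remainder.  */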
2704
2705 /* Mark all calls that can have a transaction restart. */
2706
2707 static void
2708 mark_transaction_restart_calls (gimple *stmt)
2709 {
2710 struct tm_restart_node dummy;
2711 tm_restart_node **slot;
2712
2713 if (!cfun->gimple_df->tm_restart)
2714 return;
2715
2716 dummy.stmt = stmt;
2717 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2718 if (slot)
2719 {
2720 struct tm_restart_node *n = *slot;
2721 tree list = n->label_or_list;
2722 rtx_insn *insn;
2723
2724 for (insn = next_real_insn (get_last_insn ());
2725 !CALL_P (insn);
2726 insn = next_real_insn (insn))
2727 continue;
2728
2729 if (TREE_CODE (list) == LABEL_DECL)
2730 add_reg_note (insn, REG_TM, label_rtx (list));
2731 else
2732 for (; list ; list = TREE_CHAIN (list))
2733 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2734 }
2735 }
2736
2737 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2738 statement STMT. */
2739
2740 static void
2741 expand_call_stmt (gcall *stmt)
2742 {
2743 tree exp, decl, lhs;
2744 bool builtin_p;
2745 size_t i;
2746
2747 if (gimple_call_internal_p (stmt))
2748 {
2749 expand_internal_call (stmt);
2750 return;
2751 }
2752
2753 /* If this is a call to a built-in function and it has no effect other
2754 than setting the lhs, try to implement it using an internal function
2755 instead. */
2756 decl = gimple_call_fndecl (stmt);
2757 if (gimple_call_lhs (stmt)
2758 && !gimple_has_side_effects (stmt)
2759 && (optimize || (decl && called_as_built_in (decl))))
2760 {
2761 internal_fn ifn = replacement_internal_fn (stmt);
2762 if (ifn != IFN_LAST)
2763 {
2764 expand_internal_call (ifn, stmt);
2765 return;
2766 }
2767 }
2768
2769 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2770
2771 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2772 builtin_p = decl && fndecl_built_in_p (decl);
2773
2774 /* If this is not a builtin function, the function type through which the
2775 call is made may be different from the type of the function. */
2776 if (!builtin_p)
2777 CALL_EXPR_FN (exp)
2778 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2779 CALL_EXPR_FN (exp));
2780
2781 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2782 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2783
2784 for (i = 0; i < gimple_call_num_args (stmt); i++)
2785 {
2786 tree arg = gimple_call_arg (stmt, i);
2787 gimple *def;
2788       /* TER substitutes ADDR_EXPRs into the arguments of builtin functions
2789 	 so we can infer more correct alignment information.  See PR39954.  */
2790 if (builtin_p
2791 && TREE_CODE (arg) == SSA_NAME
2792 && (def = get_gimple_for_ssa_name (arg))
2793 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2794 arg = gimple_assign_rhs1 (def);
2795 CALL_EXPR_ARG (exp, i) = arg;
2796 }
2797
2798 if (gimple_has_side_effects (stmt)
2799 /* ??? Downstream in expand_expr_real_1 we assume that expressions
2800 w/o side-effects do not throw so work around this here. */
2801 || stmt_could_throw_p (cfun, stmt))
2802 TREE_SIDE_EFFECTS (exp) = 1;
2803
2804 if (gimple_call_nothrow_p (stmt))
2805 TREE_NOTHROW (exp) = 1;
2806
2807 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2808 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2809 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2810 if (decl
2811 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2812 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2813 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2814 else
2815 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2816 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2817 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2818 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2819
2820 /* Must come after copying location. */
2821 copy_warning (exp, stmt);
2822
2823 /* Ensure RTL is created for debug args. */
2824 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2825 {
2826 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2827 unsigned int ix;
2828 tree dtemp;
2829
2830 if (debug_args)
2831 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2832 {
2833 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2834 expand_debug_expr (dtemp);
2835 }
2836 }
2837
2838 rtx_insn *before_call = get_last_insn ();
2839 lhs = gimple_call_lhs (stmt);
2840 if (lhs)
2841 expand_assignment (lhs, exp, false);
2842 else
2843 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2844
2845   /* If the gimple call is an indirect call and has the 'nocf_check'
2846      attribute, find the generated CALL insn and mark it so that no
2847      control-flow verification is needed.  */
2848 if (gimple_call_nocf_check_p (stmt)
2849 && !gimple_call_fndecl (stmt))
2850 {
2851 rtx_insn *last = get_last_insn ();
2852 while (!CALL_P (last)
2853 && last != before_call)
2854 last = PREV_INSN (last);
2855
2856 if (last != before_call)
2857 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2858 }
2859
2860 mark_transaction_restart_calls (stmt);
2861 }
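
/* Illustration only (hypothetical source): the internal-function
   replacement above means that a side-effect-free builtin call with a
   used lhs, e.g.

     n = __builtin_popcount (x);

   can be expanded through an internal function (IFN_POPCOUNT) instead of
   the CALL_EXPR path when the target supports it directly.  */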
2862
2863
2864 /* Generate RTL for an asm statement (explicit assembler code).
2865 STRING is a STRING_CST node containing the assembler code text,
2866 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2867 insn is volatile; don't optimize it. */
2868
2869 static void
2870 expand_asm_loc (tree string, int vol, location_t locus)
2871 {
2872 rtx body;
2873
2874 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2875 ggc_strdup (TREE_STRING_POINTER (string)),
2876 locus);
2877
2878 MEM_VOLATILE_P (body) = vol;
2879
2880 /* Non-empty basic ASM implicitly clobbers memory. */
2881 if (TREE_STRING_LENGTH (string) != 0)
2882 {
2883 rtx asm_op, clob;
2884 unsigned i, nclobbers;
2885 auto_vec<rtx> input_rvec, output_rvec;
2886 auto_vec<machine_mode> input_mode;
2887 auto_vec<const char *> constraints;
2888 auto_vec<rtx> clobber_rvec;
2889 HARD_REG_SET clobbered_regs;
2890 CLEAR_HARD_REG_SET (clobbered_regs);
2891
2892 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2893 clobber_rvec.safe_push (clob);
2894
2895 if (targetm.md_asm_adjust)
2896 targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
2897 constraints, clobber_rvec, clobbered_regs,
2898 locus);
2899
2900 asm_op = body;
2901 nclobbers = clobber_rvec.length ();
2902 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2903
2904 XVECEXP (body, 0, 0) = asm_op;
2905 for (i = 0; i < nclobbers; i++)
2906 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2907 }
2908
2909 emit_insn (body);
2910 }
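
/* Illustration only (hypothetical user code): this path handles basic,
   operand-less asm such as

     asm volatile ("nop");

   A non-empty template like the one above is wrapped in a PARALLEL with a
   (clobber (mem:BLK (scratch))) so that it is treated as clobbering
   memory, as described in the comment above.  */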
2911
2912 /* Return the number of times character C occurs in string S. */
2913 static int
2914 n_occurrences (int c, const char *s)
2915 {
2916 int n = 0;
2917 while (*s)
2918 n += (*s++ == c);
2919 return n;
2920 }
2921
2922 /* A subroutine of expand_asm_operands. Check that all operands have
2923 the same number of alternatives. Return true if so. */
2924
2925 static bool
2926 check_operand_nalternatives (const vec<const char *> &constraints)
2927 {
2928 unsigned len = constraints.length();
2929 if (len > 0)
2930 {
2931 int nalternatives = n_occurrences (',', constraints[0]);
2932
2933 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2934 {
2935 error ("too many alternatives in %<asm%>");
2936 return false;
2937 }
2938
2939 for (unsigned i = 1; i < len; ++i)
2940 if (n_occurrences (',', constraints[i]) != nalternatives)
2941 {
2942 error ("operand constraints for %<asm%> differ "
2943 "in number of alternatives");
2944 return false;
2945 }
2946 }
2947 return true;
2948 }
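
/* Illustration only (hypothetical statement): constraint alternatives are
   comma-separated, so in

     asm ("..." : "=r,m" (out) : "r,r" (in));

   both operands have two alternatives and the check above passes; mixing
   "=r,m" with a plain "r" would be diagnosed instead.  */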
2949
2950 /* Check for overlap between registers marked in CLOBBERED_REGS and
2951    anything inappropriate in T.  Emit an error and return true for a
2952    conflict, false for ok.  */
2953
2954 static bool
2955 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs,
2956 location_t loc)
2957 {
2958 /* Conflicts between asm-declared register variables and the clobber
2959 list are not allowed. */
2960 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2961
2962 if (overlap)
2963 {
2964 error_at (loc, "%<asm%> specifier for variable %qE conflicts with "
2965 "%<asm%> clobber list", DECL_NAME (overlap));
2966
2967 /* Reset registerness to stop multiple errors emitted for a single
2968 variable. */
2969 DECL_REGISTER (overlap) = 0;
2970 return true;
2971 }
2972
2973 return false;
2974 }
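
/* Illustration only (hypothetical code, register name chosen arbitrarily):
   the conflict diagnosed above arises for

     register int r asm ("r12");
     asm ("..." : "+r" (r) : : "r12");   // operand lives in a clobbered reg

   where an asm-declared register variable overlaps the clobber list.  */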
2975
2976 /* Check that the given REGNO spanning NREGS is a valid
2977 asm clobber operand. Some HW registers cannot be
2978 saved/restored, hence they should not be clobbered by
2979 asm statements. */
2980 static bool
2981 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
2982 {
2983 bool is_valid = true;
2984 HARD_REG_SET regset;
2985
2986 CLEAR_HARD_REG_SET (regset);
2987
2988 add_range_to_hard_reg_set (&regset, regno, nregs);
2989
2990 /* Clobbering the PIC register is an error. */
2991 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
2992 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
2993 {
2994 /* ??? Diagnose during gimplification? */
2995 error ("PIC register clobbered by %qs in %<asm%>", regname);
2996 is_valid = false;
2997 }
2998 else if (!in_hard_reg_set_p
2999 (accessible_reg_set, reg_raw_mode[regno], regno))
3000 {
3001 /* ??? Diagnose during gimplification? */
3002 error ("the register %qs cannot be clobbered in %<asm%>"
3003 " for the current target", regname);
3004 is_valid = false;
3005 }
3006
3007 /* Clobbering the stack pointer register is deprecated. GCC expects
3008 the value of the stack pointer after an asm statement to be the same
3009 as it was before, so no asm can validly clobber the stack pointer in
3010 the usual sense. Adding the stack pointer to the clobber list has
3011 traditionally had some undocumented and somewhat obscure side-effects. */
3012 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
3013 {
3014 crtl->sp_is_clobbered_by_asm = true;
3015 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
3016 " %qs in a clobber list is deprecated", regname))
3017 inform (input_location, "the value of the stack pointer after"
3018 " an %<asm%> statement must be the same as it was before"
3019 " the statement");
3020 }
3021
3022 return is_valid;
3023 }
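
/* Illustration only (hypothetical statement; the register name is
   target-specific): the checks above reject clobbering the PIC register
   outright and warn for the stack pointer, e.g.

     asm volatile ("..." : : : "sp");   // -Wdeprecated warning

   while still recording that the asm touches the stack pointer.  */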
3024
3025 /* Generate RTL for an asm statement with arguments.
3026 STRING is the instruction template.
3027 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
3028 Each output or input has an expression in the TREE_VALUE and
3029 a tree list in TREE_PURPOSE which in turn contains a constraint
3030 name in TREE_VALUE (or NULL_TREE) and a constraint string
3031 in TREE_PURPOSE.
3032 CLOBBERS is a list of STRING_CST nodes each naming a hard register
3033 that is clobbered by this insn.
3034
3035 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
3036 should be the fallthru basic block of the asm goto.
3037
3038 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
3039 Some elements of OUTPUTS may be replaced with trees representing temporary
3040 values. The caller should copy those temporary values to the originally
3041 specified lvalues.
3042
3043 VOL nonzero means the insn is volatile; don't optimize it. */
3044
3045 static void
3046 expand_asm_stmt (gasm *stmt)
3047 {
3048 class save_input_location
3049 {
3050 location_t old;
3051
3052 public:
3053 explicit save_input_location(location_t where)
3054 {
3055 old = input_location;
3056 input_location = where;
3057 }
3058
3059 ~save_input_location()
3060 {
3061 input_location = old;
3062 }
3063 };
3064
3065 location_t locus = gimple_location (stmt);
3066
3067 if (gimple_asm_input_p (stmt))
3068 {
3069 const char *s = gimple_asm_string (stmt);
3070 tree string = build_string (strlen (s), s);
3071 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
3072 return;
3073 }
3074
3075 /* There are some legacy diagnostics in here. */
3076 save_input_location s_i_l(locus);
3077
3078 unsigned noutputs = gimple_asm_noutputs (stmt);
3079 unsigned ninputs = gimple_asm_ninputs (stmt);
3080 unsigned nlabels = gimple_asm_nlabels (stmt);
3081 unsigned i;
3082 bool error_seen = false;
3083
3084 /* ??? Diagnose during gimplification? */
3085 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
3086 {
3087 error_at (locus, "more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
3088 return;
3089 }
3090
3091 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
3092 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
3093 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
3094
3095 /* Copy the gimple vectors into new vectors that we can manipulate. */
3096
3097 output_tvec.safe_grow (noutputs, true);
3098 input_tvec.safe_grow (ninputs, true);
3099 constraints.safe_grow (noutputs + ninputs, true);
3100
3101 for (i = 0; i < noutputs; ++i)
3102 {
3103 tree t = gimple_asm_output_op (stmt, i);
3104 output_tvec[i] = TREE_VALUE (t);
3105 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3106 }
3107 for (i = 0; i < ninputs; i++)
3108 {
3109 tree t = gimple_asm_input_op (stmt, i);
3110 input_tvec[i] = TREE_VALUE (t);
3111 constraints[i + noutputs]
3112 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
3113 }
3114
3115 /* ??? Diagnose during gimplification? */
3116 if (! check_operand_nalternatives (constraints))
3117 return;
3118
3119 /* Count the number of meaningful clobbered registers, ignoring what
3120 we would ignore later. */
3121 auto_vec<rtx> clobber_rvec;
3122 HARD_REG_SET clobbered_regs;
3123 CLEAR_HARD_REG_SET (clobbered_regs);
3124
3125 if (unsigned n = gimple_asm_nclobbers (stmt))
3126 {
3127 clobber_rvec.reserve (n);
3128 for (i = 0; i < n; i++)
3129 {
3130 tree t = gimple_asm_clobber_op (stmt, i);
3131 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
3132 int nregs, j;
3133
3134 j = decode_reg_name_and_count (regname, &nregs);
3135 if (j < 0)
3136 {
3137 if (j == -2)
3138 {
3139 /* ??? Diagnose during gimplification? */
3140 error_at (locus, "unknown register name %qs in %<asm%>",
3141 regname);
3142 error_seen = true;
3143 }
3144 else if (j == -4)
3145 {
3146 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3147 clobber_rvec.safe_push (x);
3148 }
3149 else
3150 {
3151 /* Otherwise we should have -1 == empty string
3152 or -3 == cc, which is not a register. */
3153 gcc_assert (j == -1 || j == -3);
3154 }
3155 }
3156 else
3157 for (int reg = j; reg < j + nregs; reg++)
3158 {
3159 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3160 return;
3161
3162 SET_HARD_REG_BIT (clobbered_regs, reg);
3163 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3164 clobber_rvec.safe_push (x);
3165 }
3166 }
3167 }
3168
3169 /* First pass over inputs and outputs checks validity and sets
3170 mark_addressable if needed. */
3171 /* ??? Diagnose during gimplification? */
3172
3173 for (i = 0; i < noutputs; ++i)
3174 {
3175 tree val = output_tvec[i];
3176 tree type = TREE_TYPE (val);
3177 const char *constraint;
3178 bool is_inout;
3179 bool allows_reg;
3180 bool allows_mem;
3181
3182 /* Try to parse the output constraint. If that fails, there's
3183 no point in going further. */
3184 constraint = constraints[i];
3185 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3186 &allows_mem, &allows_reg, &is_inout))
3187 return;
3188
3189 /* If the output is a hard register, verify it doesn't conflict with
3190 any other operand's possible hard register use. */
3191 if (DECL_P (val)
3192 && REG_P (DECL_RTL (val))
3193 && HARD_REGISTER_P (DECL_RTL (val)))
3194 {
3195 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3196 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3197 unsigned long match;
3198
3199 /* Verify the other outputs do not use the same hard register. */
3200 for (j = i + 1; j < noutputs; ++j)
3201 if (DECL_P (output_tvec[j])
3202 && REG_P (DECL_RTL (output_tvec[j]))
3203 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3204 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3205 {
3206 error_at (locus, "invalid hard register usage between output "
3207 "operands");
3208 error_seen = true;
3209 }
3210
3211 /* Verify matching constraint operands use the same hard register
3212 and that the non-matching constraint operands do not use the same
3213 hard register if the output is an early clobber operand. */
3214 for (j = 0; j < ninputs; ++j)
3215 if (DECL_P (input_tvec[j])
3216 && REG_P (DECL_RTL (input_tvec[j]))
3217 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3218 {
3219 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3220 switch (*constraints[j + noutputs])
3221 {
3222 case '0': case '1': case '2': case '3': case '4':
3223 case '5': case '6': case '7': case '8': case '9':
3224 match = strtoul (constraints[j + noutputs], NULL, 10);
3225 break;
3226 default:
3227 match = ULONG_MAX;
3228 break;
3229 }
3230 if (i == match
3231 && output_hregno != input_hregno)
3232 {
3233 error_at (locus, "invalid hard register usage between "
3234 "output operand and matching constraint operand");
3235 error_seen = true;
3236 }
3237 else if (early_clobber_p
3238 && i != match
3239 && output_hregno == input_hregno)
3240 {
3241 error_at (locus, "invalid hard register usage between "
3242 "earlyclobber operand and input operand");
3243 error_seen = true;
3244 }
3245 }
3246 }
3247
3248 if (! allows_reg
3249 && (allows_mem
3250 || is_inout
3251 || (DECL_P (val)
3252 && REG_P (DECL_RTL (val))
3253 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3254 mark_addressable (val);
3255 }
3256
3257 for (i = 0; i < ninputs; ++i)
3258 {
3259 bool allows_reg, allows_mem;
3260 const char *constraint;
3261
3262 constraint = constraints[i + noutputs];
3263 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3264 constraints.address (),
3265 &allows_mem, &allows_reg))
3266 return;
3267
3268 if (! allows_reg && allows_mem)
3269 mark_addressable (input_tvec[i]);
3270 }
3271
3272 /* Second pass evaluates arguments. */
3273
3274 /* Make sure stack is consistent for asm goto. */
3275 if (nlabels > 0)
3276 do_pending_stack_adjust ();
3277 int old_generating_concat_p = generating_concat_p;
3278
3279 /* Vector of RTX's of evaluated output operands. */
3280 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3281 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3282 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3283
3284 output_rvec.safe_grow (noutputs, true);
3285
3286 for (i = 0; i < noutputs; ++i)
3287 {
3288 tree val = output_tvec[i];
3289 tree type = TREE_TYPE (val);
3290 bool is_inout, allows_reg, allows_mem, ok;
3291 rtx op;
3292
3293 ok = parse_output_constraint (&constraints[i], i, ninputs,
3294 noutputs, &allows_mem, &allows_reg,
3295 &is_inout);
3296 gcc_assert (ok);
3297
3298 /* If an output operand is not a decl or indirect ref and our constraint
3299 allows a register, make a temporary to act as an intermediate.
3300 Make the asm insn write into that, then we will copy it to
3301 the real output operand. Likewise for promoted variables. */
3302
3303 generating_concat_p = 0;
3304
3305 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3306 || (DECL_P (val)
3307 && (allows_mem || REG_P (DECL_RTL (val)))
3308 && ! (REG_P (DECL_RTL (val))
3309 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3310 || ! allows_reg
3311 || is_inout
3312 || TREE_ADDRESSABLE (type))
3313 {
3314 op = expand_expr (val, NULL_RTX, VOIDmode,
3315 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3316 if (MEM_P (op))
3317 op = validize_mem (op);
3318
3319 if (! allows_reg && !MEM_P (op))
3320 {
3321 error_at (locus, "output number %d not directly addressable", i);
3322 error_seen = true;
3323 }
3324 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3325 || GET_CODE (op) == CONCAT)
3326 {
3327 rtx old_op = op;
3328 op = gen_reg_rtx (GET_MODE (op));
3329
3330 generating_concat_p = old_generating_concat_p;
3331
3332 if (is_inout)
3333 emit_move_insn (op, old_op);
3334
3335 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3336 emit_move_insn (old_op, op);
3337 after_rtl_seq = get_insns ();
3338 after_rtl_end = get_last_insn ();
3339 end_sequence ();
3340 }
3341 }
3342 else
3343 {
3344 op = assign_temp (type, 0, 1);
3345 op = validize_mem (op);
3346 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3347 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3348
3349 generating_concat_p = old_generating_concat_p;
3350
3351 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3352 expand_assignment (val, make_tree (type, op), false);
3353 after_rtl_seq = get_insns ();
3354 after_rtl_end = get_last_insn ();
3355 end_sequence ();
3356 }
3357 output_rvec[i] = op;
3358
3359 if (is_inout)
3360 inout_opnum.safe_push (i);
3361 }
3362
3363 const char *str = gimple_asm_string (stmt);
3364 if (error_seen)
3365 {
3366 ninputs = 0;
3367 noutputs = 0;
3368 inout_opnum.truncate (0);
3369 output_rvec.truncate (0);
3370 clobber_rvec.truncate (0);
3371 constraints.truncate (0);
3372 CLEAR_HARD_REG_SET (clobbered_regs);
3373 str = "";
3374 }
3375
3376 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3377 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3378
3379 input_rvec.safe_grow (ninputs, true);
3380 input_mode.safe_grow (ninputs, true);
3381
3382 generating_concat_p = 0;
3383
3384 for (i = 0; i < ninputs; ++i)
3385 {
3386 tree val = input_tvec[i];
3387 tree type = TREE_TYPE (val);
3388 bool allows_reg, allows_mem, ok;
3389 const char *constraint;
3390 rtx op;
3391
3392 constraint = constraints[i + noutputs];
3393 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3394 constraints.address (),
3395 &allows_mem, &allows_reg);
3396 gcc_assert (ok);
3397
3398 /* EXPAND_INITIALIZER will not generate code for valid initializer
3399 constants, but will still generate code for other types of operand.
3400 This is the behavior we want for constant constraints. */
3401 op = expand_expr (val, NULL_RTX, VOIDmode,
3402 allows_reg ? EXPAND_NORMAL
3403 : allows_mem ? EXPAND_MEMORY
3404 : EXPAND_INITIALIZER);
3405
3406 /* Never pass a CONCAT to an ASM. */
3407 if (GET_CODE (op) == CONCAT)
3408 op = force_reg (GET_MODE (op), op);
3409 else if (MEM_P (op))
3410 op = validize_mem (op);
3411
3412 if (asm_operand_ok (op, constraint, NULL) <= 0)
3413 {
3414 if (allows_reg && TYPE_MODE (type) != BLKmode)
3415 op = force_reg (TYPE_MODE (type), op);
3416 else if (!allows_mem)
3417 warning_at (locus, 0, "%<asm%> operand %d probably does not match "
3418 "constraints", i + noutputs);
3419 else if (MEM_P (op))
3420 {
3421 	      /* We won't recognize either volatile memory or memory with a
3422 		 queued address as a memory_operand at this point.  Ignore
3423 		 it: clearly this *is* a memory.  */
3424 }
3425 else
3426 gcc_unreachable ();
3427 }
3428 input_rvec[i] = op;
3429 input_mode[i] = TYPE_MODE (type);
3430 }
3431
3432 /* For in-out operands, copy output rtx to input rtx. */
3433 unsigned ninout = inout_opnum.length ();
3434 for (i = 0; i < ninout; i++)
3435 {
3436 int j = inout_opnum[i];
3437 rtx o = output_rvec[j];
3438
3439 input_rvec.safe_push (o);
3440 input_mode.safe_push (GET_MODE (o));
3441
3442 char buffer[16];
3443 sprintf (buffer, "%d", j);
3444 constraints.safe_push (ggc_strdup (buffer));
3445 }
3446 ninputs += ninout;
3447
3448 /* Sometimes we wish to automatically clobber registers across an asm.
3449 Case in point is when the i386 backend moved from cc0 to a hard reg --
3450 maintaining source-level compatibility means automatically clobbering
3451 the flags register. */
3452 rtx_insn *after_md_seq = NULL;
3453 if (targetm.md_asm_adjust)
3454 after_md_seq
3455 = targetm.md_asm_adjust (output_rvec, input_rvec, input_mode,
3456 constraints, clobber_rvec, clobbered_regs,
3457 locus);
3458
3459 /* Do not allow the hook to change the output and input count,
3460 lest it mess up the operand numbering. */
3461 gcc_assert (output_rvec.length() == noutputs);
3462 gcc_assert (input_rvec.length() == ninputs);
3463 gcc_assert (constraints.length() == noutputs + ninputs);
3464
3465 /* But it certainly can adjust the clobbers. */
3466 unsigned nclobbers = clobber_rvec.length ();
3467
3468 /* Third pass checks for easy conflicts. */
3469   /* ??? Why are we doing this on trees instead of rtx?  */
3470
3471 bool clobber_conflict_found = 0;
3472 for (i = 0; i < noutputs; ++i)
3473 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs, locus))
3474 clobber_conflict_found = 1;
3475 for (i = 0; i < ninputs - ninout; ++i)
3476 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs, locus))
3477 clobber_conflict_found = 1;
3478
3479 /* Make vectors for the expression-rtx, constraint strings,
3480 and named operands. */
3481
3482 rtvec argvec = rtvec_alloc (ninputs);
3483 rtvec constraintvec = rtvec_alloc (ninputs);
3484 rtvec labelvec = rtvec_alloc (nlabels);
3485
3486 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3487 : GET_MODE (output_rvec[0])),
3488 ggc_strdup (str),
3489 "", 0, argvec, constraintvec,
3490 labelvec, locus);
3491 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3492
3493 for (i = 0; i < ninputs; ++i)
3494 {
3495 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3496 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3497 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3498 constraints[i + noutputs],
3499 locus);
3500 }
3501
3502 /* Copy labels to the vector. */
3503 rtx_code_label *fallthru_label = NULL;
3504 if (nlabels > 0)
3505 {
3506 basic_block fallthru_bb = NULL;
3507 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3508 if (fallthru)
3509 fallthru_bb = fallthru->dest;
3510
3511 for (i = 0; i < nlabels; ++i)
3512 {
3513 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3514 rtx_insn *r;
3515 /* If asm goto has any labels in the fallthru basic block, use
3516 a label that we emit immediately after the asm goto. Expansion
3517 may insert further instructions into the same basic block after
3518 asm goto and if we don't do this, insertion of instructions on
3519 the fallthru edge might misbehave. See PR58670. */
3520 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3521 {
3522 if (fallthru_label == NULL_RTX)
3523 fallthru_label = gen_label_rtx ();
3524 r = fallthru_label;
3525 }
3526 else
3527 r = label_rtx (label);
3528 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3529 }
3530 }
3531
3532 /* Now, for each output, construct an rtx
3533 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3534 ARGVEC CONSTRAINTS OPNAMES))
3535 If there is more than one, put them inside a PARALLEL. */
3536
3537 if (noutputs == 0 && nclobbers == 0)
3538 {
3539 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3540 if (nlabels > 0)
3541 emit_jump_insn (body);
3542 else
3543 emit_insn (body);
3544 }
3545 else if (noutputs == 1 && nclobbers == 0)
3546 {
3547 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3548 if (nlabels > 0)
3549 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3550 else
3551 emit_insn (gen_rtx_SET (output_rvec[0], body));
3552 }
3553 else
3554 {
3555 rtx obody = body;
3556 int num = noutputs;
3557
3558 if (num == 0)
3559 num = 1;
3560
3561 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3562
3563 /* For each output operand, store a SET. */
3564 for (i = 0; i < noutputs; ++i)
3565 {
3566 rtx src, o = output_rvec[i];
3567 if (i == 0)
3568 {
3569 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3570 src = obody;
3571 }
3572 else
3573 {
3574 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3575 ASM_OPERANDS_TEMPLATE (obody),
3576 constraints[i], i, argvec,
3577 constraintvec, labelvec, locus);
3578 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3579 }
3580 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3581 }
3582
3583 /* If there are no outputs (but there are some clobbers)
3584 store the bare ASM_OPERANDS into the PARALLEL. */
3585 if (i == 0)
3586 XVECEXP (body, 0, i++) = obody;
3587
3588 /* Store (clobber REG) for each clobbered register specified. */
3589 for (unsigned j = 0; j < nclobbers; ++j)
3590 {
3591 rtx clobbered_reg = clobber_rvec[j];
3592
3593 /* Sanity-check for overlap between the clobbers and, respectively,
3594 the inputs and outputs that has not been handled above. Such
3595 overlap should already have been detected and reported. */
3596 if (!clobber_conflict_found && REG_P (clobbered_reg))
3597 {
3598 /* We test the old body (obody) contents to avoid
3599 tripping over the under-construction body. */
3600 for (unsigned k = 0; k < noutputs; ++k)
3601 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3602 internal_error ("%<asm%> clobber conflict with "
3603 "output operand");
3604
3605 for (unsigned k = 0; k < ninputs - ninout; ++k)
3606 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3607 internal_error ("%<asm%> clobber conflict with "
3608 "input operand");
3609 }
3610
3611 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3612 }
3613
3614 if (nlabels > 0)
3615 emit_jump_insn (body);
3616 else
3617 emit_insn (body);
3618 }
3619
3620 generating_concat_p = old_generating_concat_p;
3621
3622 if (fallthru_label)
3623 emit_label (fallthru_label);
3624
3625 if (after_md_seq)
3626 emit_insn (after_md_seq);
3627 if (after_rtl_seq)
3628 {
3629 if (nlabels == 0)
3630 emit_insn (after_rtl_seq);
3631 else
3632 {
3633 edge e;
3634 edge_iterator ei;
3635
3636 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3637 {
3638 start_sequence ();
3639 for (rtx_insn *curr = after_rtl_seq;
3640 curr != NULL_RTX;
3641 curr = NEXT_INSN (curr))
3642 emit_insn (copy_insn (PATTERN (curr)));
3643 rtx_insn *copy = get_insns ();
3644 end_sequence ();
3645 insert_insn_on_edge (copy, e);
3646 }
3647 }
3648 }
3649
3650 free_temp_slots ();
3651 crtl->has_asm_statement = 1;
3652 }
3653
3654 /* Emit code to jump to the address
3655 specified by the pointer expression EXP. */
3656
3657 static void
3658 expand_computed_goto (tree exp)
3659 {
3660 rtx x = expand_normal (exp);
3661
3662 do_pending_stack_adjust ();
3663 emit_indirect_jump (x);
3664 }
3665
3666 /* Generate RTL code for a `goto' statement with target label LABEL.
3667 LABEL should be a LABEL_DECL tree node that was or will later be
3668 defined with `expand_label'. */
3669
3670 static void
3671 expand_goto (tree label)
3672 {
3673 if (flag_checking)
3674 {
3675 /* Check for a nonlocal goto to a containing function. Should have
3676 gotten translated to __builtin_nonlocal_goto. */
3677 tree context = decl_function_context (label);
3678 gcc_assert (!context || context == current_function_decl);
3679 }
3680
3681 emit_jump (jump_target_rtx (label));
3682 }
3683
3684 /* Output a return with no value. */
3685
3686 static void
3687 expand_null_return_1 (void)
3688 {
3689 clear_pending_stack_adjust ();
3690 do_pending_stack_adjust ();
3691 emit_jump (return_label);
3692 }
3693
3694 /* Generate RTL to return from the current function, with no value.
3695 (That is, we do not do anything about returning any value.) */
3696
3697 void
3698 expand_null_return (void)
3699 {
3700 /* If this function was declared to return a value, but we
3701 didn't, clobber the return registers so that they are not
3702 propagated live to the rest of the function. */
3703 clobber_return_register ();
3704
3705 expand_null_return_1 ();
3706 }
3707
3708 /* Generate RTL to return from the current function, with value VAL. */
3709
3710 static void
3711 expand_value_return (rtx val)
3712 {
3713 /* Copy the value to the return location unless it's already there. */
3714
3715 tree decl = DECL_RESULT (current_function_decl);
3716 rtx return_reg = DECL_RTL (decl);
3717 if (return_reg != val)
3718 {
3719 tree funtype = TREE_TYPE (current_function_decl);
3720 tree type = TREE_TYPE (decl);
3721 int unsignedp = TYPE_UNSIGNED (type);
3722 machine_mode old_mode = DECL_MODE (decl);
3723 machine_mode mode;
3724 if (DECL_BY_REFERENCE (decl))
3725 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3726 else
3727 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3728
3729 if (mode != old_mode)
3730 val = convert_modes (mode, old_mode, val, unsignedp);
3731
3732 if (GET_CODE (return_reg) == PARALLEL)
3733 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3734 else
3735 emit_move_insn (return_reg, val);
3736 }
3737
3738 expand_null_return_1 ();
3739 }
3740
3741 /* Generate RTL to evaluate the expression RETVAL and return it
3742 from the current function. */
3743
3744 static void
3745 expand_return (tree retval)
3746 {
3747 rtx result_rtl;
3748 rtx val = 0;
3749 tree retval_rhs;
3750
3751 /* If function wants no value, give it none. */
3752 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3753 {
3754 expand_normal (retval);
3755 expand_null_return ();
3756 return;
3757 }
3758
3759 if (retval == error_mark_node)
3760 {
3761 /* Treat this like a return of no value from a function that
3762 returns a value. */
3763 expand_null_return ();
3764 return;
3765 }
3766 else if ((TREE_CODE (retval) == MODIFY_EXPR
3767 || TREE_CODE (retval) == INIT_EXPR)
3768 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3769 retval_rhs = TREE_OPERAND (retval, 1);
3770 else
3771 retval_rhs = retval;
3772
3773 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3774
3775 /* If we are returning the RESULT_DECL, then the value has already
3776 been stored into it, so we don't have to do anything special. */
3777 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3778 expand_value_return (result_rtl);
3779
3780 /* If the result is an aggregate that is being returned in one (or more)
3781 registers, load the registers here. */
3782
3783 else if (retval_rhs != 0
3784 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3785 && REG_P (result_rtl))
3786 {
3787 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3788 if (val)
3789 {
3790 /* Use the mode of the result value on the return register. */
3791 PUT_MODE (result_rtl, GET_MODE (val));
3792 expand_value_return (val);
3793 }
3794 else
3795 expand_null_return ();
3796 }
3797 else if (retval_rhs != 0
3798 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3799 && (REG_P (result_rtl)
3800 || (GET_CODE (result_rtl) == PARALLEL)))
3801 {
3802 /* Compute the return value into a temporary (usually a pseudo reg). */
3803 val
3804 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3805 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3806 val = force_not_mem (val);
3807 expand_value_return (val);
3808 }
3809 else
3810 {
3811 /* No hard reg used; calculate value into hard return reg. */
3812 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3813 expand_value_return (result_rtl);
3814 }
3815 }
3816
3817 /* Expand a clobber of LHS. If LHS is stored in a multi-part
3818 register, tell the rtl optimizers that its value is no longer
3819 needed. */
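/* A hypothetical case: a DImode variable held in a pseudo on a 32-bit
   target where REGMODE_NATURAL_SIZE is 4 spans two machine words, so an
   explicit clobber is emitted below to tell the RTL optimizers that both
   halves are dead once the variable goes out of scope.  */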
3820
3821 static void
3822 expand_clobber (tree lhs)
3823 {
3824 if (DECL_P (lhs))
3825 {
3826 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3827 if (decl_rtl && REG_P (decl_rtl))
3828 {
3829 machine_mode decl_mode = GET_MODE (decl_rtl);
3830 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3831 REGMODE_NATURAL_SIZE (decl_mode)))
3832 emit_clobber (decl_rtl);
3833 }
3834 }
3835 }
3836
3837 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3838 STMT that doesn't require special handling for outgoing edges. That
3839 is, no tailcalls and no GIMPLE_COND. */
3840
3841 static void
3842 expand_gimple_stmt_1 (gimple *stmt)
3843 {
3844 tree op0;
3845
3846 set_curr_insn_location (gimple_location (stmt));
3847
3848 switch (gimple_code (stmt))
3849 {
3850 case GIMPLE_GOTO:
3851 op0 = gimple_goto_dest (stmt);
3852 if (TREE_CODE (op0) == LABEL_DECL)
3853 expand_goto (op0);
3854 else
3855 expand_computed_goto (op0);
3856 break;
3857 case GIMPLE_LABEL:
3858 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3859 break;
3860 case GIMPLE_NOP:
3861 case GIMPLE_PREDICT:
3862 break;
3863 case GIMPLE_SWITCH:
3864 {
3865 gswitch *swtch = as_a <gswitch *> (stmt);
3866 if (gimple_switch_num_labels (swtch) == 1)
3867 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3868 else
3869 expand_case (swtch);
3870 }
3871 break;
3872 case GIMPLE_ASM:
3873 expand_asm_stmt (as_a <gasm *> (stmt));
3874 break;
3875 case GIMPLE_CALL:
3876 expand_call_stmt (as_a <gcall *> (stmt));
3877 break;
3878
3879 case GIMPLE_RETURN:
3880 {
3881 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3882
3883 /* If a return doesn't have a location, it very likely represents
3884 multiple user returns, so we cannot let it inherit the location
3885 of the last statement of the previous basic block in RTL. */
3886 if (!gimple_has_location (stmt))
3887 set_curr_insn_location (cfun->function_end_locus);
3888
3889 if (op0 && op0 != error_mark_node)
3890 {
3891 tree result = DECL_RESULT (current_function_decl);
3892
3893 /* If we are not returning the current function's RESULT_DECL,
3894 build an assignment to it. */
3895 if (op0 != result)
3896 {
3897 /* I believe that a function's RESULT_DECL is unique. */
3898 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3899
3900 /* ??? We'd like to simply use expand_assignment here,
3901 but this fails if the value is of BLKmode but the return
3902 decl is a register. expand_return has special handling
3903 for this combination, which eventually should move
3904 to common code. See comments there. Until then, let's
3905 build a modify expression :-/ */
3906 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3907 result, op0);
3908 }
3909 }
3910
3911 if (!op0)
3912 expand_null_return ();
3913 else
3914 expand_return (op0);
3915 }
3916 break;
3917
3918 case GIMPLE_ASSIGN:
3919 {
3920 gassign *assign_stmt = as_a <gassign *> (stmt);
3921 tree lhs = gimple_assign_lhs (assign_stmt);
3922
3923 /* Tree expand used to fiddle with |= and &= of two bitfield
3924 COMPONENT_REFs here. This can't happen with gimple; the LHS
3925 of binary assigns must be a gimple reg. */
3926
3927 if (TREE_CODE (lhs) != SSA_NAME
3928 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
3929 {
3930 tree rhs = gimple_assign_rhs1 (assign_stmt);
3931 gcc_assert (gimple_assign_rhs_class (assign_stmt)
3932 == GIMPLE_SINGLE_RHS);
3933 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3934 /* Do not put locations on possibly shared trees. */
3935 && !is_gimple_min_invariant (rhs))
3936 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3937 if (TREE_CLOBBER_P (rhs))
3938 /* This is a clobber marking that this LHS is going out
3939 of scope. */
3940 expand_clobber (lhs);
3941 else
3942 expand_assignment (lhs, rhs,
3943 gimple_assign_nontemporal_move_p (
3944 assign_stmt));
3945 }
3946 else
3947 {
3948 rtx target, temp;
3949 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3950 struct separate_ops ops;
3951 bool promoted = false;
3952
3953 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3954 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3955 promoted = true;
3956
3957 ops.code = gimple_assign_rhs_code (assign_stmt);
3958 ops.type = TREE_TYPE (lhs);
3959 switch (get_gimple_rhs_class (ops.code))
3960 {
3961 case GIMPLE_TERNARY_RHS:
3962 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3963 /* Fallthru */
3964 case GIMPLE_BINARY_RHS:
3965 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3966 /* Fallthru */
3967 case GIMPLE_UNARY_RHS:
3968 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3969 break;
3970 default:
3971 gcc_unreachable ();
3972 }
3973 ops.location = gimple_location (stmt);
3974
3975 /* If we want to use a nontemporal store, force the value into a
3976 register first. If we store into a promoted register,
3977 don't directly expand to target. */
3978 temp = nontemporal || promoted ? NULL_RTX : target;
3979 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3980 EXPAND_NORMAL);
3981
3982 if (temp == target)
3983 ;
3984 else if (promoted)
3985 {
3986 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3987 /* If TEMP is a VOIDmode constant, use convert_modes to make
3988 sure that we properly convert it. */
3989 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3990 {
3991 temp = convert_modes (GET_MODE (target),
3992 TYPE_MODE (ops.type),
3993 temp, unsignedp);
3994 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3995 GET_MODE (target), temp, unsignedp);
3996 }
3997
3998 convert_move (SUBREG_REG (target), temp, unsignedp);
3999 }
4000 else if (nontemporal && emit_storent_insn (target, temp))
4001 ;
4002 else
4003 {
4004 temp = force_operand (temp, target);
4005 if (temp != target)
4006 emit_move_insn (target, temp);
4007 }
4008 }
4009 }
4010 break;
4011
4012 default:
4013 gcc_unreachable ();
4014 }
4015 }
4016
4017 /* Expand one gimple statement STMT and return the last RTL instruction
4018 before any of the newly generated ones.
4019
4020 In addition to generating the necessary RTL instructions this also
4021 sets REG_EH_REGION notes if necessary and sets the current source
4022 location for diagnostics. */
4023
4024 static rtx_insn *
4025 expand_gimple_stmt (gimple *stmt)
4026 {
4027 location_t saved_location = input_location;
4028 rtx_insn *last = get_last_insn ();
4029 int lp_nr;
4030
4031 gcc_assert (cfun);
4032
4033 /* We need to save and restore the current source location so that errors
4034 discovered during expansion are emitted with the right location. But
4035 it would be better if the diagnostic routines used the source location
4036 embedded in the tree nodes rather than globals. */
4037 if (gimple_has_location (stmt))
4038 input_location = gimple_location (stmt);
4039
4040 expand_gimple_stmt_1 (stmt);
4041
4042 /* Free any temporaries used to evaluate this statement. */
4043 free_temp_slots ();
4044
4045 input_location = saved_location;
4046
4047 /* Mark all insns that may trap. */
4048 lp_nr = lookup_stmt_eh_lp (stmt);
4049 if (lp_nr)
4050 {
4051 rtx_insn *insn;
4052 for (insn = next_real_insn (last); insn;
4053 insn = next_real_insn (insn))
4054 {
4055 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
4056 /* If we want exceptions for non-call insns, any
4057 may_trap_p instruction may throw. */
4058 && GET_CODE (PATTERN (insn)) != CLOBBER
4059 && GET_CODE (PATTERN (insn)) != USE
4060 && insn_could_throw_p (insn))
4061 make_reg_eh_region_note (insn, 0, lp_nr);
4062 }
4063 }
4064
4065 return last;
4066 }
4067
4068 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
4069 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
4070 generated a tail call (something that might be denied by the ABI
4071 rules governing the call; see calls.c).
4072
4073 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
4074 can still reach the rest of BB. The case here is __builtin_sqrt,
4075 where the NaN result goes through the external function (with a
4076 tailcall) and the normal result happens via a sqrt instruction. */
4077
4078 static basic_block
4079 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
4080 {
4081 rtx_insn *last2, *last;
4082 edge e;
4083 edge_iterator ei;
4084 profile_probability probability;
4085
4086 last2 = last = expand_gimple_stmt (stmt);
4087
4088 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
4089 if (CALL_P (last) && SIBLING_CALL_P (last))
4090 goto found;
4091
4092 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4093
4094 *can_fallthru = true;
4095 return NULL;
4096
4097 found:
4098 /* ??? Wouldn't it be better to just reset any pending stack adjust?
4099 Any instructions emitted here are about to be deleted. */
4100 do_pending_stack_adjust ();
4101
4102 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
4103 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
4104 EH or abnormal edges, we shouldn't have created a tail call in
4105 the first place. So it seems to me we should just be removing
4106 all edges here, or redirecting the existing fallthru edge to
4107 the exit block. */
4108
4109 probability = profile_probability::never ();
4110
4111 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
4112 {
4113 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
4114 {
4115 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
4116 e->dest->count -= e->count ();
4117 probability += e->probability;
4118 remove_edge (e);
4119 }
4120 else
4121 ei_next (&ei);
4122 }
4123
4124 /* This is somewhat ugly: the call_expr expander often emits instructions
4125 after the sibcall (to perform the function return). These confuse the
4126 find_many_sub_basic_blocks code, so we need to get rid of them. */
4127 last = NEXT_INSN (last);
4128 gcc_assert (BARRIER_P (last));
4129
4130 *can_fallthru = false;
4131 while (NEXT_INSN (last))
4132 {
4133 /* For instance, an sqrt builtin expander expands an if with a
4134 sibcall in the then-branch and a label for the else-branch. */
4135 if (LABEL_P (NEXT_INSN (last)))
4136 {
4137 *can_fallthru = true;
4138 break;
4139 }
4140 delete_insn (NEXT_INSN (last));
4141 }
4142
4143 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
4144 | EDGE_SIBCALL);
4145 e->probability = probability;
4146 BB_END (bb) = last;
4147 update_bb_for_insn (bb);
4148
4149 if (NEXT_INSN (last))
4150 {
4151 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
4152
4153 last = BB_END (bb);
4154 if (BARRIER_P (last))
4155 BB_END (bb) = PREV_INSN (last);
4156 }
4157
4158 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
4159
4160 return bb;
4161 }
4162
4163 /* Return the difference between the floor and the truncated result of
4164 a signed division by OP1 with remainder MOD. */
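/* Worked example: for -7 / 2, truncation gives -3 with remainder -1;
   MOD is nonzero and OP1 / MOD = 2 / -1 is negative, so the adjustment
   is -1 and the floor result is -3 + -1 = -4.  */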
4165 static rtx
4166 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4167 {
4168 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4169 return gen_rtx_IF_THEN_ELSE
4170 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4171 gen_rtx_IF_THEN_ELSE
4172 (mode, gen_rtx_LT (BImode,
4173 gen_rtx_DIV (mode, op1, mod),
4174 const0_rtx),
4175 constm1_rtx, const0_rtx),
4176 const0_rtx);
4177 }
4178
4179 /* Return the difference between the ceil and the truncated result of
4180 a signed division by OP1 with remainder MOD. */
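/* Worked example: for 7 / 2, truncation gives 3 with remainder 1;
   MOD is nonzero and OP1 / MOD = 2 / 1 is positive, so the adjustment
   is +1 and the ceiling result is 3 + 1 = 4.  */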
4181 static rtx
4182 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4183 {
4184 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4185 return gen_rtx_IF_THEN_ELSE
4186 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4187 gen_rtx_IF_THEN_ELSE
4188 (mode, gen_rtx_GT (BImode,
4189 gen_rtx_DIV (mode, op1, mod),
4190 const0_rtx),
4191 const1_rtx, const0_rtx),
4192 const0_rtx);
4193 }
4194
4195 /* Return the difference between the ceil and the truncated result of
4196 an unsigned division by OP1 with remainder MOD. */
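/* Worked example: for 7u / 2u the remainder is 1, so the adjustment is
   +1 and the ceiling result is 3 + 1 = 4; an exact division gets no
   adjustment.  */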
4197 static rtx
4198 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4199 {
4200 /* (mod != 0 ? 1 : 0) */
4201 return gen_rtx_IF_THEN_ELSE
4202 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4203 const1_rtx, const0_rtx);
4204 }
4205
4206 /* Return the difference between the rounded and the truncated result
4207 of a signed division by OP1 with remainder MOD. Halfway cases are
4208 rounded away from zero, rather than to the nearest even number. */
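/* Worked example: for 5 / 3, truncation gives 1 with remainder 2;
   abs (2) >= abs (3) - abs (2) holds and OP1 / MOD = 3 / 2 is positive,
   so the adjustment is +1 and the rounded result is 2.  For 7 / 3 the
   remainder 1 fails the test and the truncated result 2 stands.  */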
4209 static rtx
4210 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4211 {
4212 /* (abs (mod) >= abs (op1) - abs (mod)
4213 ? (op1 / mod > 0 ? 1 : -1)
4214 : 0) */
4215 return gen_rtx_IF_THEN_ELSE
4216 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4217 gen_rtx_MINUS (mode,
4218 gen_rtx_ABS (mode, op1),
4219 gen_rtx_ABS (mode, mod))),
4220 gen_rtx_IF_THEN_ELSE
4221 (mode, gen_rtx_GT (BImode,
4222 gen_rtx_DIV (mode, op1, mod),
4223 const0_rtx),
4224 const1_rtx, constm1_rtx),
4225 const0_rtx);
4226 }
4227
4228 /* Return the difference between the rounded and the truncated result
4229 of an unsigned division by OP1 with remainder MOD. Halfway cases
4230 are rounded away from zero, rather than to the nearest even
4231 number. */
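/* Worked example: for 5u / 3u the remainder 2 satisfies 2 >= 3 - 2, so
   the adjustment is +1 and the rounded result is 2; for 7u / 3u the
   remainder 1 fails the test and the truncated result 2 stands.  */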
4232 static rtx
4233 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4234 {
4235 /* (mod >= op1 - mod ? 1 : 0) */
4236 return gen_rtx_IF_THEN_ELSE
4237 (mode, gen_rtx_GE (BImode, mod,
4238 gen_rtx_MINUS (mode, op1, mod)),
4239 const1_rtx, const0_rtx);
4240 }
4241
4242 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4243 any rtl. */
4244
4245 static rtx
4246 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4247 addr_space_t as)
4248 {
4249 #ifndef POINTERS_EXTEND_UNSIGNED
4250 gcc_assert (mode == Pmode
4251 || mode == targetm.addr_space.address_mode (as));
4252 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4253 #else
4254 rtx temp;
4255
4256 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4257
4258 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4259 return x;
4260
4261 /* X must have some form of address mode already. */
4262 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4263 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4264 x = lowpart_subreg (mode, x, xmode);
4265 else if (POINTERS_EXTEND_UNSIGNED > 0)
4266 x = gen_rtx_ZERO_EXTEND (mode, x);
4267 else if (!POINTERS_EXTEND_UNSIGNED)
4268 x = gen_rtx_SIGN_EXTEND (mode, x);
4269 else
4270 {
4271 switch (GET_CODE (x))
4272 {
4273 case SUBREG:
4274 if ((SUBREG_PROMOTED_VAR_P (x)
4275 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4276 || (GET_CODE (SUBREG_REG (x)) == PLUS
4277 && REG_P (XEXP (SUBREG_REG (x), 0))
4278 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4279 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4280 && GET_MODE (SUBREG_REG (x)) == mode)
4281 return SUBREG_REG (x);
4282 break;
4283 case LABEL_REF:
4284 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4285 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4286 return temp;
4287 case SYMBOL_REF:
4288 temp = shallow_copy_rtx (x);
4289 PUT_MODE (temp, mode);
4290 return temp;
4291 case CONST:
4292 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4293 if (temp)
4294 temp = gen_rtx_CONST (mode, temp);
4295 return temp;
4296 case PLUS:
4297 case MINUS:
4298 if (CONST_INT_P (XEXP (x, 1)))
4299 {
4300 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4301 if (temp)
4302 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4303 }
4304 break;
4305 default:
4306 break;
4307 }
4308 /* Don't know how to express ptr_extend as an operation in debug info. */
4309 return NULL;
4310 }
4311 #endif /* POINTERS_EXTEND_UNSIGNED */
4312
4313 return x;
4314 }
4315
4316 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4317 by avoid_deep_ter_for_debug. */
4318
4319 static hash_map<tree, tree> *deep_ter_debug_map;
4320
4321 /* Split too deep TER chains for debug stmts using debug temporaries. */
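/* A hypothetical illustration: with a long chain of single-use definitions
     _1 = a + b;  _2 = _1 * c;  _3 = _2 - d;  ...
   TER would substitute the whole chain into a debug stmt that uses the
   final SSA name.  Once the chain gets deeper than 6, a DEBUG_EXPR_DECL is
   bound to the intermediate value instead and recorded in
   deep_ter_debug_map so later debug expansion can refer to it.  */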
4322
4323 static void
4324 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4325 {
4326 use_operand_p use_p;
4327 ssa_op_iter iter;
4328 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4329 {
4330 tree use = USE_FROM_PTR (use_p);
4331 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4332 continue;
4333 gimple *g = get_gimple_for_ssa_name (use);
4334 if (g == NULL)
4335 continue;
4336 if (depth > 6 && !stmt_ends_bb_p (g))
4337 {
4338 if (deep_ter_debug_map == NULL)
4339 deep_ter_debug_map = new hash_map<tree, tree>;
4340
4341 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4342 if (vexpr != NULL)
4343 continue;
4344 vexpr = make_node (DEBUG_EXPR_DECL);
4345 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4346 DECL_ARTIFICIAL (vexpr) = 1;
4347 TREE_TYPE (vexpr) = TREE_TYPE (use);
4348 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4349 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4350 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4351 avoid_deep_ter_for_debug (def_temp, 0);
4352 }
4353 else
4354 avoid_deep_ter_for_debug (g, depth + 1);
4355 }
4356 }
4357
4358 /* Return an RTX equivalent to the value of the parameter DECL. */
4359
4360 static rtx
4361 expand_debug_parm_decl (tree decl)
4362 {
4363 rtx incoming = DECL_INCOMING_RTL (decl);
4364
4365 if (incoming
4366 && GET_MODE (incoming) != BLKmode
4367 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4368 || (MEM_P (incoming)
4369 && REG_P (XEXP (incoming, 0))
4370 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4371 {
4372 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4373
4374 #ifdef HAVE_window_save
4375 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4376 If the target machine has an explicit window save instruction, the
4377 actual entry value is the corresponding OUTGOING_REGNO instead. */
4378 if (REG_P (incoming)
4379 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4380 incoming
4381 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4382 OUTGOING_REGNO (REGNO (incoming)), 0);
4383 else if (MEM_P (incoming))
4384 {
4385 rtx reg = XEXP (incoming, 0);
4386 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4387 {
4388 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4389 incoming = replace_equiv_address_nv (incoming, reg);
4390 }
4391 else
4392 incoming = copy_rtx (incoming);
4393 }
4394 #endif
4395
4396 ENTRY_VALUE_EXP (rtl) = incoming;
4397 return rtl;
4398 }
4399
4400 if (incoming
4401 && GET_MODE (incoming) != BLKmode
4402 && !TREE_ADDRESSABLE (decl)
4403 && MEM_P (incoming)
4404 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4405 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4406 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4407 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4408 return copy_rtx (incoming);
4409
4410 return NULL_RTX;
4411 }
4412
4413 /* Return an RTX equivalent to the value of the tree expression EXP. */
4414
4415 static rtx
4416 expand_debug_expr (tree exp)
4417 {
4418 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4419 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4420 machine_mode inner_mode = VOIDmode;
4421 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4422 addr_space_t as;
4423 scalar_int_mode op0_mode, op1_mode, addr_mode;
4424
4425 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4426 {
4427 case tcc_expression:
4428 switch (TREE_CODE (exp))
4429 {
4430 case COND_EXPR:
4431 case DOT_PROD_EXPR:
4432 case SAD_EXPR:
4433 case WIDEN_MULT_PLUS_EXPR:
4434 case WIDEN_MULT_MINUS_EXPR:
4435 goto ternary;
4436
4437 case TRUTH_ANDIF_EXPR:
4438 case TRUTH_ORIF_EXPR:
4439 case TRUTH_AND_EXPR:
4440 case TRUTH_OR_EXPR:
4441 case TRUTH_XOR_EXPR:
4442 goto binary;
4443
4444 case TRUTH_NOT_EXPR:
4445 goto unary;
4446
4447 default:
4448 break;
4449 }
4450 break;
4451
4452 ternary:
4453 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4454 if (!op2)
4455 return NULL_RTX;
4456 /* Fall through. */
4457
4458 binary:
4459 case tcc_binary:
4460 if (mode == BLKmode)
4461 return NULL_RTX;
4462 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4463 if (!op1)
4464 return NULL_RTX;
4465 switch (TREE_CODE (exp))
4466 {
4467 case LSHIFT_EXPR:
4468 case RSHIFT_EXPR:
4469 case LROTATE_EXPR:
4470 case RROTATE_EXPR:
4471 case WIDEN_LSHIFT_EXPR:
4472 /* Ensure second operand isn't wider than the first one. */
4473 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4474 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4475 && (GET_MODE_UNIT_PRECISION (mode)
4476 < GET_MODE_PRECISION (op1_mode)))
4477 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4478 break;
4479 default:
4480 break;
4481 }
4482 /* Fall through. */
4483
4484 unary:
4485 case tcc_unary:
4486 if (mode == BLKmode)
4487 return NULL_RTX;
4488 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4489 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4490 if (!op0)
4491 return NULL_RTX;
4492 break;
4493
4494 case tcc_comparison:
4495 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4496 goto binary;
4497
4498 case tcc_type:
4499 case tcc_statement:
4500 gcc_unreachable ();
4501
4502 case tcc_constant:
4503 case tcc_exceptional:
4504 case tcc_declaration:
4505 case tcc_reference:
4506 case tcc_vl_exp:
4507 break;
4508 }
4509
4510 switch (TREE_CODE (exp))
4511 {
4512 case STRING_CST:
4513 if (!lookup_constant_def (exp))
4514 {
4515 if (strlen (TREE_STRING_POINTER (exp)) + 1
4516 != (size_t) TREE_STRING_LENGTH (exp))
4517 return NULL_RTX;
4518 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4519 op0 = gen_rtx_MEM (BLKmode, op0);
4520 set_mem_attributes (op0, exp, 0);
4521 return op0;
4522 }
4523 /* Fall through. */
4524
4525 case INTEGER_CST:
4526 case REAL_CST:
4527 case FIXED_CST:
4528 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4529 return op0;
4530
4531 case POLY_INT_CST:
4532 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4533
4534 case COMPLEX_CST:
4535 gcc_assert (COMPLEX_MODE_P (mode));
4536 op0 = expand_debug_expr (TREE_REALPART (exp));
4537 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4538 return gen_rtx_CONCAT (mode, op0, op1);
4539
4540 case DEBUG_EXPR_DECL:
4541 op0 = DECL_RTL_IF_SET (exp);
4542
4543 if (op0)
4544 {
4545 if (GET_MODE (op0) != mode)
4546 gcc_assert (VECTOR_TYPE_P (TREE_TYPE (exp)));
4547 else
4548 return op0;
4549 }
4550
4551 op0 = gen_rtx_DEBUG_EXPR (mode);
4552 DEBUG_EXPR_TREE_DECL (op0) = exp;
4553 SET_DECL_RTL (exp, op0);
4554
4555 return op0;
4556
4557 case VAR_DECL:
4558 case PARM_DECL:
4559 case FUNCTION_DECL:
4560 case LABEL_DECL:
4561 case CONST_DECL:
4562 case RESULT_DECL:
4563 op0 = DECL_RTL_IF_SET (exp);
4564
4565 /* This decl was probably optimized away. */
4566 if (!op0
4567 /* At least label RTXen are sometimes replaced by
4568 NOTE_INSN_DELETED_LABEL. Any notes here are not
4569 handled by copy_rtx. */
4570 || NOTE_P (op0))
4571 {
4572 if (!VAR_P (exp)
4573 || DECL_EXTERNAL (exp)
4574 || !TREE_STATIC (exp)
4575 || !DECL_NAME (exp)
4576 || DECL_HARD_REGISTER (exp)
4577 || DECL_IN_CONSTANT_POOL (exp)
4578 || mode == VOIDmode)
4579 return NULL;
4580
4581 op0 = make_decl_rtl_for_debug (exp);
4582 if (!MEM_P (op0)
4583 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4584 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4585 return NULL;
4586 }
4587 else
4588 op0 = copy_rtx (op0);
4589
4590 if (GET_MODE (op0) == BLKmode
4591 /* If op0 is not BLKmode, but mode is, adjust_mode
4592 below would ICE. While it is likely a FE bug,
4593 try to be robust here. See PR43166. */
4594 || mode == BLKmode
4595 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4596 {
4597 gcc_assert (MEM_P (op0));
4598 op0 = adjust_address_nv (op0, mode, 0);
4599 return op0;
4600 }
4601
4602 /* Fall through. */
4603
4604 adjust_mode:
4605 case PAREN_EXPR:
4606 CASE_CONVERT:
4607 {
4608 inner_mode = GET_MODE (op0);
4609
4610 if (mode == inner_mode)
4611 return op0;
4612
4613 if (inner_mode == VOIDmode)
4614 {
4615 if (TREE_CODE (exp) == SSA_NAME)
4616 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4617 else
4618 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4619 if (mode == inner_mode)
4620 return op0;
4621 }
4622
4623 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4624 {
4625 if (GET_MODE_UNIT_BITSIZE (mode)
4626 == GET_MODE_UNIT_BITSIZE (inner_mode))
4627 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4628 else if (GET_MODE_UNIT_BITSIZE (mode)
4629 < GET_MODE_UNIT_BITSIZE (inner_mode))
4630 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4631 else
4632 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4633 }
4634 else if (FLOAT_MODE_P (mode))
4635 {
4636 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4637 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4638 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4639 else
4640 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4641 }
4642 else if (FLOAT_MODE_P (inner_mode))
4643 {
4644 if (unsignedp)
4645 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4646 else
4647 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4648 }
4649 else if (GET_MODE_UNIT_PRECISION (mode)
4650 == GET_MODE_UNIT_PRECISION (inner_mode))
4651 op0 = lowpart_subreg (mode, op0, inner_mode);
4652 else if (GET_MODE_UNIT_PRECISION (mode)
4653 < GET_MODE_UNIT_PRECISION (inner_mode))
4654 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4655 else if (UNARY_CLASS_P (exp)
4656 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4657 : unsignedp)
4658 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4659 else
4660 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4661
4662 return op0;
4663 }
4664
4665 case MEM_REF:
4666 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4667 {
4668 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4669 TREE_OPERAND (exp, 0),
4670 TREE_OPERAND (exp, 1));
4671 if (newexp)
4672 return expand_debug_expr (newexp);
4673 }
4674 /* FALLTHROUGH */
4675 case INDIRECT_REF:
4676 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4677 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4678 if (!op0)
4679 return NULL;
4680
4681 if (TREE_CODE (exp) == MEM_REF)
4682 {
4683 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4684 || (GET_CODE (op0) == PLUS
4685 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4686 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4687 Instead just use get_inner_reference. */
4688 goto component_ref;
4689
4690 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4691 poly_int64 offset;
4692 if (!op1 || !poly_int_rtx_p (op1, &offset))
4693 return NULL;
4694
4695 op0 = plus_constant (inner_mode, op0, offset);
4696 }
4697
4698 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4699
4700 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4701 op0, as);
4702 if (op0 == NULL_RTX)
4703 return NULL;
4704
4705 op0 = gen_rtx_MEM (mode, op0);
4706 set_mem_attributes (op0, exp, 0);
4707 if (TREE_CODE (exp) == MEM_REF
4708 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4709 set_mem_expr (op0, NULL_TREE);
4710 set_mem_addr_space (op0, as);
4711
4712 return op0;
4713
4714 case TARGET_MEM_REF:
4715 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4716 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4717 return NULL;
4718
4719 op0 = expand_debug_expr
4720 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4721 if (!op0)
4722 return NULL;
4723
4724 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4725 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4726 op0, as);
4727 if (op0 == NULL_RTX)
4728 return NULL;
4729
4730 op0 = gen_rtx_MEM (mode, op0);
4731
4732 set_mem_attributes (op0, exp, 0);
4733 set_mem_addr_space (op0, as);
4734
4735 return op0;
4736
4737 component_ref:
4738 case ARRAY_REF:
4739 case ARRAY_RANGE_REF:
4740 case COMPONENT_REF:
4741 case BIT_FIELD_REF:
4742 case REALPART_EXPR:
4743 case IMAGPART_EXPR:
4744 case VIEW_CONVERT_EXPR:
4745 {
4746 machine_mode mode1;
4747 poly_int64 bitsize, bitpos;
4748 tree offset;
4749 int reversep, volatilep = 0;
4750 tree tem
4751 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4752 &unsignedp, &reversep, &volatilep);
4753 rtx orig_op0;
4754
4755 if (known_eq (bitsize, 0))
4756 return NULL;
4757
4758 orig_op0 = op0 = expand_debug_expr (tem);
4759
4760 if (!op0)
4761 return NULL;
4762
4763 if (offset)
4764 {
4765 machine_mode addrmode, offmode;
4766
4767 if (!MEM_P (op0))
4768 return NULL;
4769
4770 op0 = XEXP (op0, 0);
4771 addrmode = GET_MODE (op0);
4772 if (addrmode == VOIDmode)
4773 addrmode = Pmode;
4774
4775 op1 = expand_debug_expr (offset);
4776 if (!op1)
4777 return NULL;
4778
4779 offmode = GET_MODE (op1);
4780 if (offmode == VOIDmode)
4781 offmode = TYPE_MODE (TREE_TYPE (offset));
4782
4783 if (addrmode != offmode)
4784 op1 = lowpart_subreg (addrmode, op1, offmode);
4785
4786 /* Don't use offset_address here; we don't need a
4787 recognizable address, and we don't want to generate
4788 code. */
4789 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4790 op0, op1));
4791 }
4792
4793 if (MEM_P (op0))
4794 {
4795 if (mode1 == VOIDmode)
4796 {
4797 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4798 return NULL;
4799 /* Bitfield. */
4800 mode1 = smallest_int_mode_for_size (bitsize);
4801 }
4802 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4803 if (maybe_ne (bytepos, 0))
4804 {
4805 op0 = adjust_address_nv (op0, mode1, bytepos);
4806 bitpos = num_trailing_bits (bitpos);
4807 }
4808 else if (known_eq (bitpos, 0)
4809 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4810 op0 = adjust_address_nv (op0, mode, 0);
4811 else if (GET_MODE (op0) != mode1)
4812 op0 = adjust_address_nv (op0, mode1, 0);
4813 else
4814 op0 = copy_rtx (op0);
4815 if (op0 == orig_op0)
4816 op0 = shallow_copy_rtx (op0);
4817 if (TREE_CODE (tem) != SSA_NAME)
4818 set_mem_attributes (op0, exp, 0);
4819 }
4820
4821 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4822 return op0;
4823
4824 if (maybe_lt (bitpos, 0))
4825 return NULL;
4826
4827 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4828 return NULL;
4829
4830 poly_int64 bytepos;
4831 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4832 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4833 {
4834 machine_mode opmode = GET_MODE (op0);
4835
4836 if (opmode == VOIDmode)
4837 opmode = TYPE_MODE (TREE_TYPE (tem));
4838
4839 /* This condition may hold if we're expanding the address
4840 right past the end of an array that turned out not to
4841 be addressable (i.e., the address was only computed in
4842 debug stmts). The gen_subreg below would rightfully
4843 crash, and the address doesn't really exist, so just
4844 drop it. */
4845 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4846 return NULL;
4847
4848 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4849 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4850 }
4851
4852 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4853 && TYPE_UNSIGNED (TREE_TYPE (exp))
4854 ? SIGN_EXTRACT
4855 : ZERO_EXTRACT, mode,
4856 GET_MODE (op0) != VOIDmode
4857 ? GET_MODE (op0)
4858 : TYPE_MODE (TREE_TYPE (tem)),
4859 op0, gen_int_mode (bitsize, word_mode),
4860 gen_int_mode (bitpos, word_mode));
4861 }
4862
4863 case ABS_EXPR:
4864 case ABSU_EXPR:
4865 return simplify_gen_unary (ABS, mode, op0, mode);
4866
4867 case NEGATE_EXPR:
4868 return simplify_gen_unary (NEG, mode, op0, mode);
4869
4870 case BIT_NOT_EXPR:
4871 return simplify_gen_unary (NOT, mode, op0, mode);
4872
4873 case FLOAT_EXPR:
4874 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4875 0)))
4876 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4877 inner_mode);
4878
4879 case FIX_TRUNC_EXPR:
4880 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4881 inner_mode);
4882
4883 case POINTER_PLUS_EXPR:
4884 /* For the rare target where pointers are not the same size as
4885 size_t, we need to check for mis-matched modes and correct
4886 the addend. */
4887 if (op0 && op1
4888 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4889 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4890 && op0_mode != op1_mode)
4891 {
4892 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4893 /* If OP0 is a partial mode, then we must truncate, even
4894 if it has the same bitsize as OP1, since GCC's
4895 representation of partial modes is opaque. */
4896 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4897 && (GET_MODE_BITSIZE (op0_mode)
4898 == GET_MODE_BITSIZE (op1_mode))))
4899 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4900 else
4901 /* We always sign-extend, regardless of the signedness of
4902 the operand, because the operand is always unsigned
4903 here even if the original C expression is signed. */
4904 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4905 }
4906 /* Fall through. */
4907 case PLUS_EXPR:
4908 return simplify_gen_binary (PLUS, mode, op0, op1);
4909
4910 case MINUS_EXPR:
4911 case POINTER_DIFF_EXPR:
4912 return simplify_gen_binary (MINUS, mode, op0, op1);
4913
4914 case MULT_EXPR:
4915 return simplify_gen_binary (MULT, mode, op0, op1);
4916
4917 case RDIV_EXPR:
4918 case TRUNC_DIV_EXPR:
4919 case EXACT_DIV_EXPR:
4920 if (unsignedp)
4921 return simplify_gen_binary (UDIV, mode, op0, op1);
4922 else
4923 return simplify_gen_binary (DIV, mode, op0, op1);
4924
4925 case TRUNC_MOD_EXPR:
4926 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4927
4928 case FLOOR_DIV_EXPR:
4929 if (unsignedp)
4930 return simplify_gen_binary (UDIV, mode, op0, op1);
4931 else
4932 {
4933 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4934 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4935 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4936 return simplify_gen_binary (PLUS, mode, div, adj);
4937 }
4938
4939 case FLOOR_MOD_EXPR:
4940 if (unsignedp)
4941 return simplify_gen_binary (UMOD, mode, op0, op1);
4942 else
4943 {
4944 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4945 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4946 adj = simplify_gen_unary (NEG, mode,
4947 simplify_gen_binary (MULT, mode, adj, op1),
4948 mode);
4949 return simplify_gen_binary (PLUS, mode, mod, adj);
4950 }
4951
4952 case CEIL_DIV_EXPR:
4953 if (unsignedp)
4954 {
4955 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4956 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4957 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4958 return simplify_gen_binary (PLUS, mode, div, adj);
4959 }
4960 else
4961 {
4962 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4963 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4964 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4965 return simplify_gen_binary (PLUS, mode, div, adj);
4966 }
4967
4968 case CEIL_MOD_EXPR:
4969 if (unsignedp)
4970 {
4971 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4972 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4973 adj = simplify_gen_unary (NEG, mode,
4974 simplify_gen_binary (MULT, mode, adj, op1),
4975 mode);
4976 return simplify_gen_binary (PLUS, mode, mod, adj);
4977 }
4978 else
4979 {
4980 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4981 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4982 adj = simplify_gen_unary (NEG, mode,
4983 simplify_gen_binary (MULT, mode, adj, op1),
4984 mode);
4985 return simplify_gen_binary (PLUS, mode, mod, adj);
4986 }
4987
4988 case ROUND_DIV_EXPR:
4989 if (unsignedp)
4990 {
4991 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4992 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4993 rtx adj = round_udiv_adjust (mode, mod, op1);
4994 return simplify_gen_binary (PLUS, mode, div, adj);
4995 }
4996 else
4997 {
4998 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4999 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5000 rtx adj = round_sdiv_adjust (mode, mod, op1);
5001 return simplify_gen_binary (PLUS, mode, div, adj);
5002 }
5003
5004 case ROUND_MOD_EXPR:
5005 if (unsignedp)
5006 {
5007 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
5008 rtx adj = round_udiv_adjust (mode, mod, op1);
5009 adj = simplify_gen_unary (NEG, mode,
5010 simplify_gen_binary (MULT, mode, adj, op1),
5011 mode);
5012 return simplify_gen_binary (PLUS, mode, mod, adj);
5013 }
5014 else
5015 {
5016 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
5017 rtx adj = round_sdiv_adjust (mode, mod, op1);
5018 adj = simplify_gen_unary (NEG, mode,
5019 simplify_gen_binary (MULT, mode, adj, op1),
5020 mode);
5021 return simplify_gen_binary (PLUS, mode, mod, adj);
5022 }
5023
5024 case LSHIFT_EXPR:
5025 return simplify_gen_binary (ASHIFT, mode, op0, op1);
5026
5027 case RSHIFT_EXPR:
5028 if (unsignedp)
5029 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
5030 else
5031 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
5032
5033 case LROTATE_EXPR:
5034 return simplify_gen_binary (ROTATE, mode, op0, op1);
5035
5036 case RROTATE_EXPR:
5037 return simplify_gen_binary (ROTATERT, mode, op0, op1);
5038
5039 case MIN_EXPR:
5040 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
5041
5042 case MAX_EXPR:
5043 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
5044
5045 case BIT_AND_EXPR:
5046 case TRUTH_AND_EXPR:
5047 return simplify_gen_binary (AND, mode, op0, op1);
5048
5049 case BIT_IOR_EXPR:
5050 case TRUTH_OR_EXPR:
5051 return simplify_gen_binary (IOR, mode, op0, op1);
5052
5053 case BIT_XOR_EXPR:
5054 case TRUTH_XOR_EXPR:
5055 return simplify_gen_binary (XOR, mode, op0, op1);
5056
5057 case TRUTH_ANDIF_EXPR:
5058 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
5059
5060 case TRUTH_ORIF_EXPR:
5061 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
5062
5063 case TRUTH_NOT_EXPR:
5064 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
5065
5066 case LT_EXPR:
5067 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
5068 op0, op1);
5069
5070 case LE_EXPR:
5071 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
5072 op0, op1);
5073
5074 case GT_EXPR:
5075 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
5076 op0, op1);
5077
5078 case GE_EXPR:
5079 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
5080 op0, op1);
5081
5082 case EQ_EXPR:
5083 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
5084
5085 case NE_EXPR:
5086 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
5087
5088 case UNORDERED_EXPR:
5089 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
5090
5091 case ORDERED_EXPR:
5092 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
5093
5094 case UNLT_EXPR:
5095 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
5096
5097 case UNLE_EXPR:
5098 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
5099
5100 case UNGT_EXPR:
5101 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
5102
5103 case UNGE_EXPR:
5104 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
5105
5106 case UNEQ_EXPR:
5107 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
5108
5109 case LTGT_EXPR:
5110 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
5111
5112 case COND_EXPR:
5113 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
5114
5115 case COMPLEX_EXPR:
5116 gcc_assert (COMPLEX_MODE_P (mode));
5117 if (GET_MODE (op0) == VOIDmode)
5118 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
5119 if (GET_MODE (op1) == VOIDmode)
5120 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
5121 return gen_rtx_CONCAT (mode, op0, op1);
5122
5123 case CONJ_EXPR:
5124 if (GET_CODE (op0) == CONCAT)
5125 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
5126 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
5127 XEXP (op0, 1),
5128 GET_MODE_INNER (mode)));
5129 else
5130 {
5131 scalar_mode imode = GET_MODE_INNER (mode);
5132 rtx re, im;
5133
5134 if (MEM_P (op0))
5135 {
5136 re = adjust_address_nv (op0, imode, 0);
5137 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
5138 }
5139 else
5140 {
5141 scalar_int_mode ifmode;
5142 scalar_int_mode ihmode;
5143 rtx halfsize;
5144 if (!int_mode_for_mode (mode).exists (&ifmode)
5145 || !int_mode_for_mode (imode).exists (&ihmode))
5146 return NULL;
5147 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
5148 re = op0;
5149 if (mode != ifmode)
5150 re = gen_rtx_SUBREG (ifmode, re, 0);
5151 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
5152 if (imode != ihmode)
5153 re = gen_rtx_SUBREG (imode, re, 0);
5154 im = copy_rtx (op0);
5155 if (mode != ifmode)
5156 im = gen_rtx_SUBREG (ifmode, im, 0);
5157 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
5158 if (imode != ihmode)
5159 im = gen_rtx_SUBREG (imode, im, 0);
5160 }
5161 im = gen_rtx_NEG (imode, im);
5162 return gen_rtx_CONCAT (mode, re, im);
5163 }
5164
5165 case ADDR_EXPR:
5166 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
5167 if (!op0 || !MEM_P (op0))
5168 {
5169 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5170 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5171 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5172 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5173 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5174 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5175
5176 if (handled_component_p (TREE_OPERAND (exp, 0)))
5177 {
5178 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5179 bool reverse;
5180 tree decl
5181 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5182 &bitsize, &maxsize, &reverse);
5183 if ((VAR_P (decl)
5184 || TREE_CODE (decl) == PARM_DECL
5185 || TREE_CODE (decl) == RESULT_DECL)
5186 && (!TREE_ADDRESSABLE (decl)
5187 || target_for_debug_bind (decl))
5188 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5189 && known_gt (bitsize, 0)
5190 && known_eq (bitsize, maxsize))
5191 {
5192 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5193 return plus_constant (mode, base, byteoffset);
5194 }
5195 }
5196
5197 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5198 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5199 == ADDR_EXPR)
5200 {
5201 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5202 0));
5203 if (op0 != NULL
5204 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5205 || (GET_CODE (op0) == PLUS
5206 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5207 && CONST_INT_P (XEXP (op0, 1)))))
5208 {
5209 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5210 1));
5211 poly_int64 offset;
5212 if (!op1 || !poly_int_rtx_p (op1, &offset))
5213 return NULL;
5214
5215 return plus_constant (mode, op0, offset);
5216 }
5217 }
5218
5219 return NULL;
5220 }
5221
5222 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5223 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5224 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5225
5226 return op0;
5227
5228 case VECTOR_CST:
5229 {
5230 unsigned HOST_WIDE_INT i, nelts;
5231
5232 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5233 return NULL;
5234
5235 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5236
5237 for (i = 0; i < nelts; ++i)
5238 {
5239 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5240 if (!op1)
5241 return NULL;
5242 XVECEXP (op0, 0, i) = op1;
5243 }
5244
5245 return op0;
5246 }
5247
5248 case CONSTRUCTOR:
5249 if (TREE_CLOBBER_P (exp))
5250 return NULL;
5251 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5252 {
5253 unsigned i;
5254 unsigned HOST_WIDE_INT nelts;
5255 tree val;
5256
5257 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5258 goto flag_unsupported;
5259
5260 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5261
5262 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5263 {
5264 op1 = expand_debug_expr (val);
5265 if (!op1)
5266 return NULL;
5267 XVECEXP (op0, 0, i) = op1;
5268 }
5269
5270 if (i < nelts)
5271 {
5272 op1 = expand_debug_expr
5273 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5274
5275 if (!op1)
5276 return NULL;
5277
5278 for (; i < nelts; i++)
5279 XVECEXP (op0, 0, i) = op1;
5280 }
5281
5282 return op0;
5283 }
5284 else
5285 goto flag_unsupported;
5286
5287 case CALL_EXPR:
5288 /* ??? Maybe handle some builtins? */
5289 return NULL;
5290
5291 case SSA_NAME:
5292 {
5293 gimple *g = get_gimple_for_ssa_name (exp);
5294 if (g)
5295 {
5296 tree t = NULL_TREE;
5297 if (deep_ter_debug_map)
5298 {
5299 tree *slot = deep_ter_debug_map->get (exp);
5300 if (slot)
5301 t = *slot;
5302 }
5303 if (t == NULL_TREE)
5304 t = gimple_assign_rhs_to_tree (g);
5305 op0 = expand_debug_expr (t);
5306 if (!op0)
5307 return NULL;
5308 }
5309 else
5310 {
5311 /* If this is a reference to an incoming value of a
5312 parameter that is never used in the code, or where the
5313 incoming value is never used in the code, use the
5314 PARM_DECL's DECL_RTL if set. */
5315 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5316 && SSA_NAME_VAR (exp)
5317 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5318 && has_zero_uses (exp))
5319 {
5320 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5321 if (op0)
5322 goto adjust_mode;
5323 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5324 if (op0)
5325 goto adjust_mode;
5326 }
5327
5328 int part = var_to_partition (SA.map, exp);
5329
5330 if (part == NO_PARTITION)
5331 return NULL;
5332
5333 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5334
5335 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5336 }
5337 goto adjust_mode;
5338 }
5339
5340 case ERROR_MARK:
5341 return NULL;
5342
5343 /* Vector stuff. For most of the codes we don't have rtl codes. */
5344 case REALIGN_LOAD_EXPR:
5345 case VEC_COND_EXPR:
5346 case VEC_PACK_FIX_TRUNC_EXPR:
5347 case VEC_PACK_FLOAT_EXPR:
5348 case VEC_PACK_SAT_EXPR:
5349 case VEC_PACK_TRUNC_EXPR:
5350 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5351 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5352 case VEC_UNPACK_FLOAT_HI_EXPR:
5353 case VEC_UNPACK_FLOAT_LO_EXPR:
5354 case VEC_UNPACK_HI_EXPR:
5355 case VEC_UNPACK_LO_EXPR:
5356 case VEC_WIDEN_MULT_HI_EXPR:
5357 case VEC_WIDEN_MULT_LO_EXPR:
5358 case VEC_WIDEN_MULT_EVEN_EXPR:
5359 case VEC_WIDEN_MULT_ODD_EXPR:
5360 case VEC_WIDEN_LSHIFT_HI_EXPR:
5361 case VEC_WIDEN_LSHIFT_LO_EXPR:
5362 case VEC_PERM_EXPR:
5363 case VEC_DUPLICATE_EXPR:
5364 case VEC_SERIES_EXPR:
5365 case SAD_EXPR:
5366 return NULL;
5367
5368 /* Misc codes. */
5369 case ADDR_SPACE_CONVERT_EXPR:
5370 case FIXED_CONVERT_EXPR:
5371 case OBJ_TYPE_REF:
5372 case WITH_SIZE_EXPR:
5373 case BIT_INSERT_EXPR:
5374 return NULL;
5375
5376 case DOT_PROD_EXPR:
5377 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5378 && SCALAR_INT_MODE_P (mode))
5379 {
5380 op0
5381 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5382 0)))
5383 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5384 inner_mode);
5385 op1
5386 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5387 1)))
5388 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5389 inner_mode);
5390 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5391 return simplify_gen_binary (PLUS, mode, op0, op2);
5392 }
5393 return NULL;
5394
5395 case WIDEN_MULT_EXPR:
5396 case WIDEN_MULT_PLUS_EXPR:
5397 case WIDEN_MULT_MINUS_EXPR:
5398 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5399 && SCALAR_INT_MODE_P (mode))
5400 {
5401 inner_mode = GET_MODE (op0);
5402 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5403 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5404 else
5405 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5406 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5407 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5408 else
5409 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5410 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5411 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5412 return op0;
5413 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5414 return simplify_gen_binary (PLUS, mode, op0, op2);
5415 else
5416 return simplify_gen_binary (MINUS, mode, op2, op0);
5417 }
5418 return NULL;
5419
5420 case MULT_HIGHPART_EXPR:
5421 /* ??? Similar to the above. */
5422 return NULL;
5423
5424 case WIDEN_SUM_EXPR:
5425 case WIDEN_LSHIFT_EXPR:
5426 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5427 && SCALAR_INT_MODE_P (mode))
5428 {
5429 op0
5430 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5431 0)))
5432 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5433 inner_mode);
5434 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5435 ? ASHIFT : PLUS, mode, op0, op1);
5436 }
5437 return NULL;
5438
5439 default:
5440 flag_unsupported:
5441 if (flag_checking)
5442 {
5443 debug_tree (exp);
5444 gcc_unreachable ();
5445 }
5446 return NULL;
5447 }
5448 }
5449
5450 /* Return an RTX equivalent to the source bind value of the tree expression
5451 EXP. */
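/* For instance (a paraphrase of the PARM_DECL case handled below, not new
   behavior): when a parameter's incoming value has been completely
   optimized out but the parameter is still listed in the current
   function's debug args, this returns a DEBUG_PARAMETER_REF so that
   later debug passes can still refer to it.  */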
5452
5453 static rtx
5454 expand_debug_source_expr (tree exp)
5455 {
5456 rtx op0 = NULL_RTX;
5457 machine_mode mode = VOIDmode, inner_mode;
5458
5459 switch (TREE_CODE (exp))
5460 {
5461 case VAR_DECL:
5462 if (DECL_ABSTRACT_ORIGIN (exp))
5463 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5464 break;
5465 case PARM_DECL:
5466 {
5467 mode = DECL_MODE (exp);
5468 op0 = expand_debug_parm_decl (exp);
5469 if (op0)
5470 break;
5471 /* See if this isn't an argument that has been completely
5472 optimized out. */
5473 if (!DECL_RTL_SET_P (exp)
5474 && !DECL_INCOMING_RTL (exp)
5475 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5476 {
5477 tree aexp = DECL_ORIGIN (exp);
5478 if (DECL_CONTEXT (aexp)
5479 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5480 {
5481 vec<tree, va_gc> **debug_args;
5482 unsigned int ix;
5483 tree ddecl;
5484 debug_args = decl_debug_args_lookup (current_function_decl);
5485 if (debug_args != NULL)
5486 {
5487 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5488 ix += 2)
5489 if (ddecl == aexp)
5490 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5491 }
5492 }
5493 }
5494 break;
5495 }
5496 default:
5497 break;
5498 }
5499
5500 if (op0 == NULL_RTX)
5501 return NULL_RTX;
5502
5503 inner_mode = GET_MODE (op0);
5504 if (mode == inner_mode)
5505 return op0;
5506
5507 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5508 {
5509 if (GET_MODE_UNIT_BITSIZE (mode)
5510 == GET_MODE_UNIT_BITSIZE (inner_mode))
5511 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5512 else if (GET_MODE_UNIT_BITSIZE (mode)
5513 < GET_MODE_UNIT_BITSIZE (inner_mode))
5514 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5515 else
5516 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5517 }
5518 else if (FLOAT_MODE_P (mode))
5519 gcc_unreachable ();
5520 else if (FLOAT_MODE_P (inner_mode))
5521 {
5522 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5523 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5524 else
5525 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5526 }
5527 else if (GET_MODE_UNIT_PRECISION (mode)
5528 == GET_MODE_UNIT_PRECISION (inner_mode))
5529 op0 = lowpart_subreg (mode, op0, inner_mode);
5530 else if (GET_MODE_UNIT_PRECISION (mode)
5531 < GET_MODE_UNIT_PRECISION (inner_mode))
5532 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5533 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5534 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5535 else
5536 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5537
5538 return op0;
5539 }
5540
5541 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbounded complexity.
5542 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5543 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
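/* An illustrative sketch (hypothetical location, not taken from any
   testcase): for a bound location such as
     (plus (mult (plus (mult (plus a b) c) d) e) f)
   the non-object subexpression reached at depth four, here (plus a b),
   is pulled out into a fresh DEBUG_EXPR; a DEBUG_INSN binding that
   DEBUG_EXPR to the extracted subexpression is emitted before INSN, and
   the original location then refers to the DEBUG_EXPR instead, so no
   single location keeps growing without bound.  */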
5544
5545 static void
5546 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5547 {
5548 rtx exp = *exp_p;
5549
5550 if (exp == NULL_RTX)
5551 return;
5552
5553 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5554 return;
5555
5556 if (depth == 4)
5557 {
5558 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5559 rtx dval = make_debug_expr_from_rtl (exp);
5560
5561 /* Emit a debug bind insn before INSN. */
5562 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5563 DEBUG_EXPR_TREE_DECL (dval), exp,
5564 VAR_INIT_STATUS_INITIALIZED);
5565
5566 emit_debug_insn_before (bind, insn);
5567 *exp_p = dval;
5568 return;
5569 }
5570
5571 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5572 int i, j;
5573 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5574 switch (*format_ptr++)
5575 {
5576 case 'e':
5577 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5578 break;
5579
5580 case 'E':
5581 case 'V':
5582 for (j = 0; j < XVECLEN (exp, i); j++)
5583 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5584 break;
5585
5586 default:
5587 break;
5588 }
5589 }
5590
5591 /* Expand the _LOCs in debug insns. We run this after expanding all
5592 regular insns, so that any variables referenced in the function
5593 will have their DECL_RTLs set. */
5594
5595 static void
5596 expand_debug_locations (void)
5597 {
5598 rtx_insn *insn;
5599 rtx_insn *last = get_last_insn ();
5600 int save_strict_alias = flag_strict_aliasing;
5601
5602 /* New alias sets while setting up memory attributes cause
5603      -fcompare-debug failures, even though they don't bring about any
5604 codegen changes. */
5605 flag_strict_aliasing = 0;
5606
5607 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5608 if (DEBUG_BIND_INSN_P (insn))
5609 {
5610 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5611 rtx val;
5612 rtx_insn *prev_insn, *insn2;
5613 machine_mode mode;
5614
5615 if (value == NULL_TREE)
5616 val = NULL_RTX;
5617 else
5618 {
5619 if (INSN_VAR_LOCATION_STATUS (insn)
5620 == VAR_INIT_STATUS_UNINITIALIZED)
5621 val = expand_debug_source_expr (value);
5622 /* The avoid_deep_ter_for_debug function inserts
5623 debug bind stmts after SSA_NAME definition, with the
5624 SSA_NAME as the whole bind location. Disable temporarily
5625 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5626 being defined in this DEBUG_INSN. */
5627 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5628 {
5629 tree *slot = deep_ter_debug_map->get (value);
5630 if (slot)
5631 {
5632 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5633 *slot = NULL_TREE;
5634 else
5635 slot = NULL;
5636 }
5637 val = expand_debug_expr (value);
5638 if (slot)
5639 *slot = INSN_VAR_LOCATION_DECL (insn);
5640 }
5641 else
5642 val = expand_debug_expr (value);
5643 gcc_assert (last == get_last_insn ());
5644 }
5645
5646 if (!val)
5647 val = gen_rtx_UNKNOWN_VAR_LOC ();
5648 else
5649 {
5650 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5651
5652 gcc_assert (mode == GET_MODE (val)
5653 || (GET_MODE (val) == VOIDmode
5654 && (CONST_SCALAR_INT_P (val)
5655 || GET_CODE (val) == CONST_FIXED
5656 || GET_CODE (val) == LABEL_REF)));
5657 }
5658
5659 INSN_VAR_LOCATION_LOC (insn) = val;
5660 prev_insn = PREV_INSN (insn);
5661 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5662 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5663 }
5664
5665 flag_strict_aliasing = save_strict_alias;
5666 }
5667
5668 /* Swap the operands of commutative operations so that the more
5669    expensive operand is expanded first.  */
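/* For example (illustrative GIMPLE only, not from a testcase): given
     t1_1 = <cheap computation>;
     t2_2 = <expensive computation>;
     r_3  = t1_1 + t2_2;
   the commutative addition is rewritten as
     r_3  = t2_2 + t1_1;
   so that the costlier operand tree is expanded first.  */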
5670
5671 static void
5672 reorder_operands (basic_block bb)
5673 {
5674 unsigned int *lattice; /* Hold cost of each statement. */
5675 unsigned int i = 0, n = 0;
5676 gimple_stmt_iterator gsi;
5677 gimple_seq stmts;
5678 gimple *stmt;
5679 bool swap;
5680 tree op0, op1;
5681 ssa_op_iter iter;
5682 use_operand_p use_p;
5683 gimple *def0, *def1;
5684
5685 /* Compute cost of each statement using estimate_num_insns. */
5686 stmts = bb_seq (bb);
5687 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5688 {
5689 stmt = gsi_stmt (gsi);
5690 if (!is_gimple_debug (stmt))
5691 gimple_set_uid (stmt, n++);
5692 }
5693 lattice = XNEWVEC (unsigned int, n);
5694 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5695 {
5696 unsigned cost;
5697 stmt = gsi_stmt (gsi);
5698 if (is_gimple_debug (stmt))
5699 continue;
5700 cost = estimate_num_insns (stmt, &eni_size_weights);
5701 lattice[i] = cost;
5702 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5703 {
5704 tree use = USE_FROM_PTR (use_p);
5705 gimple *def_stmt;
5706 if (TREE_CODE (use) != SSA_NAME)
5707 continue;
5708 def_stmt = get_gimple_for_ssa_name (use);
5709 if (!def_stmt)
5710 continue;
5711 lattice[i] += lattice[gimple_uid (def_stmt)];
5712 }
5713 i++;
5714 if (!is_gimple_assign (stmt)
5715 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5716 continue;
5717 op0 = gimple_op (stmt, 1);
5718 op1 = gimple_op (stmt, 2);
5719 if (TREE_CODE (op0) != SSA_NAME
5720 || TREE_CODE (op1) != SSA_NAME)
5721 continue;
5722 /* Swap operands if the second one is more expensive. */
5723 def0 = get_gimple_for_ssa_name (op0);
5724 def1 = get_gimple_for_ssa_name (op1);
5725 if (!def1)
5726 continue;
5727 swap = false;
5728 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5729 swap = true;
5730 if (swap)
5731 {
5732 if (dump_file && (dump_flags & TDF_DETAILS))
5733 {
5734 fprintf (dump_file, "Swap operands in stmt:\n");
5735 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5736 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5737 def0 ? lattice[gimple_uid (def0)] : 0,
5738 lattice[gimple_uid (def1)]);
5739 }
5740 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5741 gimple_assign_rhs2_ptr (stmt));
5742 }
5743 }
5744 XDELETE (lattice);
5745 }
5746
5747 /* Expand basic block BB from GIMPLE trees to RTL. */
5748
5749 static basic_block
5750 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5751 {
5752 gimple_stmt_iterator gsi;
5753 gimple_seq stmts;
5754 gimple *stmt = NULL;
5755 rtx_note *note = NULL;
5756 rtx_insn *last;
5757 edge e;
5758 edge_iterator ei;
5759
5760 if (dump_file)
5761 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5762 bb->index);
5763
5764 /* Note that since we are now transitioning from GIMPLE to RTL, we
5765 cannot use the gsi_*_bb() routines because they expect the basic
5766 block to be in GIMPLE, instead of RTL. Therefore, we need to
5767 access the BB sequence directly. */
5768 if (optimize)
5769 reorder_operands (bb);
5770 stmts = bb_seq (bb);
5771 bb->il.gimple.seq = NULL;
5772 bb->il.gimple.phi_nodes = NULL;
5773 rtl_profile_for_bb (bb);
5774 init_rtl_bb_info (bb);
5775 bb->flags |= BB_RTL;
5776
5777   /* Remove the RETURN_EXPR if we may fall through to the exit
5778 instead. */
5779 gsi = gsi_last (stmts);
5780 if (!gsi_end_p (gsi)
5781 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5782 {
5783 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5784
5785 gcc_assert (single_succ_p (bb));
5786 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5787
5788 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5789 && !gimple_return_retval (ret_stmt))
5790 {
5791 gsi_remove (&gsi, false);
5792 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5793 }
5794 }
5795
5796 gsi = gsi_start (stmts);
5797 if (!gsi_end_p (gsi))
5798 {
5799 stmt = gsi_stmt (gsi);
5800 if (gimple_code (stmt) != GIMPLE_LABEL)
5801 stmt = NULL;
5802 }
5803
5804 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5805
5806 if (stmt || elt)
5807 {
5808 gcc_checking_assert (!note);
5809 last = get_last_insn ();
5810
5811 if (stmt)
5812 {
5813 expand_gimple_stmt (stmt);
5814 gsi_next (&gsi);
5815 }
5816
5817 if (elt)
5818 emit_label (*elt);
5819
5820 BB_HEAD (bb) = NEXT_INSN (last);
5821 if (NOTE_P (BB_HEAD (bb)))
5822 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5823 gcc_assert (LABEL_P (BB_HEAD (bb)));
5824 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5825
5826 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5827 }
5828 else
5829 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5830
5831 if (note)
5832 NOTE_BASIC_BLOCK (note) = bb;
5833
5834 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5835 {
5836 basic_block new_bb;
5837
5838 stmt = gsi_stmt (gsi);
5839
5840 /* If this statement is a non-debug one, and we generate debug
5841 insns, then this one might be the last real use of a TERed
5842	 SSA_NAME that still has some debug uses further
5843	 down.  Expanding the current SSA name in those later debug
5844	 uses by its RHS might lead to wrong debug info, as coalescing
5845	 might make the operands of that RHS be placed into the same
5846 pseudo as something else. Like so:
5847 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5848 use(a_1);
5849 a_2 = ...
5850 #DEBUG ... => a_1
5851 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5852	 If we were now to expand a_1 by its RHS (a_0 + 1) in the debug use,
5853 the write to a_2 would actually have clobbered the place which
5854 formerly held a_0.
5855
5856 So, instead of that, we recognize the situation, and generate
5857 debug temporaries at the last real use of TERed SSA names:
5858 a_1 = a_0 + 1;
5859 #DEBUG #D1 => a_1
5860 use(a_1);
5861 a_2 = ...
5862 #DEBUG ... => #D1
5863 */
5864 if (MAY_HAVE_DEBUG_BIND_INSNS
5865 && SA.values
5866 && !is_gimple_debug (stmt))
5867 {
5868 ssa_op_iter iter;
5869 tree op;
5870 gimple *def;
5871
5872 location_t sloc = curr_insn_location ();
5873
5874 /* Look for SSA names that have their last use here (TERed
5875 names always have only one real use). */
5876 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5877 if ((def = get_gimple_for_ssa_name (op)))
5878 {
5879 imm_use_iterator imm_iter;
5880 use_operand_p use_p;
5881 bool have_debug_uses = false;
5882
5883 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5884 {
5885 if (gimple_debug_bind_p (USE_STMT (use_p)))
5886 {
5887 have_debug_uses = true;
5888 break;
5889 }
5890 }
5891
5892 if (have_debug_uses)
5893 {
5894 /* OP is a TERed SSA name, with DEF its defining
5895 statement, and where OP is used in further debug
5896 instructions. Generate a debug temporary, and
5897 replace all uses of OP in debug insns with that
5898 temporary. */
5899 gimple *debugstmt;
5900 tree value = gimple_assign_rhs_to_tree (def);
5901 tree vexpr = make_node (DEBUG_EXPR_DECL);
5902 rtx val;
5903 machine_mode mode;
5904
5905 set_curr_insn_location (gimple_location (def));
5906
5907 DECL_ARTIFICIAL (vexpr) = 1;
5908 TREE_TYPE (vexpr) = TREE_TYPE (value);
5909 if (DECL_P (value))
5910 mode = DECL_MODE (value);
5911 else
5912 mode = TYPE_MODE (TREE_TYPE (value));
5913 SET_DECL_MODE (vexpr, mode);
5914
5915 val = gen_rtx_VAR_LOCATION
5916 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5917
5918 emit_debug_insn (val);
5919
5920 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5921 {
5922 if (!gimple_debug_bind_p (debugstmt))
5923 continue;
5924
5925 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5926 SET_USE (use_p, vexpr);
5927
5928 update_stmt (debugstmt);
5929 }
5930 }
5931 }
5932 set_curr_insn_location (sloc);
5933 }
5934
5935 currently_expanding_gimple_stmt = stmt;
5936
5937 /* Expand this statement, then evaluate the resulting RTL and
5938 fixup the CFG accordingly. */
5939 if (gimple_code (stmt) == GIMPLE_COND)
5940 {
5941 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5942 if (new_bb)
5943 return new_bb;
5944 }
5945 else if (is_gimple_debug (stmt))
5946 {
5947 location_t sloc = curr_insn_location ();
5948 gimple_stmt_iterator nsi = gsi;
5949
5950 for (;;)
5951 {
5952 tree var;
5953 tree value = NULL_TREE;
5954 rtx val = NULL_RTX;
5955 machine_mode mode;
5956
5957 if (!gimple_debug_nonbind_marker_p (stmt))
5958 {
5959 if (gimple_debug_bind_p (stmt))
5960 {
5961 var = gimple_debug_bind_get_var (stmt);
5962
5963 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5964 && TREE_CODE (var) != LABEL_DECL
5965 && !target_for_debug_bind (var))
5966 goto delink_debug_stmt;
5967
5968 if (DECL_P (var) && !VECTOR_TYPE_P (TREE_TYPE (var)))
5969 mode = DECL_MODE (var);
5970 else
5971 mode = TYPE_MODE (TREE_TYPE (var));
5972
5973 if (gimple_debug_bind_has_value_p (stmt))
5974 value = gimple_debug_bind_get_value (stmt);
5975
5976 val = gen_rtx_VAR_LOCATION
5977 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5978 }
5979 else if (gimple_debug_source_bind_p (stmt))
5980 {
5981 var = gimple_debug_source_bind_get_var (stmt);
5982
5983 value = gimple_debug_source_bind_get_value (stmt);
5984
5985 if (!VECTOR_TYPE_P (TREE_TYPE (var)))
5986 mode = DECL_MODE (var);
5987 else
5988 mode = TYPE_MODE (TREE_TYPE (var));
5989
5990 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5991 VAR_INIT_STATUS_UNINITIALIZED);
5992 }
5993 else
5994 gcc_unreachable ();
5995 }
5996 /* If this function was first compiled with markers
5997	     enabled, but they're now disabled (e.g. LTO), drop
5998 them on the floor. */
5999 else if (gimple_debug_nonbind_marker_p (stmt)
6000 && !MAY_HAVE_DEBUG_MARKER_INSNS)
6001 goto delink_debug_stmt;
6002 else if (gimple_debug_begin_stmt_p (stmt))
6003 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
6004 else if (gimple_debug_inline_entry_p (stmt))
6005 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
6006 else
6007 gcc_unreachable ();
6008
6009 last = get_last_insn ();
6010
6011 set_curr_insn_location (gimple_location (stmt));
6012
6013 emit_debug_insn (val);
6014
6015 if (dump_file && (dump_flags & TDF_DETAILS))
6016 {
6017 /* We can't dump the insn with a TREE where an RTX
6018 is expected. */
6019 if (GET_CODE (val) == VAR_LOCATION)
6020 {
6021 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
6022 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
6023 }
6024 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6025 if (GET_CODE (val) == VAR_LOCATION)
6026 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
6027 }
6028
6029 delink_debug_stmt:
6030 /* In order not to generate too many debug temporaries,
6031 we delink all uses of debug statements we already expanded.
6032 Therefore debug statements between definition and real
6033 use of TERed SSA names will continue to use the SSA name,
6034 and not be replaced with debug temps. */
6035 delink_stmt_imm_use (stmt);
6036
6037 gsi = nsi;
6038 gsi_next (&nsi);
6039 if (gsi_end_p (nsi))
6040 break;
6041 stmt = gsi_stmt (nsi);
6042 if (!is_gimple_debug (stmt))
6043 break;
6044 }
6045
6046 set_curr_insn_location (sloc);
6047 }
6048 else
6049 {
6050 gcall *call_stmt = dyn_cast <gcall *> (stmt);
6051 if (call_stmt
6052 && gimple_call_tail_p (call_stmt)
6053 && disable_tail_calls)
6054 gimple_call_set_tail (call_stmt, false);
6055
6056 if (call_stmt && gimple_call_tail_p (call_stmt))
6057 {
6058 bool can_fallthru;
6059 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
6060 if (new_bb)
6061 {
6062 if (can_fallthru)
6063 bb = new_bb;
6064 else
6065 return new_bb;
6066 }
6067 }
6068 else
6069 {
6070 def_operand_p def_p;
6071 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
6072
6073 if (def_p != NULL)
6074 {
6075 /* Ignore this stmt if it is in the list of
6076 replaceable expressions. */
6077 if (SA.values
6078 && bitmap_bit_p (SA.values,
6079 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
6080 continue;
6081 }
6082 last = expand_gimple_stmt (stmt);
6083 maybe_dump_rtl_for_gimple_stmt (stmt, last);
6084 }
6085 }
6086 }
6087
6088 currently_expanding_gimple_stmt = NULL;
6089
6090 /* Expand implicit goto and convert goto_locus. */
6091 FOR_EACH_EDGE (e, ei, bb->succs)
6092 {
6093 if (e->goto_locus != UNKNOWN_LOCATION || !stmt)
6094 set_curr_insn_location (e->goto_locus);
6095 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
6096 {
6097 emit_jump (label_rtx_for_bb (e->dest));
6098 e->flags &= ~EDGE_FALLTHRU;
6099 }
6100 }
6101
6102   /* Expanded RTL can create a jump in the last instruction of the block.
6103      This jump might later be assumed to be a jump to the successor and
6104      break edge insertion.  We need to insert a dummy move to prevent this.  PR41440.  */
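  /* The dummy inserted below is simply a self-move of a fresh pseudo,
     roughly (set (reg:SI n) (reg:SI n)); it is trivially dead, but it
     keeps the jump from being the last insn of the block.  */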
6105 if (single_succ_p (bb)
6106 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
6107 && (last = get_last_insn ())
6108 && (JUMP_P (last)
6109 || (DEBUG_INSN_P (last)
6110 && JUMP_P (prev_nondebug_insn (last)))))
6111 {
6112 rtx dummy = gen_reg_rtx (SImode);
6113 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
6114 }
6115
6116 do_pending_stack_adjust ();
6117
6118 /* Find the block tail. The last insn in the block is the insn
6119 before a barrier and/or table jump insn. */
6120 last = get_last_insn ();
6121 if (BARRIER_P (last))
6122 last = PREV_INSN (last);
6123 if (JUMP_TABLE_DATA_P (last))
6124 last = PREV_INSN (PREV_INSN (last));
6125 if (BARRIER_P (last))
6126 last = PREV_INSN (last);
6127 BB_END (bb) = last;
6128
6129 update_bb_for_insn (bb);
6130
6131 return bb;
6132 }
6133
6134
6135 /* Create a basic block for initialization code. */
6136
6137 static basic_block
6138 construct_init_block (void)
6139 {
6140 basic_block init_block, first_block;
6141 edge e = NULL;
6142 int flags;
6143
6144 /* Multiple entry points not supported yet. */
6145 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
6146 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
6147 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
6148 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6149 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
6150
6151 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
6152
6153   /* When the entry edge points to the first basic block, we don't need a
6154      jump; otherwise we have to jump to the proper target.  */
6155 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
6156 {
6157 tree label = gimple_block_label (e->dest);
6158
6159 emit_jump (jump_target_rtx (label));
6160 flags = 0;
6161 }
6162 else
6163 flags = EDGE_FALLTHRU;
6164
6165 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6166 get_last_insn (),
6167 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6168 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6169 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6170 if (e)
6171 {
6172 first_block = e->dest;
6173 redirect_edge_succ (e, init_block);
6174 make_single_succ_edge (init_block, first_block, flags);
6175 }
6176 else
6177 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6178 EDGE_FALLTHRU);
6179
6180 update_bb_for_insn (init_block);
6181 return init_block;
6182 }
6183
6184 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6185 found in the block tree. */
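/* E.g. the outermost BLOCK of the function gets level 0, its
   BLOCK_SUBBLOCKS level 1, their subblocks level 2, and so on; siblings
   reached through BLOCK_CHAIN share the same level.  */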
6186
6187 static void
6188 set_block_levels (tree block, int level)
6189 {
6190 while (block)
6191 {
6192 BLOCK_NUMBER (block) = level;
6193 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6194 block = BLOCK_CHAIN (block);
6195 }
6196 }
6197
6198 /* Create a block containing landing pads and similar stuff. */
6199
6200 static void
6201 construct_exit_block (void)
6202 {
6203 rtx_insn *head = get_last_insn ();
6204 rtx_insn *end;
6205 basic_block exit_block;
6206 edge e, e2;
6207 unsigned ix;
6208 edge_iterator ei;
6209 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6210 rtx_insn *orig_end = BB_END (prev_bb);
6211
6212 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6213
6214 /* Make sure the locus is set to the end of the function, so that
6215 epilogue line numbers and warnings are set properly. */
6216 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6217 input_location = cfun->function_end_locus;
6218
6219 /* Generate rtl for function exit. */
6220 expand_function_end ();
6221
6222 end = get_last_insn ();
6223 if (head == end)
6224 return;
6225   /* While emitting the function end we could have moved the end of the
6226      last basic block.  */
6227 BB_END (prev_bb) = orig_end;
6228 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6229 head = NEXT_INSN (head);
6230 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6231      bb count bookkeeping will be confused.  Any instructions before that
6232 label are emitted for the case where PREV_BB falls through into the
6233 exit block, so append those instructions to prev_bb in that case. */
6234 if (NEXT_INSN (head) != return_label)
6235 {
6236 while (NEXT_INSN (head) != return_label)
6237 {
6238 if (!NOTE_P (NEXT_INSN (head)))
6239 BB_END (prev_bb) = NEXT_INSN (head);
6240 head = NEXT_INSN (head);
6241 }
6242 }
6243 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6244 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6245 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6246
6247 ix = 0;
6248 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6249 {
6250 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6251 if (!(e->flags & EDGE_ABNORMAL))
6252 redirect_edge_succ (e, exit_block);
6253 else
6254 ix++;
6255 }
6256
6257 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6258 EDGE_FALLTHRU);
6259 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6260 if (e2 != e)
6261 {
6262 exit_block->count -= e2->count ();
6263 }
6264 update_bb_for_insn (exit_block);
6265 }
6266
6267 /* Helper function for discover_nonconstant_array_refs.
6268 Look for ARRAY_REF nodes with non-constant indexes and mark them
6269 addressable. */
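/* For instance (illustrative only): with
     int v[2];  ...  x = v[i];
   where I is not a compile-time constant, V (which might otherwise be
   small enough to live in a single register) is recorded here so that it
   is given a stack slot, since an ARRAY_REF with a variable index cannot
   be expanded out of a register.  */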
6270
6271 static tree
6272 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6273 void *data)
6274 {
6275 tree t = *tp;
6276 bitmap forced_stack_vars = (bitmap)((walk_stmt_info *)data)->info;
6277
6278 if (IS_TYPE_OR_DECL_P (t))
6279 *walk_subtrees = 0;
6280 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6281 {
6282 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6283 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6284 && (!TREE_OPERAND (t, 2)
6285 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6286 || (TREE_CODE (t) == COMPONENT_REF
6287 && (!TREE_OPERAND (t,2)
6288 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6289 || TREE_CODE (t) == BIT_FIELD_REF
6290 || TREE_CODE (t) == REALPART_EXPR
6291 || TREE_CODE (t) == IMAGPART_EXPR
6292 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6293 || CONVERT_EXPR_P (t))
6294 t = TREE_OPERAND (t, 0);
6295
6296 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6297 {
6298 t = get_base_address (t);
6299 if (t && DECL_P (t)
6300 && DECL_MODE (t) != BLKmode
6301 && !TREE_ADDRESSABLE (t))
6302 bitmap_set_bit (forced_stack_vars, DECL_UID (t));
6303 }
6304
6305 *walk_subtrees = 0;
6306 }
6307 /* References of size POLY_INT_CST to a fixed-size object must go
6308 through memory. It's more efficient to force that here than
6309 to create temporary slots on the fly.
6310      RTL expansion expects TARGET_MEM_REF to always address actual memory.  */
6311 else if (TREE_CODE (t) == TARGET_MEM_REF
6312 || (TREE_CODE (t) == MEM_REF
6313 && TYPE_SIZE (TREE_TYPE (t))
6314 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t)))))
6315 {
6316 tree base = get_base_address (t);
6317 if (base
6318 && DECL_P (base)
6319 && !TREE_ADDRESSABLE (base)
6320 && DECL_MODE (base) != BLKmode
6321 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6322 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6323 *walk_subtrees = 0;
6324 }
6325
6326 return NULL_TREE;
6327 }
6328
6329 /* If there's a chance that T gets a pseudo, and it would be of float mode
6330    while the actual access is via an integer mode (lowered memcpy or similar
6331    access), then avoid the register expansion if the mode is likely not
6332    suitable as storage for raw-bits processing (like XFmode on i?86).  */
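/* A hypothetical case (illustrative only): on i?86,
     long double d;  ...  memcpy (&u, &d, sizeof u);
   may be lowered to integer-mode accesses of D; if D were expanded into
   an XFmode register, those raw-bit accesses could not be carried out,
   so D is forced onto the stack instead.  */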
6333
6334 static void
6335 avoid_type_punning_on_regs (tree t, bitmap forced_stack_vars)
6336 {
6337 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6338 if (access_mode != BLKmode
6339 && !SCALAR_INT_MODE_P (access_mode))
6340 return;
6341 tree base = get_base_address (t);
6342 if (DECL_P (base)
6343 && !TREE_ADDRESSABLE (base)
6344 && FLOAT_MODE_P (DECL_MODE (base))
6345 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6346 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6347 /* Double check in the expensive way we really would get a pseudo. */
6348 && use_register_for_decl (base))
6349 bitmap_set_bit (forced_stack_vars, DECL_UID (base));
6350 }
6351
6352 /* RTL expansion is not able to compile array references with variable
6353    offsets for arrays stored in a single register.  Discover such
6354 expressions and mark variables as addressable to avoid this
6355 scenario. */
6356
6357 static void
6358 discover_nonconstant_array_refs (bitmap forced_stack_vars)
6359 {
6360 basic_block bb;
6361 gimple_stmt_iterator gsi;
6362
6363 walk_stmt_info wi = {};
6364 wi.info = forced_stack_vars;
6365 FOR_EACH_BB_FN (bb, cfun)
6366 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6367 {
6368 gimple *stmt = gsi_stmt (gsi);
6369 if (!is_gimple_debug (stmt))
6370 {
6371 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, &wi);
6372 gcall *call = dyn_cast <gcall *> (stmt);
6373 if (call && gimple_call_internal_p (call))
6374 {
6375 tree cand = NULL_TREE;
6376 switch (gimple_call_internal_fn (call))
6377 {
6378 case IFN_LOAD_LANES:
6379 /* The source must be a MEM. */
6380 cand = gimple_call_arg (call, 0);
6381 break;
6382 case IFN_STORE_LANES:
6383 /* The destination must be a MEM. */
6384 cand = gimple_call_lhs (call);
6385 break;
6386 default:
6387 break;
6388 }
6389 if (cand)
6390 cand = get_base_address (cand);
6391 if (cand
6392 && DECL_P (cand)
6393 && use_register_for_decl (cand))
6394 bitmap_set_bit (forced_stack_vars, DECL_UID (cand));
6395 }
6396 if (gimple_vdef (stmt))
6397 {
6398 tree t = gimple_get_lhs (stmt);
6399 if (t && REFERENCE_CLASS_P (t))
6400 avoid_type_punning_on_regs (t, forced_stack_vars);
6401 }
6402 }
6403 }
6404 }
6405
6406 /* This function sets crtl->args.internal_arg_pointer to a virtual
6407    register if DRAP is needed.  The local register allocator will replace
6408 virtual_incoming_args_rtx with the virtual register. */
6409
6410 static void
6411 expand_stack_alignment (void)
6412 {
6413 rtx drap_rtx;
6414 unsigned int preferred_stack_boundary;
6415
6416 if (! SUPPORTS_STACK_ALIGNMENT)
6417 return;
6418
6419 if (cfun->calls_alloca
6420 || cfun->has_nonlocal_label
6421 || crtl->has_nonlocal_goto)
6422 crtl->need_drap = true;
6423
6424 /* Call update_stack_boundary here again to update incoming stack
6425 boundary. It may set incoming stack alignment to a different
6426 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6427 use the minimum incoming stack alignment to check if it is OK
6428 to perform sibcall optimization since sibcall optimization will
6429 only align the outgoing stack to incoming stack boundary. */
6430 if (targetm.calls.update_stack_boundary)
6431 targetm.calls.update_stack_boundary ();
6432
6433 /* The incoming stack frame has to be aligned at least at
6434 parm_stack_boundary. */
6435 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6436
6437 /* Update crtl->stack_alignment_estimated and use it later to align
6438 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6439 exceptions since callgraph doesn't collect incoming stack alignment
6440 in this case. */
6441 if (cfun->can_throw_non_call_exceptions
6442 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6443 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6444 else
6445 preferred_stack_boundary = crtl->preferred_stack_boundary;
6446 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6447 crtl->stack_alignment_estimated = preferred_stack_boundary;
6448 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6449 crtl->stack_alignment_needed = preferred_stack_boundary;
6450
6451 gcc_assert (crtl->stack_alignment_needed
6452 <= crtl->stack_alignment_estimated);
6453
6454 crtl->stack_realign_needed
6455 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6456 crtl->stack_realign_tried = crtl->stack_realign_needed;
6457
6458 crtl->stack_realign_processed = true;
6459
6460 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6461 alignment. */
6462 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6463 drap_rtx = targetm.calls.get_drap_rtx ();
6464
6465 /* stack_realign_drap and drap_rtx must match. */
6466 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6467
6468 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6469 if (drap_rtx != NULL)
6470 {
6471 crtl->args.internal_arg_pointer = drap_rtx;
6472
6473 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6474 needed. */
6475 fixup_tail_calls ();
6476 }
6477 }
6478 \f
6479
6480 static void
6481 expand_main_function (void)
6482 {
6483 #if (defined(INVOKE__main) \
6484 || (!defined(HAS_INIT_SECTION) \
6485 && !defined(INIT_SECTION_ASM_OP) \
6486 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6487 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6488 #endif
6489 }
6490 \f
6491
6492 /* Expand code to initialize the stack_protect_guard. This is invoked at
6493 the beginning of a function to be protected. */
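/* Schematically (an illustration, not the exact emitted RTL), the
   prologue amounts to
     <canary slot in this frame> = <guard value>;
   i.e. a copy of the guard (e.g. __stack_chk_guard or a TLS slot) into
   crtl->stack_protect_guard, using a target pattern that avoids leaking
   the guard through a spilled register when one is available.  */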
6494
6495 static void
6496 stack_protect_prologue (void)
6497 {
6498 tree guard_decl = targetm.stack_protect_guard ();
6499 rtx x, y;
6500
6501 crtl->stack_protect_guard_decl = guard_decl;
6502 x = expand_normal (crtl->stack_protect_guard);
6503
6504 if (targetm.have_stack_protect_combined_set () && guard_decl)
6505 {
6506 gcc_assert (DECL_P (guard_decl));
6507 y = DECL_RTL (guard_decl);
6508
6509 /* Allow the target to compute address of Y and copy it to X without
6510 leaking Y into a register. This combined address + copy pattern
6511 allows the target to prevent spilling of any intermediate results by
6512	 splitting it after register allocation.  */
6513 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6514 {
6515 emit_insn (insn);
6516 return;
6517 }
6518 }
6519
6520 if (guard_decl)
6521 y = expand_normal (guard_decl);
6522 else
6523 y = const0_rtx;
6524
6525 /* Allow the target to copy from Y to X without leaking Y into a
6526 register. */
6527 if (targetm.have_stack_protect_set ())
6528 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6529 {
6530 emit_insn (insn);
6531 return;
6532 }
6533
6534 /* Otherwise do a straight move. */
6535 emit_move_insn (x, y);
6536 }
6537
6538 /* Translate the intermediate representation contained in the CFG
6539 from GIMPLE trees to RTL.
6540
6541 We do conversion per basic block and preserve/update the tree CFG.
6542 This implies we have to do some magic as the CFG can simultaneously
6543 consist of basic blocks containing RTL and GIMPLE trees. This can
6544 confuse the CFG hooks, so be careful to not manipulate CFG during
6545 the expansion. */
6546
6547 namespace {
6548
6549 const pass_data pass_data_expand =
6550 {
6551 RTL_PASS, /* type */
6552 "expand", /* name */
6553 OPTGROUP_NONE, /* optinfo_flags */
6554 TV_EXPAND, /* tv_id */
6555 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6556 | PROP_gimple_lcx
6557 | PROP_gimple_lvec
6558 | PROP_gimple_lva), /* properties_required */
6559 PROP_rtl, /* properties_provided */
6560 ( PROP_ssa | PROP_gimple ), /* properties_destroyed */
6561 0, /* todo_flags_start */
6562 0, /* todo_flags_finish */
6563 };
6564
6565 class pass_expand : public rtl_opt_pass
6566 {
6567 public:
6568 pass_expand (gcc::context *ctxt)
6569 : rtl_opt_pass (pass_data_expand, ctxt)
6570 {}
6571
6572 /* opt_pass methods: */
6573 virtual unsigned int execute (function *);
6574
6575 }; // class pass_expand
6576
6577 unsigned int
6578 pass_expand::execute (function *fun)
6579 {
6580 basic_block bb, init_block;
6581 edge_iterator ei;
6582 edge e;
6583 rtx_insn *var_seq, *var_ret_seq;
6584 unsigned i;
6585
6586 timevar_push (TV_OUT_OF_SSA);
6587 rewrite_out_of_ssa (&SA);
6588 timevar_pop (TV_OUT_OF_SSA);
6589 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6590
6591 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6592 {
6593 gimple_stmt_iterator gsi;
6594 FOR_EACH_BB_FN (bb, cfun)
6595 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6596 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6597 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6598 }
6599
6600 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6601 auto_bitmap forced_stack_vars;
6602 discover_nonconstant_array_refs (forced_stack_vars);
6603
6604 /* Make sure all values used by the optimization passes have sane
6605 defaults. */
6606 reg_renumber = 0;
6607
6608 /* Some backends want to know that we are expanding to RTL. */
6609 currently_expanding_to_rtl = 1;
6610 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6611 free_dominance_info (CDI_DOMINATORS);
6612
6613 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6614
6615 insn_locations_init ();
6616 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6617 {
6618 /* Eventually, all FEs should explicitly set function_start_locus. */
6619 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6620 set_curr_insn_location
6621 (DECL_SOURCE_LOCATION (current_function_decl));
6622 else
6623 set_curr_insn_location (fun->function_start_locus);
6624 }
6625 else
6626 set_curr_insn_location (UNKNOWN_LOCATION);
6627 prologue_location = curr_insn_location ();
6628
6629 #ifdef INSN_SCHEDULING
6630 init_sched_attrs ();
6631 #endif
6632
6633 /* Make sure first insn is a note even if we don't want linenums.
6634 This makes sure the first insn will never be deleted.
6635 Also, final expects a note to appear there. */
6636 emit_note (NOTE_INSN_DELETED);
6637
6638 targetm.expand_to_rtl_hook ();
6639 crtl->init_stack_alignment ();
6640 fun->cfg->max_jumptable_ents = 0;
6641
6642   /* Resolve the function section.  Some targets, like ARM EABI, rely on
6643      knowledge of the function section at expansion time to predict the distance of calls.  */
6644 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6645
6646 /* Expand the variables recorded during gimple lowering. */
6647 timevar_push (TV_VAR_EXPAND);
6648 start_sequence ();
6649
6650 var_ret_seq = expand_used_vars (forced_stack_vars);
6651
6652 var_seq = get_insns ();
6653 end_sequence ();
6654 timevar_pop (TV_VAR_EXPAND);
6655
6656 /* Honor stack protection warnings. */
6657 if (warn_stack_protect)
6658 {
6659 if (fun->calls_alloca)
6660 warning (OPT_Wstack_protector,
6661 "stack protector not protecting local variables: "
6662 "variable length buffer");
6663 if (has_short_buffer && !crtl->stack_protect_guard)
6664 warning (OPT_Wstack_protector,
6665 "stack protector not protecting function: "
6666 "all local arrays are less than %d bytes long",
6667 (int) param_ssp_buffer_size);
6668 }
6669
6670   /* Temporarily mark the PARM_DECLs and RESULT_DECLs we need to expand
6671      to memory as addressable, so that expand_function_start can emit the
6672      required copies.  */
6673 auto_vec<tree, 16> marked_parms;
6674 for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
6675 parm = DECL_CHAIN (parm))
6676 if (!TREE_ADDRESSABLE (parm)
6677 && bitmap_bit_p (forced_stack_vars, DECL_UID (parm)))
6678 {
6679 TREE_ADDRESSABLE (parm) = 1;
6680 marked_parms.safe_push (parm);
6681 }
6682 if (DECL_RESULT (current_function_decl)
6683 && !TREE_ADDRESSABLE (DECL_RESULT (current_function_decl))
6684 && bitmap_bit_p (forced_stack_vars,
6685 DECL_UID (DECL_RESULT (current_function_decl))))
6686 {
6687 TREE_ADDRESSABLE (DECL_RESULT (current_function_decl)) = 1;
6688 marked_parms.safe_push (DECL_RESULT (current_function_decl));
6689 }
6690
6691 /* Set up parameters and prepare for return, for the function. */
6692 expand_function_start (current_function_decl);
6693
6694 /* Clear TREE_ADDRESSABLE again. */
6695 while (!marked_parms.is_empty ())
6696 TREE_ADDRESSABLE (marked_parms.pop ()) = 0;
6697
6698 /* If we emitted any instructions for setting up the variables,
6699 emit them before the FUNCTION_START note. */
6700 if (var_seq)
6701 {
6702 emit_insn_before (var_seq, parm_birth_insn);
6703
6704 /* In expand_function_end we'll insert the alloca save/restore
6705	 before parm_birth_insn.  We've just inserted an alloca call.
6706 Adjust the pointer to match. */
6707 parm_birth_insn = var_seq;
6708 }
6709
6710 /* Now propagate the RTL assignment of each partition to the
6711 underlying var of each SSA_NAME. */
6712 tree name;
6713
6714 FOR_EACH_SSA_NAME (i, name, cfun)
6715 {
6716 /* We might have generated new SSA names in
6717	 update_alias_info_with_stack_vars.  They will have NULL
6718	 defining statements, and won't be part of the partitioning,
6719 so ignore those. */
6720 if (!SSA_NAME_DEF_STMT (name))
6721 continue;
6722
6723 adjust_one_expanded_partition_var (name);
6724 }
6725
6726 /* Clean up RTL of variables that straddle across multiple
6727 partitions, and check that the rtl of any PARM_DECLs that are not
6728 cleaned up is that of their default defs. */
6729 FOR_EACH_SSA_NAME (i, name, cfun)
6730 {
6731 int part;
6732
6733 /* We might have generated new SSA names in
6734	 update_alias_info_with_stack_vars.  They will have NULL
6735	 defining statements, and won't be part of the partitioning,
6736 so ignore those. */
6737 if (!SSA_NAME_DEF_STMT (name))
6738 continue;
6739 part = var_to_partition (SA.map, name);
6740 if (part == NO_PARTITION)
6741 continue;
6742
6743 /* If this decl was marked as living in multiple places, reset
6744 this now to NULL. */
6745 tree var = SSA_NAME_VAR (name);
6746 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6747 SET_DECL_RTL (var, NULL);
6748 /* Check that the pseudos chosen by assign_parms are those of
6749 the corresponding default defs. */
6750 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6751 && (TREE_CODE (var) == PARM_DECL
6752 || TREE_CODE (var) == RESULT_DECL))
6753 {
6754 rtx in = DECL_RTL_IF_SET (var);
6755 gcc_assert (in);
6756 rtx out = SA.partition_to_pseudo[part];
6757 gcc_assert (in == out);
6758
6759 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6760 those expected by debug backends for each parm and for
6761 the result. This is particularly important for stabs,
6762 whose register elimination from parm's DECL_RTL may cause
6763 -fcompare-debug differences as SET_DECL_RTL changes reg's
6764 attrs. So, make sure the RTL already has the parm as the
6765 EXPR, so that it won't change. */
6766 SET_DECL_RTL (var, NULL_RTX);
6767 if (MEM_P (in))
6768 set_mem_attributes (in, var, true);
6769 SET_DECL_RTL (var, in);
6770 }
6771 }
6772
6773 /* If this function is `main', emit a call to `__main'
6774 to run global initializers, etc. */
6775 if (DECL_NAME (current_function_decl)
6776 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6777 && DECL_FILE_SCOPE_P (current_function_decl))
6778 expand_main_function ();
6779
6780 /* Initialize the stack_protect_guard field. This must happen after the
6781 call to __main (if any) so that the external decl is initialized. */
6782 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6783 stack_protect_prologue ();
6784
6785 expand_phi_nodes (&SA);
6786
6787 /* Release any stale SSA redirection data. */
6788 redirect_edge_var_map_empty ();
6789
6790 /* Register rtl specific functions for cfg. */
6791 rtl_register_cfg_hooks ();
6792
6793 init_block = construct_init_block ();
6794
6795   /* Clear EDGE_EXECUTABLE on the entry edge(s).  It is cleared from the
6796 remaining edges later. */
6797 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6798 e->flags &= ~EDGE_EXECUTABLE;
6799
6800 /* If the function has too many markers, drop them while expanding. */
6801 if (cfun->debug_marker_count
6802 >= param_max_debug_marker_count)
6803 cfun->debug_nonbind_markers = false;
6804
6805 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6806 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6807 next_bb)
6808 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6809
6810 if (MAY_HAVE_DEBUG_BIND_INSNS)
6811 expand_debug_locations ();
6812
6813 if (deep_ter_debug_map)
6814 {
6815 delete deep_ter_debug_map;
6816 deep_ter_debug_map = NULL;
6817 }
6818
6819 /* Free stuff we no longer need after GIMPLE optimizations. */
6820 free_dominance_info (CDI_DOMINATORS);
6821 free_dominance_info (CDI_POST_DOMINATORS);
6822 delete_tree_cfg_annotations (fun);
6823
6824 timevar_push (TV_OUT_OF_SSA);
6825 finish_out_of_ssa (&SA);
6826 timevar_pop (TV_OUT_OF_SSA);
6827
6828 timevar_push (TV_POST_EXPAND);
6829 /* We are no longer in SSA form. */
6830 fun->gimple_df->in_ssa_p = false;
6831 loops_state_clear (LOOP_CLOSED_SSA);
6832
6833   /* Expansion is used by optimization passes too; set maybe_hot_insn_p
6834 conservatively to true until they are all profile aware. */
6835 delete lab_rtx_for_bb;
6836 free_histograms (fun);
6837
6838 construct_exit_block ();
6839 insn_locations_finalize ();
6840
6841 if (var_ret_seq)
6842 {
6843 rtx_insn *after = return_label;
6844 rtx_insn *next = NEXT_INSN (after);
6845 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6846 after = next;
6847 emit_insn_after (var_ret_seq, after);
6848 }
6849
6850 if (hwasan_sanitize_stack_p ())
6851 hwasan_maybe_emit_frame_base_init ();
6852
6853 /* Zap the tree EH table. */
6854 set_eh_throw_stmt_table (fun, NULL);
6855
6856   /* We need JUMP_LABEL to be set in order to redirect jumps, and hence
6857      to split edges, which edge insertions might do.  */
6858 rebuild_jump_labels (get_insns ());
6859
6860 /* If we have a single successor to the entry block, put the pending insns
6861      after parm birth, but before NOTE_INSN_FUNCTION_BEG.  */
6862 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6863 {
6864 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6865 if (e->insns.r)
6866 {
6867 rtx_insn *insns = e->insns.r;
6868 e->insns.r = NULL;
6869 rebuild_jump_labels_chain (insns);
6870 if (NOTE_P (parm_birth_insn)
6871 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6872 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6873 else
6874 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6875 }
6876 }
6877
6878 /* Otherwise, as well as for other edges, take the usual way. */
6879 commit_edge_insertions ();
6880
6881 /* We're done expanding trees to RTL. */
6882 currently_expanding_to_rtl = 0;
6883
6884 flush_mark_addressable_queue ();
6885
6886 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6887 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6888 {
6889 edge e;
6890 edge_iterator ei;
6891 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6892 {
6893 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6894 e->flags &= ~EDGE_EXECUTABLE;
6895
6896 /* At the moment not all abnormal edges match the RTL
6897 representation. It is safe to remove them here as
6898 find_many_sub_basic_blocks will rediscover them.
6899 In the future we should get this fixed properly. */
6900 if ((e->flags & EDGE_ABNORMAL)
6901 && !(e->flags & EDGE_SIBCALL))
6902 remove_edge (e);
6903 else
6904 ei_next (&ei);
6905 }
6906 }
6907
6908 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6909 bitmap_ones (blocks);
6910 find_many_sub_basic_blocks (blocks);
6911 purge_all_dead_edges ();
6912
6913 /* After initial rtl generation, call back to finish generating
6914 exception support code. We need to do this before cleaning up
6915 the CFG as the code does not expect dead landing pads. */
6916 if (fun->eh->region_tree != NULL)
6917 finish_eh_generation ();
6918
6919 /* Call expand_stack_alignment after finishing all
6920 updates to crtl->preferred_stack_boundary. */
6921 expand_stack_alignment ();
6922
6923 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6924 function. */
6925 if (crtl->tail_call_emit)
6926 fixup_tail_calls ();
6927
6928 HOST_WIDE_INT patch_area_size, patch_area_entry;
6929 parse_and_check_patch_area (flag_patchable_function_entry, false,
6930 &patch_area_size, &patch_area_entry);
6931
6932 tree patchable_function_entry_attr
6933 = lookup_attribute ("patchable_function_entry",
6934 DECL_ATTRIBUTES (cfun->decl));
6935 if (patchable_function_entry_attr)
6936 {
6937 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
6938 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
6939
6940 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
6941 patch_area_entry = 0;
6942 if (TREE_CHAIN (pp_val) != NULL_TREE)
6943 {
6944 tree patchable_function_entry_value2
6945 = TREE_VALUE (TREE_CHAIN (pp_val));
6946 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
6947 }
6948 }
6949
6950 if (patch_area_entry > patch_area_size)
6951 {
6952 if (patch_area_size > 0)
6953 warning (OPT_Wattributes,
6954 "patchable function entry %wu exceeds size %wu",
6955 patch_area_entry, patch_area_size);
6956 patch_area_entry = 0;
6957 }
6958
6959 crtl->patch_area_size = patch_area_size;
6960 crtl->patch_area_entry = patch_area_entry;
6961
6962 /* BB subdivision may have created basic blocks that are only reachable
6963 from unlikely bbs but not marked as such in the profile. */
6964 if (optimize)
6965 propagate_unlikely_bbs_forward ();
6966
6967 /* Remove unreachable blocks, otherwise we cannot compute dominators
6968 which are needed for loop state verification. As a side-effect
6969 this also compacts blocks.
6970 ??? We cannot remove trivially dead insns here as for example
6971 the DRAP reg on i?86 is not magically live at this point.
6972 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6973 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6974
6975 checking_verify_flow_info ();
6976
6977 /* Initialize pseudos allocated for hard registers. */
6978 emit_initial_value_sets ();
6979
6980 /* And finally unshare all RTL. */
6981 unshare_all_rtl ();
6982
6983 /* There's no need to defer outputting this function any more; we
6984 know we want to output it. */
6985 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6986
6987 /* Now that we're done expanding trees to RTL, we shouldn't have any
6988 more CONCATs anywhere. */
6989 generating_concat_p = 0;
6990
6991 if (dump_file)
6992 {
6993 fprintf (dump_file,
6994 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6995 /* And the pass manager will dump RTL for us. */
6996 }
6997
6998 /* If we're emitting a nested function, make sure its parent gets
6999 emitted as well. Doing otherwise confuses debug info. */
7000 {
7001 tree parent;
7002 for (parent = DECL_CONTEXT (current_function_decl);
7003 parent != NULL_TREE;
7004 parent = get_containing_scope (parent))
7005 if (TREE_CODE (parent) == FUNCTION_DECL)
7006 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
7007 }
7008
7009 TREE_ASM_WRITTEN (current_function_decl) = 1;
7010
7011 /* After expanding, the return labels are no longer needed. */
7012 return_label = NULL;
7013 naked_return_label = NULL;
7014
7015 /* After expanding, the tm_restart map is no longer needed. */
7016 if (fun->gimple_df->tm_restart)
7017 fun->gimple_df->tm_restart = NULL;
7018
7019 /* Tag the blocks with a depth number so that change_scope can find
7020 the common parent easily. */
7021 set_block_levels (DECL_INITIAL (fun->decl), 0);
7022 default_rtl_profile ();
7023
7024 /* For -dx discard loops now, otherwise IL verify in clean_state will
7025 ICE. */
7026 if (rtl_dump_and_exit)
7027 {
7028 cfun->curr_properties &= ~PROP_loops;
7029 loop_optimizer_finalize ();
7030 }
7031
7032 timevar_pop (TV_POST_EXPAND);
7033
7034 return 0;
7035 }
7036
7037 } // anon namespace
7038
7039 rtl_opt_pass *
7040 make_pass_expand (gcc::context *ctxt)
7041 {
7042 return new pass_expand (ctxt);
7043 }