1 /* Expands front end tree to back end RTL for GCC.
2 Copyright (C) 1987-2019 Free Software Foundation, Inc.
3
4 This file is part of GCC.
5
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
10
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
19
20 /* This file handles the generation of rtl code from tree structure
21 at the level of the function as a whole.
22 It creates the rtl expressions for parameters and auto variables
23 and has full responsibility for allocating stack slots.
24
25 `expand_function_start' is called at the beginning of a function,
26 before the function body is parsed, and `expand_function_end' is
27 called after parsing the body.
28
29 Call `assign_stack_local' to allocate a stack slot for a local variable.
30 This is usually done during the RTL generation for the function body,
31 but it can also be done in the reload pass when a pseudo-register does
32 not get a hard register. */
33
34 #include "config.h"
35 #include "system.h"
36 #include "coretypes.h"
37 #include "backend.h"
38 #include "target.h"
39 #include "rtl.h"
40 #include "tree.h"
41 #include "gimple-expr.h"
42 #include "cfghooks.h"
43 #include "df.h"
44 #include "memmodel.h"
45 #include "tm_p.h"
46 #include "stringpool.h"
47 #include "expmed.h"
48 #include "optabs.h"
49 #include "regs.h"
50 #include "emit-rtl.h"
51 #include "recog.h"
52 #include "rtl-error.h"
53 #include "alias.h"
54 #include "fold-const.h"
55 #include "stor-layout.h"
56 #include "varasm.h"
57 #include "except.h"
58 #include "dojump.h"
59 #include "explow.h"
60 #include "calls.h"
61 #include "expr.h"
62 #include "optabs-tree.h"
63 #include "output.h"
64 #include "langhooks.h"
65 #include "common/common-target.h"
66 #include "gimplify.h"
67 #include "tree-pass.h"
68 #include "cfgrtl.h"
69 #include "cfganal.h"
70 #include "cfgbuild.h"
71 #include "cfgcleanup.h"
72 #include "cfgexpand.h"
73 #include "shrink-wrap.h"
74 #include "toplev.h"
75 #include "rtl-iter.h"
76 #include "tree-dfa.h"
77 #include "tree-ssa.h"
78 #include "stringpool.h"
79 #include "attribs.h"
80 #include "gimple.h"
81 #include "options.h"
82
83 /* So we can assign to cfun in this file. */
84 #undef cfun
85
86 #ifndef STACK_ALIGNMENT_NEEDED
87 #define STACK_ALIGNMENT_NEEDED 1
88 #endif
89
90 #define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)
91
92 /* Round a value down to the largest multiple of the required alignment
93 that does not exceed it. Avoid using division in case the value is
94 negative. Assume the alignment is a power of two. */
95 #define FLOOR_ROUND(VALUE,ALIGN) ((VALUE) & ~((ALIGN) - 1))
96
97 /* Similar, but round to the next highest integer that meets the
98 alignment. */
99 #define CEIL_ROUND(VALUE,ALIGN) (((VALUE) + (ALIGN) - 1) & ~((ALIGN)- 1))
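/* A worked example with illustrative numbers: for ALIGN == 8,
   FLOOR_ROUND (13, 8) == (13 & ~7) == 8, while
   CEIL_ROUND (13, 8) == ((13 + 7) & ~7) == 16.  A value that is already
   a multiple of the alignment is left unchanged by both macros:
   FLOOR_ROUND (16, 8) == CEIL_ROUND (16, 8) == 16.  */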
100
101 /* Nonzero once virtual register instantiation has been done.
102 assign_stack_local uses frame_pointer_rtx when this is nonzero.
103 calls.c:emit_library_call_value_1 uses it to set up
104 post-instantiation libcalls. */
105 int virtuals_instantiated;
106
107 /* Assign unique numbers to labels generated for profiling, debugging, etc. */
108 static GTY(()) int funcdef_no;
109
110 /* These variables hold pointers to functions to create and destroy
111 target specific, per-function data structures. */
112 struct machine_function * (*init_machine_status) (void);
113
114 /* The currently compiled function. */
115 struct function *cfun = 0;
116
117 /* These hashes record the prologue and epilogue insns. */
118
119 struct insn_cache_hasher : ggc_cache_ptr_hash<rtx_def>
120 {
121 static hashval_t hash (rtx x) { return htab_hash_pointer (x); }
122 static bool equal (rtx a, rtx b) { return a == b; }
123 };
124
125 static GTY((cache))
126 hash_table<insn_cache_hasher> *prologue_insn_hash;
127 static GTY((cache))
128 hash_table<insn_cache_hasher> *epilogue_insn_hash;
129 \f
130
131 hash_table<used_type_hasher> *types_used_by_vars_hash = NULL;
132 vec<tree, va_gc> *types_used_by_cur_var_decl;
133
134 /* Forward declarations. */
135
136 static class temp_slot *find_temp_slot_from_address (rtx);
137 static void pad_to_arg_alignment (struct args_size *, int, struct args_size *);
138 static void pad_below (struct args_size *, machine_mode, tree);
139 static void reorder_blocks_1 (rtx_insn *, tree, vec<tree> *);
140 static int all_blocks (tree, tree *);
141 static tree *get_block_vector (tree, int *);
142 extern tree debug_find_var_in_block_tree (tree, tree);
143 /* We always define `record_insns' even if it's not used so that we
144 can always export `prologue_epilogue_contains'. */
145 static void record_insns (rtx_insn *, rtx, hash_table<insn_cache_hasher> **)
146 ATTRIBUTE_UNUSED;
147 static bool contains (const rtx_insn *, hash_table<insn_cache_hasher> *);
148 static void prepare_function_start (void);
149 static void do_clobber_return_reg (rtx, void *);
150 static void do_use_return_reg (rtx, void *);
151
152 \f
153 /* Stack of nested functions. */
154 /* Keep track of the cfun stack. */
155
156 static vec<function *> function_context_stack;
157
158 /* Save the current context for compilation of a nested function.
159 This is called from language-specific code. */
160
161 void
162 push_function_context (void)
163 {
164 if (cfun == 0)
165 allocate_struct_function (NULL, false);
166
167 function_context_stack.safe_push (cfun);
168 set_cfun (NULL);
169 }
170
171 /* Restore the last saved context, at the end of a nested function.
172 This function is called from language-specific code. */
173
174 void
175 pop_function_context (void)
176 {
177 struct function *p = function_context_stack.pop ();
178 set_cfun (p);
179 current_function_decl = p->decl;
180
181 /* Reset variables that have known state during rtx generation. */
182 virtuals_instantiated = 0;
183 generating_concat_p = 1;
184 }
185
186 /* Clear out all parts of the state in F that can safely be discarded
187 after the function has been parsed, but not compiled, to let
188 garbage collection reclaim the memory. */
189
190 void
191 free_after_parsing (struct function *f)
192 {
193 f->language = 0;
194 }
195
196 /* Clear out all parts of the state in F that can safely be discarded
197 after the function has been compiled, to let garbage collection
198 reclaim the memory. */
199
200 void
201 free_after_compilation (struct function *f)
202 {
203 prologue_insn_hash = NULL;
204 epilogue_insn_hash = NULL;
205
206 free (crtl->emit.regno_pointer_align);
207
208 memset (crtl, 0, sizeof (struct rtl_data));
209 f->eh = NULL;
210 f->machine = NULL;
211 f->cfg = NULL;
212 f->curr_properties &= ~PROP_cfg;
213
214 regno_reg_rtx = NULL;
215 }
216 \f
217 /* Return size needed for stack frame based on slots so far allocated.
218 This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY;
219 the caller may have to do that. */
220
221 poly_int64
222 get_frame_size (void)
223 {
224 if (FRAME_GROWS_DOWNWARD)
225 return -frame_offset;
226 else
227 return frame_offset;
228 }
229
230 /* Issue an error message and return TRUE if frame OFFSET overflows in
231 the signed target pointer arithmetic for function FUNC. Otherwise
232 return FALSE. */
233
234 bool
235 frame_offset_overflow (poly_int64 offset, tree func)
236 {
237 poly_uint64 size = FRAME_GROWS_DOWNWARD ? -offset : offset;
238 unsigned HOST_WIDE_INT limit
239 = ((HOST_WIDE_INT_1U << (GET_MODE_BITSIZE (Pmode) - 1))
240 /* Leave room for the fixed part of the frame. */
241 - 64 * UNITS_PER_WORD);
242
243 if (!coeffs_in_range_p (size, 0U, limit))
244 {
245 unsigned HOST_WIDE_INT hwisize;
246 if (size.is_constant (&hwisize))
247 error_at (DECL_SOURCE_LOCATION (func),
248 "total size of local objects %wu exceeds maximum %wu",
249 hwisize, limit);
250 else
251 error_at (DECL_SOURCE_LOCATION (func),
252 "total size of local objects exceeds maximum %wu",
253 limit);
254 return true;
255 }
256
257 return false;
258 }
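/* Purely for illustration, assuming a target with a 32-bit Pmode and
   UNITS_PER_WORD == 4 (an assumption, not a statement about any particular
   port): the limit computed above is (1 << 31) - 64 * 4 == 2147483392
   bytes, so a function whose local objects total more than that is
   rejected with the error above.  */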
259
260 /* Return the minimum spill slot alignment for a register of mode MODE. */
261
262 unsigned int
263 spill_slot_alignment (machine_mode mode ATTRIBUTE_UNUSED)
264 {
265 return STACK_SLOT_ALIGNMENT (NULL_TREE, mode, GET_MODE_ALIGNMENT (mode));
266 }
267
268 /* Return stack slot alignment in bits for TYPE and MODE. */
269
270 static unsigned int
271 get_stack_local_alignment (tree type, machine_mode mode)
272 {
273 unsigned int alignment;
274
275 if (mode == BLKmode)
276 alignment = BIGGEST_ALIGNMENT;
277 else
278 alignment = GET_MODE_ALIGNMENT (mode);
279
280 /* Allow the front end to (possibly) increase the alignment of this
281 stack slot. */
282 if (! type)
283 type = lang_hooks.types.type_for_mode (mode, 0);
284
285 return STACK_SLOT_ALIGNMENT (type, mode, alignment);
286 }
287
288 /* Determine whether it is possible to fit a stack slot of size SIZE and
289 alignment ALIGNMENT into an area in the stack frame that starts at
290 frame offset START and has a length of LENGTH. If so, store the frame
291 offset to be used for the stack slot in *POFFSET and return true;
292 return false otherwise. This function will extend the frame size when
293 given a start/length pair that lies at the end of the frame. */
294
295 static bool
296 try_fit_stack_local (poly_int64 start, poly_int64 length,
297 poly_int64 size, unsigned int alignment,
298 poly_int64_pod *poffset)
299 {
300 poly_int64 this_frame_offset;
301 int frame_off, frame_alignment, frame_phase;
302
303 /* Calculate how many bytes the start of local variables is off from
304 stack alignment. */
305 frame_alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
306 frame_off = targetm.starting_frame_offset () % frame_alignment;
307 frame_phase = frame_off ? frame_alignment - frame_off : 0;
308
309 /* Round the frame offset to the specified alignment. */
310
311 if (FRAME_GROWS_DOWNWARD)
312 this_frame_offset
313 = (aligned_lower_bound (start + length - size - frame_phase, alignment)
314 + frame_phase);
315 else
316 this_frame_offset
317 = aligned_upper_bound (start - frame_phase, alignment) + frame_phase;
318
319 /* See if it fits. If this space is at the edge of the frame,
320 consider extending the frame to make it fit. Our caller relies on
321 this when allocating a new slot. */
322 if (maybe_lt (this_frame_offset, start))
323 {
324 if (known_eq (frame_offset, start))
325 frame_offset = this_frame_offset;
326 else
327 return false;
328 }
329 else if (maybe_gt (this_frame_offset + size, start + length))
330 {
331 if (known_eq (frame_offset, start + length))
332 frame_offset = this_frame_offset + size;
333 else
334 return false;
335 }
336
337 *poffset = this_frame_offset;
338 return true;
339 }
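/* A minimal worked example, assuming FRAME_GROWS_DOWNWARD and a zero
   frame phase, with purely illustrative numbers: for START == -32,
   LENGTH == 16, SIZE == 8 and ALIGNMENT == 8, the code above computes
   aligned_lower_bound (-32 + 16 - 8, 8) == -24.  The slot [-24, -16)
   lies inside the area [-32, -16), so *POFFSET is set to -24 and true
   is returned without extending the frame.  */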
340
341 /* Create a new frame_space structure describing free space in the stack
342 frame beginning at START and ending at END, and chain it into the
343 function's frame_space_list. */
344
345 static void
346 add_frame_space (poly_int64 start, poly_int64 end)
347 {
348 class frame_space *space = ggc_alloc<frame_space> ();
349 space->next = crtl->frame_space_list;
350 crtl->frame_space_list = space;
351 space->start = start;
352 space->length = end - start;
353 }
354
355 /* Allocate a stack slot of SIZE bytes and return a MEM rtx for it
356 with machine mode MODE.
357
358 ALIGN controls the amount of alignment for the address of the slot:
359 0 means according to MODE,
360 -1 means use BIGGEST_ALIGNMENT and round size to multiple of that,
361 -2 means use BITS_PER_UNIT,
362 positive specifies alignment boundary in bits.
363
364 KIND has ASLK_REDUCE_ALIGN bit set if it is OK to reduce
365 alignment and ASLK_RECORD_PAD bit set if we should remember
366 extra space we allocated for alignment purposes. When we are
367 called from assign_stack_temp_for_type, it is not set so we don't
368 track the same stack slot in two independent lists.
369
370 We do not round to stack_boundary here. */
371
372 rtx
373 assign_stack_local_1 (machine_mode mode, poly_int64 size,
374 int align, int kind)
375 {
376 rtx x, addr;
377 poly_int64 bigend_correction = 0;
378 poly_int64 slot_offset = 0, old_frame_offset;
379 unsigned int alignment, alignment_in_bits;
380
381 if (align == 0)
382 {
383 alignment = get_stack_local_alignment (NULL, mode);
384 alignment /= BITS_PER_UNIT;
385 }
386 else if (align == -1)
387 {
388 alignment = BIGGEST_ALIGNMENT / BITS_PER_UNIT;
389 size = aligned_upper_bound (size, alignment);
390 }
391 else if (align == -2)
392 alignment = 1; /* BITS_PER_UNIT / BITS_PER_UNIT */
393 else
394 alignment = align / BITS_PER_UNIT;
395
396 alignment_in_bits = alignment * BITS_PER_UNIT;
397
398 /* Ignore alignment if it exceeds MAX_SUPPORTED_STACK_ALIGNMENT. */
399 if (alignment_in_bits > MAX_SUPPORTED_STACK_ALIGNMENT)
400 {
401 alignment_in_bits = MAX_SUPPORTED_STACK_ALIGNMENT;
402 alignment = MAX_SUPPORTED_STACK_ALIGNMENT / BITS_PER_UNIT;
403 }
404
405 if (SUPPORTS_STACK_ALIGNMENT)
406 {
407 if (crtl->stack_alignment_estimated < alignment_in_bits)
408 {
409 if (!crtl->stack_realign_processed)
410 crtl->stack_alignment_estimated = alignment_in_bits;
411 else
412 {
413 /* If stack is realigned and stack alignment value
414 hasn't been finalized, it is OK not to increase
415 stack_alignment_estimated. The bigger alignment
416 requirement is recorded in stack_alignment_needed
417 below. */
418 gcc_assert (!crtl->stack_realign_finalized);
419 if (!crtl->stack_realign_needed)
420 {
421 /* It is OK to reduce the alignment as long as the
422 requested size is 0 or the estimated stack
423 alignment >= mode alignment. */
424 gcc_assert ((kind & ASLK_REDUCE_ALIGN)
425 || known_eq (size, 0)
426 || (crtl->stack_alignment_estimated
427 >= GET_MODE_ALIGNMENT (mode)));
428 alignment_in_bits = crtl->stack_alignment_estimated;
429 alignment = alignment_in_bits / BITS_PER_UNIT;
430 }
431 }
432 }
433 }
434
435 if (crtl->stack_alignment_needed < alignment_in_bits)
436 crtl->stack_alignment_needed = alignment_in_bits;
437 if (crtl->max_used_stack_slot_alignment < alignment_in_bits)
438 crtl->max_used_stack_slot_alignment = alignment_in_bits;
439
440 if (mode != BLKmode || maybe_ne (size, 0))
441 {
442 if (kind & ASLK_RECORD_PAD)
443 {
444 class frame_space **psp;
445
446 for (psp = &crtl->frame_space_list; *psp; psp = &(*psp)->next)
447 {
448 class frame_space *space = *psp;
449 if (!try_fit_stack_local (space->start, space->length, size,
450 alignment, &slot_offset))
451 continue;
452 *psp = space->next;
453 if (known_gt (slot_offset, space->start))
454 add_frame_space (space->start, slot_offset);
455 if (known_lt (slot_offset + size, space->start + space->length))
456 add_frame_space (slot_offset + size,
457 space->start + space->length);
458 goto found_space;
459 }
460 }
461 }
462 else if (!STACK_ALIGNMENT_NEEDED)
463 {
464 slot_offset = frame_offset;
465 goto found_space;
466 }
467
468 old_frame_offset = frame_offset;
469
470 if (FRAME_GROWS_DOWNWARD)
471 {
472 frame_offset -= size;
473 try_fit_stack_local (frame_offset, size, size, alignment, &slot_offset);
474
475 if (kind & ASLK_RECORD_PAD)
476 {
477 if (known_gt (slot_offset, frame_offset))
478 add_frame_space (frame_offset, slot_offset);
479 if (known_lt (slot_offset + size, old_frame_offset))
480 add_frame_space (slot_offset + size, old_frame_offset);
481 }
482 }
483 else
484 {
485 frame_offset += size;
486 try_fit_stack_local (old_frame_offset, size, size, alignment, &slot_offset);
487
488 if (kind & ASLK_RECORD_PAD)
489 {
490 if (known_gt (slot_offset, old_frame_offset))
491 add_frame_space (old_frame_offset, slot_offset);
492 if (known_lt (slot_offset + size, frame_offset))
493 add_frame_space (slot_offset + size, frame_offset);
494 }
495 }
496
497 found_space:
498 /* On a big-endian machine, if we are allocating more space than we will use,
499 use the least significant bytes of those that are allocated. */
500 if (mode != BLKmode)
501 {
502 /* The slot size can sometimes be smaller than the mode size;
503 e.g. the rs6000 port allocates slots with a vector mode
504 that have the size of only one element. However, the slot
505 size must always be ordered wrt the mode size, in the
506 same way as for a subreg. */
507 gcc_checking_assert (ordered_p (GET_MODE_SIZE (mode), size));
508 if (BYTES_BIG_ENDIAN && maybe_lt (GET_MODE_SIZE (mode), size))
509 bigend_correction = size - GET_MODE_SIZE (mode);
510 }
511
512 /* If we have already instantiated virtual registers, return the actual
513 address relative to the frame pointer. */
514 if (virtuals_instantiated)
515 addr = plus_constant (Pmode, frame_pointer_rtx,
516 trunc_int_for_mode
517 (slot_offset + bigend_correction
518 + targetm.starting_frame_offset (), Pmode));
519 else
520 addr = plus_constant (Pmode, virtual_stack_vars_rtx,
521 trunc_int_for_mode
522 (slot_offset + bigend_correction,
523 Pmode));
524
525 x = gen_rtx_MEM (mode, addr);
526 set_mem_align (x, alignment_in_bits);
527 MEM_NOTRAP_P (x) = 1;
528
529 vec_safe_push (stack_slot_list, x);
530
531 if (frame_offset_overflow (frame_offset, current_function_decl))
532 frame_offset = 0;
533
534 return x;
535 }
536
537 /* Wrapper around assign_stack_local_1 that passes ASLK_RECORD_PAD for KIND. */
538
539 rtx
540 assign_stack_local (machine_mode mode, poly_int64 size, int align)
541 {
542 return assign_stack_local_1 (mode, size, align, ASLK_RECORD_PAD);
543 }
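/* Illustrative use only, not taken from a particular caller: code that
   needs a word-sized local slot with the default mode-derived alignment
   might write

     rtx slot = assign_stack_local (word_mode, UNITS_PER_WORD, 0);

   and then use SLOT as the memory operand of later moves.  Passing -1
   for ALIGN instead would force BIGGEST_ALIGNMENT and round the size up
   accordingly.  */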
544 \f
545 /* In order to evaluate some expressions, such as function calls returning
546 structures in memory, we need to temporarily allocate stack locations.
547 We record each allocated temporary in the following structure.
548
549 Associated with each temporary slot is a nesting level. When we pop up
550 one level, all temporaries associated with the previous level are freed.
551 Normally, all temporaries are freed after the execution of the statement
552 in which they were created. However, if we are inside a ({...}) grouping,
553 the result may be in a temporary and hence must be preserved. If the
554 result could be in a temporary, we preserve it if we can determine which
555 one it is in. If we cannot determine which temporary may contain the
556 result, all temporaries are preserved. A temporary is preserved by
557 pretending it was allocated at the previous nesting level. */
558
559 class GTY(()) temp_slot {
560 public:
561 /* Points to next temporary slot. */
562 class temp_slot *next;
563 /* Points to previous temporary slot. */
564 class temp_slot *prev;
565 /* The rtx used to reference the slot. */
566 rtx slot;
567 /* The size, in units, of the slot. */
568 poly_int64 size;
569 /* The type of the object in the slot, or zero if it doesn't correspond
570 to a type. We use this to determine whether a slot can be reused.
571 It can be reused if objects of the type of the new slot will always
572 conflict with objects of the type of the old slot. */
573 tree type;
574 /* The alignment (in bits) of the slot. */
575 unsigned int align;
576 /* Nonzero if this temporary is currently in use. */
577 char in_use;
578 /* Nesting level at which this slot is being used. */
579 int level;
580 /* The offset of the slot from the frame_pointer, including extra space
581 for alignment. This info is for combine_temp_slots. */
582 poly_int64 base_offset;
583 /* The size of the slot, including extra space for alignment. This
584 info is for combine_temp_slots. */
585 poly_int64 full_size;
586 };
587
588 /* Entry for the below hash table. */
589 struct GTY((for_user)) temp_slot_address_entry {
590 hashval_t hash;
591 rtx address;
592 class temp_slot *temp_slot;
593 };
594
595 struct temp_address_hasher : ggc_ptr_hash<temp_slot_address_entry>
596 {
597 static hashval_t hash (temp_slot_address_entry *);
598 static bool equal (temp_slot_address_entry *, temp_slot_address_entry *);
599 };
600
601 /* A table of addresses that represent a stack slot. The table is a mapping
602 from address RTXen to a temp slot. */
603 static GTY(()) hash_table<temp_address_hasher> *temp_slot_address_table;
604 static size_t n_temp_slots_in_use;
605
606 /* Removes temporary slot TEMP from LIST. */
607
608 static void
609 cut_slot_from_list (class temp_slot *temp, class temp_slot **list)
610 {
611 if (temp->next)
612 temp->next->prev = temp->prev;
613 if (temp->prev)
614 temp->prev->next = temp->next;
615 else
616 *list = temp->next;
617
618 temp->prev = temp->next = NULL;
619 }
620
621 /* Inserts temporary slot TEMP to LIST. */
622
623 static void
624 insert_slot_to_list (class temp_slot *temp, class temp_slot **list)
625 {
626 temp->next = *list;
627 if (*list)
628 (*list)->prev = temp;
629 temp->prev = NULL;
630 *list = temp;
631 }
632
633 /* Returns the list of used temp slots at LEVEL. */
634
635 static class temp_slot **
636 temp_slots_at_level (int level)
637 {
638 if (level >= (int) vec_safe_length (used_temp_slots))
639 vec_safe_grow_cleared (used_temp_slots, level + 1);
640
641 return &(*used_temp_slots)[level];
642 }
643
644 /* Returns the maximal temporary slot level. */
645
646 static int
647 max_slot_level (void)
648 {
649 if (!used_temp_slots)
650 return -1;
651
652 return used_temp_slots->length () - 1;
653 }
654
655 /* Moves temporary slot TEMP to LEVEL. */
656
657 static void
658 move_slot_to_level (class temp_slot *temp, int level)
659 {
660 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
661 insert_slot_to_list (temp, temp_slots_at_level (level));
662 temp->level = level;
663 }
664
665 /* Make temporary slot TEMP available. */
666
667 static void
668 make_slot_available (class temp_slot *temp)
669 {
670 cut_slot_from_list (temp, temp_slots_at_level (temp->level));
671 insert_slot_to_list (temp, &avail_temp_slots);
672 temp->in_use = 0;
673 temp->level = -1;
674 n_temp_slots_in_use--;
675 }
676
677 /* Compute the hash value for an address -> temp slot mapping.
678 The value is cached on the mapping entry. */
679 static hashval_t
680 temp_slot_address_compute_hash (struct temp_slot_address_entry *t)
681 {
682 int do_not_record = 0;
683 return hash_rtx (t->address, GET_MODE (t->address),
684 &do_not_record, NULL, false);
685 }
686
687 /* Return the hash value for an address -> temp slot mapping. */
688 hashval_t
689 temp_address_hasher::hash (temp_slot_address_entry *t)
690 {
691 return t->hash;
692 }
693
694 /* Compare two address -> temp slot mapping entries. */
695 bool
696 temp_address_hasher::equal (temp_slot_address_entry *t1,
697 temp_slot_address_entry *t2)
698 {
699 return exp_equiv_p (t1->address, t2->address, 0, true);
700 }
701
702 /* Add ADDRESS as an alias of TEMP_SLOT to the address -> temp slot mapping. */
703 static void
704 insert_temp_slot_address (rtx address, class temp_slot *temp_slot)
705 {
706 struct temp_slot_address_entry *t = ggc_alloc<temp_slot_address_entry> ();
707 t->address = copy_rtx (address);
708 t->temp_slot = temp_slot;
709 t->hash = temp_slot_address_compute_hash (t);
710 *temp_slot_address_table->find_slot_with_hash (t, t->hash, INSERT) = t;
711 }
712
713 /* Remove an address -> temp slot mapping entry if the temp slot is
714 not in use anymore. Callback for remove_unused_temp_slot_addresses. */
715 int
716 remove_unused_temp_slot_addresses_1 (temp_slot_address_entry **slot, void *)
717 {
718 const struct temp_slot_address_entry *t = *slot;
719 if (! t->temp_slot->in_use)
720 temp_slot_address_table->clear_slot (slot);
721 return 1;
722 }
723
724 /* Remove all mappings of addresses to unused temp slots. */
725 static void
726 remove_unused_temp_slot_addresses (void)
727 {
728 /* Use quicker clearing if there aren't any active temp slots. */
729 if (n_temp_slots_in_use)
730 temp_slot_address_table->traverse
731 <void *, remove_unused_temp_slot_addresses_1> (NULL);
732 else
733 temp_slot_address_table->empty ();
734 }
735
736 /* Find the temp slot corresponding to the object at address X. */
737
738 static class temp_slot *
739 find_temp_slot_from_address (rtx x)
740 {
741 class temp_slot *p;
742 struct temp_slot_address_entry tmp, *t;
743
744 /* First try the easy way:
745 See if X exists in the address -> temp slot mapping. */
746 tmp.address = x;
747 tmp.temp_slot = NULL;
748 tmp.hash = temp_slot_address_compute_hash (&tmp);
749 t = temp_slot_address_table->find_with_hash (&tmp, tmp.hash);
750 if (t)
751 return t->temp_slot;
752
753 /* If we have a sum involving a register, see if it points to a temp
754 slot. */
755 if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 0))
756 && (p = find_temp_slot_from_address (XEXP (x, 0))) != 0)
757 return p;
758 else if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 1))
759 && (p = find_temp_slot_from_address (XEXP (x, 1))) != 0)
760 return p;
761
762 /* Last resort: Address is a virtual stack var address. */
763 poly_int64 offset;
764 if (strip_offset (x, &offset) == virtual_stack_vars_rtx)
765 {
766 int i;
767 for (i = max_slot_level (); i >= 0; i--)
768 for (p = *temp_slots_at_level (i); p; p = p->next)
769 if (known_in_range_p (offset, p->base_offset, p->full_size))
770 return p;
771 }
772
773 return NULL;
774 }
775 \f
776 /* Allocate a temporary stack slot and record it for possible later
777 reuse.
778
779 MODE is the machine mode to be given to the returned rtx.
780
781 SIZE is the size in units of the space required. We do no rounding here
782 since assign_stack_local will do any required rounding.
783
784 TYPE is the type that will be used for the stack slot. */
785
786 rtx
787 assign_stack_temp_for_type (machine_mode mode, poly_int64 size, tree type)
788 {
789 unsigned int align;
790 class temp_slot *p, *best_p = 0, *selected = NULL, **pp;
791 rtx slot;
792
793 gcc_assert (known_size_p (size));
794
795 align = get_stack_local_alignment (type, mode);
796
797 /* Try to find an available, already-allocated temporary of the proper
798 mode which meets the size and alignment requirements. Choose the
799 smallest one with the closest alignment.
800
801 If assign_stack_temp is called outside of the tree->rtl expansion,
802 we cannot reuse the stack slots (that may still refer to
803 VIRTUAL_STACK_VARS_REGNUM). */
804 if (!virtuals_instantiated)
805 {
806 for (p = avail_temp_slots; p; p = p->next)
807 {
808 if (p->align >= align
809 && known_ge (p->size, size)
810 && GET_MODE (p->slot) == mode
811 && objects_must_conflict_p (p->type, type)
812 && (best_p == 0
813 || (known_eq (best_p->size, p->size)
814 ? best_p->align > p->align
815 : known_ge (best_p->size, p->size))))
816 {
817 if (p->align == align && known_eq (p->size, size))
818 {
819 selected = p;
820 cut_slot_from_list (selected, &avail_temp_slots);
821 best_p = 0;
822 break;
823 }
824 best_p = p;
825 }
826 }
827 }
828
829 /* Make our best, if any, the one to use. */
830 if (best_p)
831 {
832 selected = best_p;
833 cut_slot_from_list (selected, &avail_temp_slots);
834
835 /* If there are enough aligned bytes left over, make them into a new
836 temp_slot so that the extra bytes don't get wasted. Do this only
837 for BLKmode slots, so that we can be sure of the alignment. */
838 if (GET_MODE (best_p->slot) == BLKmode)
839 {
840 int alignment = best_p->align / BITS_PER_UNIT;
841 poly_int64 rounded_size = aligned_upper_bound (size, alignment);
842
843 if (known_ge (best_p->size - rounded_size, alignment))
844 {
845 p = ggc_alloc<temp_slot> ();
846 p->in_use = 0;
847 p->size = best_p->size - rounded_size;
848 p->base_offset = best_p->base_offset + rounded_size;
849 p->full_size = best_p->full_size - rounded_size;
850 p->slot = adjust_address_nv (best_p->slot, BLKmode, rounded_size);
851 p->align = best_p->align;
852 p->type = best_p->type;
853 insert_slot_to_list (p, &avail_temp_slots);
854
855 vec_safe_push (stack_slot_list, p->slot);
856
857 best_p->size = rounded_size;
858 best_p->full_size = rounded_size;
859 }
860 }
861 }
862
863 /* If we still didn't find one, make a new temporary. */
864 if (selected == 0)
865 {
866 poly_int64 frame_offset_old = frame_offset;
867
868 p = ggc_alloc<temp_slot> ();
869
870 /* We are passing an explicit alignment request to assign_stack_local.
871 One side effect of that is assign_stack_local will not round SIZE
872 to ensure the frame offset remains suitably aligned.
873
874 So for requests which depended on the rounding of SIZE, we go ahead
875 and round it now. We also make sure ALIGNMENT is at least
876 BIGGEST_ALIGNMENT. */
877 gcc_assert (mode != BLKmode || align == BIGGEST_ALIGNMENT);
878 p->slot = assign_stack_local_1 (mode,
879 (mode == BLKmode
880 ? aligned_upper_bound (size,
881 (int) align
882 / BITS_PER_UNIT)
883 : size),
884 align, 0);
885
886 p->align = align;
887
888 /* The following slot size computation is necessary because we don't
889 know the actual size of the temporary slot until assign_stack_local
890 has performed all the frame alignment and size rounding for the
891 requested temporary. Note that extra space added for alignment
892 can be either above or below this stack slot depending on which
893 way the frame grows. We include the extra space if and only if it
894 is above this slot. */
895 if (FRAME_GROWS_DOWNWARD)
896 p->size = frame_offset_old - frame_offset;
897 else
898 p->size = size;
899
900 /* Now define the fields used by combine_temp_slots. */
901 if (FRAME_GROWS_DOWNWARD)
902 {
903 p->base_offset = frame_offset;
904 p->full_size = frame_offset_old - frame_offset;
905 }
906 else
907 {
908 p->base_offset = frame_offset_old;
909 p->full_size = frame_offset - frame_offset_old;
910 }
911
912 selected = p;
913 }
914
915 p = selected;
916 p->in_use = 1;
917 p->type = type;
918 p->level = temp_slot_level;
919 n_temp_slots_in_use++;
920
921 pp = temp_slots_at_level (p->level);
922 insert_slot_to_list (p, pp);
923 insert_temp_slot_address (XEXP (p->slot, 0), p);
924
925 /* Create a new MEM rtx to avoid clobbering MEM flags of old slots. */
926 slot = gen_rtx_MEM (mode, XEXP (p->slot, 0));
927 vec_safe_push (stack_slot_list, slot);
928
929 /* If we know the alias set for the memory that will be used, use
930 it. If there's no TYPE, then we don't know anything about the
931 alias set for the memory. */
932 set_mem_alias_set (slot, type ? get_alias_set (type) : 0);
933 set_mem_align (slot, align);
934
935 /* If a type is specified, set the relevant flags. */
936 if (type != 0)
937 MEM_VOLATILE_P (slot) = TYPE_VOLATILE (type);
938 MEM_NOTRAP_P (slot) = 1;
939
940 return slot;
941 }
942
943 /* Allocate a temporary stack slot and record it for possible later
944 reuse. The first two arguments are the same as in the preceding function. */
945
946 rtx
947 assign_stack_temp (machine_mode mode, poly_int64 size)
948 {
949 return assign_stack_temp_for_type (mode, size, NULL_TREE);
950 }
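/* Illustrative use only: expansion code that needs a scratch stack slot
   for a DImode value, with no associated type, might write

     rtx tmp = assign_stack_temp (DImode, GET_MODE_SIZE (DImode));

   The slot becomes available for reuse again once free_temp_slots (or
   pop_temp_slots) is called for its nesting level.  */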
951 \f
952 /* Assign a temporary.
953 If TYPE_OR_DECL is a decl, then we are doing it on behalf of the decl,
954 which should therefore be used in error messages. In either case, we
955 allocate an object of the given type.
956 MEMORY_REQUIRED is 1 if the result must be addressable stack memory;
957 it is 0 if a register is OK.
958 DONT_PROMOTE is 1 if we should not promote values in register
959 to wider modes. */
960
961 rtx
962 assign_temp (tree type_or_decl, int memory_required,
963 int dont_promote ATTRIBUTE_UNUSED)
964 {
965 tree type, decl;
966 machine_mode mode;
967 #ifdef PROMOTE_MODE
968 int unsignedp;
969 #endif
970
971 if (DECL_P (type_or_decl))
972 decl = type_or_decl, type = TREE_TYPE (decl);
973 else
974 decl = NULL, type = type_or_decl;
975
976 mode = TYPE_MODE (type);
977 #ifdef PROMOTE_MODE
978 unsignedp = TYPE_UNSIGNED (type);
979 #endif
980
981 /* Allocating temporaries of TREE_ADDRESSABLE type must be done in the front
982 end. See also create_tmp_var for the gimplification-time check. */
983 gcc_assert (!TREE_ADDRESSABLE (type) && COMPLETE_TYPE_P (type));
984
985 if (mode == BLKmode || memory_required)
986 {
987 poly_int64 size;
988 rtx tmp;
989
990 /* Unfortunately, we don't yet know how to allocate variable-sized
991 temporaries. However, sometimes we can find a fixed upper limit on
992 the size, so try that instead. */
993 if (!poly_int_tree_p (TYPE_SIZE_UNIT (type), &size))
994 size = max_int_size_in_bytes (type);
995
996 /* Zero sized arrays are a GNU C extension. Set size to 1 to avoid
997 problems with allocating the stack space. */
998 if (known_eq (size, 0))
999 size = 1;
1000
1001 /* The size of the temporary may be too large to fit into an integer. */
1002 /* ??? Not sure this should happen except for user silliness, so limit
1003 this to things that aren't compiler-generated temporaries. The
1004 rest of the time we'll die in assign_stack_temp_for_type. */
1005 if (decl
1006 && !known_size_p (size)
1007 && TREE_CODE (TYPE_SIZE_UNIT (type)) == INTEGER_CST)
1008 {
1009 error ("size of variable %q+D is too large", decl);
1010 size = 1;
1011 }
1012
1013 tmp = assign_stack_temp_for_type (mode, size, type);
1014 return tmp;
1015 }
1016
1017 #ifdef PROMOTE_MODE
1018 if (! dont_promote)
1019 mode = promote_mode (type, mode, &unsignedp);
1020 #endif
1021
1022 return gen_reg_rtx (mode);
1023 }
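/* Illustrative use only (TYPE stands for some complete tree type known to
   the caller): requesting addressable stack memory for it looks like

     rtx mem = assign_temp (type, 1, 1);

   whereas passing 0 for MEMORY_REQUIRED allows a scalar type to end up in
   a (possibly promoted) pseudo register instead.  */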
1024 \f
1025 /* Combine temporary stack slots which are adjacent on the stack.
1026
1027 This allows for better use of already allocated stack space. This is only
1028 done for BLKmode slots because we can be sure that we won't have alignment
1029 problems in this case. */
1030
1031 static void
1032 combine_temp_slots (void)
1033 {
1034 class temp_slot *p, *q, *next, *next_q;
1035 int num_slots;
1036
1037 /* We can't combine slots, because the information about which slot
1038 is in which alias set will be lost. */
1039 if (flag_strict_aliasing)
1040 return;
1041
1042 /* If there are a lot of temp slots, don't do anything unless
1043 high levels of optimization are enabled.
1044 if (! flag_expensive_optimizations)
1045 for (p = avail_temp_slots, num_slots = 0; p; p = p->next, num_slots++)
1046 if (num_slots > 100 || (num_slots > 10 && optimize == 0))
1047 return;
1048
1049 for (p = avail_temp_slots; p; p = next)
1050 {
1051 int delete_p = 0;
1052
1053 next = p->next;
1054
1055 if (GET_MODE (p->slot) != BLKmode)
1056 continue;
1057
1058 for (q = p->next; q; q = next_q)
1059 {
1060 int delete_q = 0;
1061
1062 next_q = q->next;
1063
1064 if (GET_MODE (q->slot) != BLKmode)
1065 continue;
1066
1067 if (known_eq (p->base_offset + p->full_size, q->base_offset))
1068 {
1069 /* Q comes after P; combine Q into P. */
1070 p->size += q->size;
1071 p->full_size += q->full_size;
1072 delete_q = 1;
1073 }
1074 else if (known_eq (q->base_offset + q->full_size, p->base_offset))
1075 {
1076 /* P comes after Q; combine P into Q. */
1077 q->size += p->size;
1078 q->full_size += p->full_size;
1079 delete_p = 1;
1080 break;
1081 }
1082 if (delete_q)
1083 cut_slot_from_list (q, &avail_temp_slots);
1084 }
1085
1086 /* Either delete P or advance past it. */
1087 if (delete_p)
1088 cut_slot_from_list (p, &avail_temp_slots);
1089 }
1090 }
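/* A small worked example with illustrative offsets: if the available list
   holds two BLKmode slots P and Q with P->base_offset == 16,
   P->full_size == 16, Q->base_offset == 32 and Q->full_size == 16, then
   P and Q are adjacent (16 + 16 == 32), so Q is folded into P, leaving a
   single slot covering 32 bytes from offset 16.  */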
1091 \f
1092 /* Indicate that NEW_RTX is an alternate way of referring to the temp
1093 slot that previously was known by OLD_RTX. */
1094
1095 void
1096 update_temp_slot_address (rtx old_rtx, rtx new_rtx)
1097 {
1098 class temp_slot *p;
1099
1100 if (rtx_equal_p (old_rtx, new_rtx))
1101 return;
1102
1103 p = find_temp_slot_from_address (old_rtx);
1104
1105 /* If we didn't find one, see if OLD_RTX is a PLUS. If so, and
1106 NEW_RTX is a register, see if one operand of the PLUS is a
1107 temporary location. If so, NEW_RTX points into it. Otherwise,
1108 if both OLD_RTX and NEW_RTX are a PLUS and if there is a register
1109 in common between them. If so, try a recursive call on those
1110 values. */
1111 if (p == 0)
1112 {
1113 if (GET_CODE (old_rtx) != PLUS)
1114 return;
1115
1116 if (REG_P (new_rtx))
1117 {
1118 update_temp_slot_address (XEXP (old_rtx, 0), new_rtx);
1119 update_temp_slot_address (XEXP (old_rtx, 1), new_rtx);
1120 return;
1121 }
1122 else if (GET_CODE (new_rtx) != PLUS)
1123 return;
1124
1125 if (rtx_equal_p (XEXP (old_rtx, 0), XEXP (new_rtx, 0)))
1126 update_temp_slot_address (XEXP (old_rtx, 1), XEXP (new_rtx, 1));
1127 else if (rtx_equal_p (XEXP (old_rtx, 1), XEXP (new_rtx, 0)))
1128 update_temp_slot_address (XEXP (old_rtx, 0), XEXP (new_rtx, 1));
1129 else if (rtx_equal_p (XEXP (old_rtx, 0), XEXP (new_rtx, 1)))
1130 update_temp_slot_address (XEXP (old_rtx, 1), XEXP (new_rtx, 0));
1131 else if (rtx_equal_p (XEXP (old_rtx, 1), XEXP (new_rtx, 1)))
1132 update_temp_slot_address (XEXP (old_rtx, 0), XEXP (new_rtx, 0));
1133
1134 return;
1135 }
1136
1137 /* Otherwise add an alias for the temp's address. */
1138 insert_temp_slot_address (new_rtx, p);
1139 }
1140
1141 /* If X could be a reference to a temporary slot, mark that slot as
1142 belonging to one level higher than the current level. If X
1143 matched one of our slots, just mark that one. Otherwise, we can't
1144 easily predict which it is, so upgrade all of them.
1145
1146 This is called when an ({...}) construct occurs and a statement
1147 returns a value in memory. */
1148
1149 void
1150 preserve_temp_slots (rtx x)
1151 {
1152 class temp_slot *p = 0, *next;
1153
1154 if (x == 0)
1155 return;
1156
1157 /* If X is a register that is being used as a pointer, see if we have
1158 a temporary slot we know it points to. */
1159 if (REG_P (x) && REG_POINTER (x))
1160 p = find_temp_slot_from_address (x);
1161
1162 /* If X is not in memory or is at a constant address, it cannot be in
1163 a temporary slot. */
1164 if (p == 0 && (!MEM_P (x) || CONSTANT_P (XEXP (x, 0))))
1165 return;
1166
1167 /* First see if we can find a match. */
1168 if (p == 0)
1169 p = find_temp_slot_from_address (XEXP (x, 0));
1170
1171 if (p != 0)
1172 {
1173 if (p->level == temp_slot_level)
1174 move_slot_to_level (p, temp_slot_level - 1);
1175 return;
1176 }
1177
1178 /* Otherwise, preserve all non-kept slots at this level. */
1179 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1180 {
1181 next = p->next;
1182 move_slot_to_level (p, temp_slot_level - 1);
1183 }
1184 }
1185
1186 /* Free all temporaries used so far. This is normally called at the
1187 end of generating code for a statement. */
1188
1189 void
1190 free_temp_slots (void)
1191 {
1192 class temp_slot *p, *next;
1193 bool some_available = false;
1194
1195 for (p = *temp_slots_at_level (temp_slot_level); p; p = next)
1196 {
1197 next = p->next;
1198 make_slot_available (p);
1199 some_available = true;
1200 }
1201
1202 if (some_available)
1203 {
1204 remove_unused_temp_slot_addresses ();
1205 combine_temp_slots ();
1206 }
1207 }
1208
1209 /* Push deeper into the nesting level for stack temporaries. */
1210
1211 void
1212 push_temp_slots (void)
1213 {
1214 temp_slot_level++;
1215 }
1216
1217 /* Pop a temporary nesting level. All slots in use in the current level
1218 are freed. */
1219
1220 void
1221 pop_temp_slots (void)
1222 {
1223 free_temp_slots ();
1224 temp_slot_level--;
1225 }
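/* Illustrative pattern only: callers typically bracket the expansion of a
   statement or call with

     push_temp_slots ();
     ... code that may call assign_stack_temp or assign_temp ...
     preserve_temp_slots (result);   (only if RESULT may live in a temp)
     pop_temp_slots ();

   so that temporaries created in between are freed when the level is
   popped, or moved to the enclosing level if preserved.  */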
1226
1227 /* Initialize temporary slots. */
1228
1229 void
1230 init_temp_slots (void)
1231 {
1232 /* We have not allocated any temporaries yet. */
1233 avail_temp_slots = 0;
1234 vec_alloc (used_temp_slots, 0);
1235 temp_slot_level = 0;
1236 n_temp_slots_in_use = 0;
1237
1238 /* Set up the table to map addresses to temp slots. */
1239 if (! temp_slot_address_table)
1240 temp_slot_address_table = hash_table<temp_address_hasher>::create_ggc (32);
1241 else
1242 temp_slot_address_table->empty ();
1243 }
1244 \f
1245 /* Functions and data structures to keep track of the values hard regs
1246 had at the start of the function. */
1247
1248 /* Private type used by get_hard_reg_initial_reg, get_hard_reg_initial_val,
1249 and has_hard_reg_initial_val. */
1250 struct GTY(()) initial_value_pair {
1251 rtx hard_reg;
1252 rtx pseudo;
1253 };
1254 /* ??? This could be a VEC but there is currently no way to define an
1255 opaque VEC type. This could be worked around by defining struct
1256 initial_value_pair in function.h. */
1257 struct GTY(()) initial_value_struct {
1258 int num_entries;
1259 int max_entries;
1260 initial_value_pair * GTY ((length ("%h.num_entries"))) entries;
1261 };
1262
1263 /* If a pseudo represents an initial hard reg (or expression), return
1264 it, else return NULL_RTX. */
1265
1266 rtx
1267 get_hard_reg_initial_reg (rtx reg)
1268 {
1269 struct initial_value_struct *ivs = crtl->hard_reg_initial_vals;
1270 int i;
1271
1272 if (ivs == 0)
1273 return NULL_RTX;
1274
1275 for (i = 0; i < ivs->num_entries; i++)
1276 if (rtx_equal_p (ivs->entries[i].pseudo, reg))
1277 return ivs->entries[i].hard_reg;
1278
1279 return NULL_RTX;
1280 }
1281
1282 /* Make sure that there's a pseudo register of mode MODE that stores the
1283 initial value of hard register REGNO. Return an rtx for such a pseudo. */
1284
1285 rtx
1286 get_hard_reg_initial_val (machine_mode mode, unsigned int regno)
1287 {
1288 struct initial_value_struct *ivs;
1289 rtx rv;
1290
1291 rv = has_hard_reg_initial_val (mode, regno);
1292 if (rv)
1293 return rv;
1294
1295 ivs = crtl->hard_reg_initial_vals;
1296 if (ivs == 0)
1297 {
1298 ivs = ggc_alloc<initial_value_struct> ();
1299 ivs->num_entries = 0;
1300 ivs->max_entries = 5;
1301 ivs->entries = ggc_vec_alloc<initial_value_pair> (5);
1302 crtl->hard_reg_initial_vals = ivs;
1303 }
1304
1305 if (ivs->num_entries >= ivs->max_entries)
1306 {
1307 ivs->max_entries += 5;
1308 ivs->entries = GGC_RESIZEVEC (initial_value_pair, ivs->entries,
1309 ivs->max_entries);
1310 }
1311
1312 ivs->entries[ivs->num_entries].hard_reg = gen_rtx_REG (mode, regno);
1313 ivs->entries[ivs->num_entries].pseudo = gen_reg_rtx (mode);
1314
1315 return ivs->entries[ivs->num_entries++].pseudo;
1316 }
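/* Illustrative use only; REGNO_OF_INTEREST is a placeholder, not a real
   macro.  A back end that wants the value some hard register had on entry
   to the function can write

     rtx entry_val = get_hard_reg_initial_val (Pmode, REGNO_OF_INTEREST);

   and use ENTRY_VAL freely; the pass that runs emit_initial_value_sets
   later emits the copy from the hard register into the pseudo at the
   function entry.  */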
1317
1318 /* See if get_hard_reg_initial_val has been used to create a pseudo
1319 for the initial value of hard register REGNO in mode MODE. Return
1320 the associated pseudo if so, otherwise return NULL. */
1321
1322 rtx
1323 has_hard_reg_initial_val (machine_mode mode, unsigned int regno)
1324 {
1325 struct initial_value_struct *ivs;
1326 int i;
1327
1328 ivs = crtl->hard_reg_initial_vals;
1329 if (ivs != 0)
1330 for (i = 0; i < ivs->num_entries; i++)
1331 if (GET_MODE (ivs->entries[i].hard_reg) == mode
1332 && REGNO (ivs->entries[i].hard_reg) == regno)
1333 return ivs->entries[i].pseudo;
1334
1335 return NULL_RTX;
1336 }
1337
1338 unsigned int
1339 emit_initial_value_sets (void)
1340 {
1341 struct initial_value_struct *ivs = crtl->hard_reg_initial_vals;
1342 int i;
1343 rtx_insn *seq;
1344
1345 if (ivs == 0)
1346 return 0;
1347
1348 start_sequence ();
1349 for (i = 0; i < ivs->num_entries; i++)
1350 emit_move_insn (ivs->entries[i].pseudo, ivs->entries[i].hard_reg);
1351 seq = get_insns ();
1352 end_sequence ();
1353
1354 emit_insn_at_entry (seq);
1355 return 0;
1356 }
1357
1358 /* Store the hard reg and pseudo reg of initial-values entry I in *HREG
1359 and *PREG and return TRUE, or return FALSE if I is not a valid entry. */
1360 bool
1361 initial_value_entry (int i, rtx *hreg, rtx *preg)
1362 {
1363 struct initial_value_struct *ivs = crtl->hard_reg_initial_vals;
1364 if (!ivs || i >= ivs->num_entries)
1365 return false;
1366
1367 *hreg = ivs->entries[i].hard_reg;
1368 *preg = ivs->entries[i].pseudo;
1369 return true;
1370 }
1371 \f
1372 /* These routines are responsible for converting virtual register references
1373 to the actual hard register references once RTL generation is complete.
1374
1375 The following four variables are used for communication between the
1376 routines. They contain the offsets of the virtual registers from their
1377 respective hard registers. */
1378
1379 static poly_int64 in_arg_offset;
1380 static poly_int64 var_offset;
1381 static poly_int64 dynamic_offset;
1382 static poly_int64 out_arg_offset;
1383 static poly_int64 cfa_offset;
1384
1385 /* In most machines, the stack pointer register is equivalent to the bottom
1386 of the stack. */
1387
1388 #ifndef STACK_POINTER_OFFSET
1389 #define STACK_POINTER_OFFSET 0
1390 #endif
1391
1392 #if defined (REG_PARM_STACK_SPACE) && !defined (INCOMING_REG_PARM_STACK_SPACE)
1393 #define INCOMING_REG_PARM_STACK_SPACE REG_PARM_STACK_SPACE
1394 #endif
1395
1396 /* If not defined, pick an appropriate default for the offset of dynamically
1397 allocated memory depending on the value of ACCUMULATE_OUTGOING_ARGS,
1398 INCOMING_REG_PARM_STACK_SPACE, and OUTGOING_REG_PARM_STACK_SPACE. */
1399
1400 #ifndef STACK_DYNAMIC_OFFSET
1401
1402 /* The bottom of the stack points to the actual arguments. If
1403 REG_PARM_STACK_SPACE is defined, this includes the space for the register
1404 parameters. However, if OUTGOING_REG_PARM_STACK_SPACE is not defined,
1405 stack space for register parameters is not pushed by the caller, but
1406 rather part of the fixed stack areas and hence not included in
1407 `crtl->outgoing_args_size'. Nevertheless, we must allow
1408 for it when allocating stack dynamic objects. */
1409
1410 #ifdef INCOMING_REG_PARM_STACK_SPACE
1411 #define STACK_DYNAMIC_OFFSET(FNDECL) \
1412 ((ACCUMULATE_OUTGOING_ARGS \
1413 ? (crtl->outgoing_args_size \
1414 + (OUTGOING_REG_PARM_STACK_SPACE ((!(FNDECL) ? NULL_TREE : TREE_TYPE (FNDECL))) ? 0 \
1415 : INCOMING_REG_PARM_STACK_SPACE (FNDECL))) \
1416 : 0) + (STACK_POINTER_OFFSET))
1417 #else
1418 #define STACK_DYNAMIC_OFFSET(FNDECL) \
1419 ((ACCUMULATE_OUTGOING_ARGS ? crtl->outgoing_args_size : poly_int64 (0)) \
1420 + (STACK_POINTER_OFFSET))
1421 #endif
1422 #endif
1423
1424 \f
1425 /* Given a piece of RTX and a pointer to a poly_int64, if the RTX
1426 is a virtual register, return the equivalent hard register and set the
1427 offset indirectly through the pointer. Otherwise, return 0. */
1428
1429 static rtx
1430 instantiate_new_reg (rtx x, poly_int64_pod *poffset)
1431 {
1432 rtx new_rtx;
1433 poly_int64 offset;
1434
1435 if (x == virtual_incoming_args_rtx)
1436 {
1437 if (stack_realign_drap)
1438 {
1439 /* Replace virtual_incoming_args_rtx with internal arg
1440 pointer if DRAP is used to realign stack. */
1441 new_rtx = crtl->args.internal_arg_pointer;
1442 offset = 0;
1443 }
1444 else
1445 new_rtx = arg_pointer_rtx, offset = in_arg_offset;
1446 }
1447 else if (x == virtual_stack_vars_rtx)
1448 new_rtx = frame_pointer_rtx, offset = var_offset;
1449 else if (x == virtual_stack_dynamic_rtx)
1450 new_rtx = stack_pointer_rtx, offset = dynamic_offset;
1451 else if (x == virtual_outgoing_args_rtx)
1452 new_rtx = stack_pointer_rtx, offset = out_arg_offset;
1453 else if (x == virtual_cfa_rtx)
1454 {
1455 #ifdef FRAME_POINTER_CFA_OFFSET
1456 new_rtx = frame_pointer_rtx;
1457 #else
1458 new_rtx = arg_pointer_rtx;
1459 #endif
1460 offset = cfa_offset;
1461 }
1462 else if (x == virtual_preferred_stack_boundary_rtx)
1463 {
1464 new_rtx = GEN_INT (crtl->preferred_stack_boundary / BITS_PER_UNIT);
1465 offset = 0;
1466 }
1467 else
1468 return NULL_RTX;
1469
1470 *poffset = offset;
1471 return new_rtx;
1472 }
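/* As an illustration of the mapping (the offsets are symbolic): an address
   such as

     (plus (reg virtual-stack-vars) (const_int 8))

   is rewritten during instantiation into

     (plus (reg frame-pointer) (const_int 8 + var_offset))

   with the two constants folded into a single const_int once var_offset
   is known.  */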
1473
1474 /* A subroutine of instantiate_virtual_regs. Instantiate any virtual
1475 registers present inside of *LOC. The expression is simplified,
1476 as much as possible, but is not to be considered "valid" in any sense
1477 implied by the target. Return true if any change is made. */
1478
1479 static bool
1480 instantiate_virtual_regs_in_rtx (rtx *loc)
1481 {
1482 if (!*loc)
1483 return false;
1484 bool changed = false;
1485 subrtx_ptr_iterator::array_type array;
1486 FOR_EACH_SUBRTX_PTR (iter, array, loc, NONCONST)
1487 {
1488 rtx *loc = *iter;
1489 if (rtx x = *loc)
1490 {
1491 rtx new_rtx;
1492 poly_int64 offset;
1493 switch (GET_CODE (x))
1494 {
1495 case REG:
1496 new_rtx = instantiate_new_reg (x, &offset);
1497 if (new_rtx)
1498 {
1499 *loc = plus_constant (GET_MODE (x), new_rtx, offset);
1500 changed = true;
1501 }
1502 iter.skip_subrtxes ();
1503 break;
1504
1505 case PLUS:
1506 new_rtx = instantiate_new_reg (XEXP (x, 0), &offset);
1507 if (new_rtx)
1508 {
1509 XEXP (x, 0) = new_rtx;
1510 *loc = plus_constant (GET_MODE (x), x, offset, true);
1511 changed = true;
1512 iter.skip_subrtxes ();
1513 break;
1514 }
1515
1516 /* FIXME -- from old code */
1517 /* If we have (plus (subreg (virtual-reg)) (const_int)), we know
1518 we can commute the PLUS and SUBREG because pointers into the
1519 frame are well-behaved. */
1520 break;
1521
1522 default:
1523 break;
1524 }
1525 }
1526 }
1527 return changed;
1528 }
1529
1530 /* A subroutine of instantiate_virtual_regs_in_insn. Return true if X
1531 matches the predicate for insn CODE operand OPERAND. */
1532
1533 static int
1534 safe_insn_predicate (int code, int operand, rtx x)
1535 {
1536 return code < 0 || insn_operand_matches ((enum insn_code) code, operand, x);
1537 }
1538
1539 /* A subroutine of instantiate_virtual_regs. Instantiate any virtual
1540 registers present inside of insn. The result will be a valid insn. */
1541
1542 static void
1543 instantiate_virtual_regs_in_insn (rtx_insn *insn)
1544 {
1545 poly_int64 offset;
1546 int insn_code, i;
1547 bool any_change = false;
1548 rtx set, new_rtx, x;
1549 rtx_insn *seq;
1550
1551 /* There are some special cases to be handled first. */
1552 set = single_set (insn);
1553 if (set)
1554 {
1555 /* We're allowed to assign to a virtual register. This is interpreted
1556 to mean that the underlying register gets assigned the inverse
1557 transformation. This is used, for example, in the handling of
1558 non-local gotos. */
1559 new_rtx = instantiate_new_reg (SET_DEST (set), &offset);
1560 if (new_rtx)
1561 {
1562 start_sequence ();
1563
1564 instantiate_virtual_regs_in_rtx (&SET_SRC (set));
1565 x = simplify_gen_binary (PLUS, GET_MODE (new_rtx), SET_SRC (set),
1566 gen_int_mode (-offset, GET_MODE (new_rtx)));
1567 x = force_operand (x, new_rtx);
1568 if (x != new_rtx)
1569 emit_move_insn (new_rtx, x);
1570
1571 seq = get_insns ();
1572 end_sequence ();
1573
1574 emit_insn_before (seq, insn);
1575 delete_insn (insn);
1576 return;
1577 }
1578
1579 /* Handle a straight copy from a virtual register by generating a
1580 new add insn. The difference between this and falling through
1581 to the generic case is avoiding a new pseudo and eliminating a
1582 move insn in the initial rtl stream. */
1583 new_rtx = instantiate_new_reg (SET_SRC (set), &offset);
1584 if (new_rtx
1585 && maybe_ne (offset, 0)
1586 && REG_P (SET_DEST (set))
1587 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1588 {
1589 start_sequence ();
1590
1591 x = expand_simple_binop (GET_MODE (SET_DEST (set)), PLUS, new_rtx,
1592 gen_int_mode (offset,
1593 GET_MODE (SET_DEST (set))),
1594 SET_DEST (set), 1, OPTAB_LIB_WIDEN);
1595 if (x != SET_DEST (set))
1596 emit_move_insn (SET_DEST (set), x);
1597
1598 seq = get_insns ();
1599 end_sequence ();
1600
1601 emit_insn_before (seq, insn);
1602 delete_insn (insn);
1603 return;
1604 }
1605
1606 extract_insn (insn);
1607 insn_code = INSN_CODE (insn);
1608
1609 /* Handle a plus involving a virtual register by determining if the
1610 operands remain valid if they're modified in place. */
1611 poly_int64 delta;
1612 if (GET_CODE (SET_SRC (set)) == PLUS
1613 && recog_data.n_operands >= 3
1614 && recog_data.operand_loc[1] == &XEXP (SET_SRC (set), 0)
1615 && recog_data.operand_loc[2] == &XEXP (SET_SRC (set), 1)
1616 && poly_int_rtx_p (recog_data.operand[2], &delta)
1617 && (new_rtx = instantiate_new_reg (recog_data.operand[1], &offset)))
1618 {
1619 offset += delta;
1620
1621 /* If the sum is zero, then replace with a plain move. */
1622 if (known_eq (offset, 0)
1623 && REG_P (SET_DEST (set))
1624 && REGNO (SET_DEST (set)) > LAST_VIRTUAL_REGISTER)
1625 {
1626 start_sequence ();
1627 emit_move_insn (SET_DEST (set), new_rtx);
1628 seq = get_insns ();
1629 end_sequence ();
1630
1631 emit_insn_before (seq, insn);
1632 delete_insn (insn);
1633 return;
1634 }
1635
1636 x = gen_int_mode (offset, recog_data.operand_mode[2]);
1637
1638 /* Using validate_change and apply_change_group here leaves
1639 recog_data in an invalid state. Since we know exactly what
1640 we want to check, do those two by hand. */
1641 if (safe_insn_predicate (insn_code, 1, new_rtx)
1642 && safe_insn_predicate (insn_code, 2, x))
1643 {
1644 *recog_data.operand_loc[1] = recog_data.operand[1] = new_rtx;
1645 *recog_data.operand_loc[2] = recog_data.operand[2] = x;
1646 any_change = true;
1647
1648 /* Fall through into the regular operand fixup loop in
1649 order to take care of operands other than 1 and 2. */
1650 }
1651 }
1652 }
1653 else
1654 {
1655 extract_insn (insn);
1656 insn_code = INSN_CODE (insn);
1657 }
1658
1659 /* In the general case, we expect virtual registers to appear only in
1660 operands, and then only as either bare registers or inside memories. */
1661 for (i = 0; i < recog_data.n_operands; ++i)
1662 {
1663 x = recog_data.operand[i];
1664 switch (GET_CODE (x))
1665 {
1666 case MEM:
1667 {
1668 rtx addr = XEXP (x, 0);
1669
1670 if (!instantiate_virtual_regs_in_rtx (&addr))
1671 continue;
1672
1673 start_sequence ();
1674 x = replace_equiv_address (x, addr, true);
1675 /* It may happen that the address with the virtual reg
1676 was valid (e.g. based on the virtual stack reg, which might
1677 be acceptable to the predicates with all offsets), whereas
1678 the address now isn't anymore, for instance when the address
1679 is still offsetted, but the base reg isn't virtual-stack-reg
1680 anymore. Below we would do a force_reg on the whole operand,
1681 but this insn might actually only accept memory. Hence,
1682 before doing that last resort, try to reload the address into
1683 a register, so this operand stays a MEM. */
1684 if (!safe_insn_predicate (insn_code, i, x))
1685 {
1686 addr = force_reg (GET_MODE (addr), addr);
1687 x = replace_equiv_address (x, addr, true);
1688 }
1689 seq = get_insns ();
1690 end_sequence ();
1691 if (seq)
1692 emit_insn_before (seq, insn);
1693 }
1694 break;
1695
1696 case REG:
1697 new_rtx = instantiate_new_reg (x, &offset);
1698 if (new_rtx == NULL)
1699 continue;
1700 if (known_eq (offset, 0))
1701 x = new_rtx;
1702 else
1703 {
1704 start_sequence ();
1705
1706 /* Careful, special mode predicates may have stuff in
1707 insn_data[insn_code].operand[i].mode that isn't useful
1708 to us for computing a new value. */
1709 /* ??? Recognize address_operand and/or "p" constraints
1710 to see if (plus new offset) is valid before we put
1711 this through expand_simple_binop. */
1712 x = expand_simple_binop (GET_MODE (x), PLUS, new_rtx,
1713 gen_int_mode (offset, GET_MODE (x)),
1714 NULL_RTX, 1, OPTAB_LIB_WIDEN);
1715 seq = get_insns ();
1716 end_sequence ();
1717 emit_insn_before (seq, insn);
1718 }
1719 break;
1720
1721 case SUBREG:
1722 new_rtx = instantiate_new_reg (SUBREG_REG (x), &offset);
1723 if (new_rtx == NULL)
1724 continue;
1725 if (maybe_ne (offset, 0))
1726 {
1727 start_sequence ();
1728 new_rtx = expand_simple_binop
1729 (GET_MODE (new_rtx), PLUS, new_rtx,
1730 gen_int_mode (offset, GET_MODE (new_rtx)),
1731 NULL_RTX, 1, OPTAB_LIB_WIDEN);
1732 seq = get_insns ();
1733 end_sequence ();
1734 emit_insn_before (seq, insn);
1735 }
1736 x = simplify_gen_subreg (recog_data.operand_mode[i], new_rtx,
1737 GET_MODE (new_rtx), SUBREG_BYTE (x));
1738 gcc_assert (x);
1739 break;
1740
1741 default:
1742 continue;
1743 }
1744
1745 /* At this point, X contains the new value for the operand.
1746 Validate the new value vs the insn predicate. Note that
1747 asm insns will have insn_code -1 here. */
1748 if (!safe_insn_predicate (insn_code, i, x))
1749 {
1750 start_sequence ();
1751 if (REG_P (x))
1752 {
1753 gcc_assert (REGNO (x) <= LAST_VIRTUAL_REGISTER);
1754 x = copy_to_reg (x);
1755 }
1756 else
1757 x = force_reg (insn_data[insn_code].operand[i].mode, x);
1758 seq = get_insns ();
1759 end_sequence ();
1760 if (seq)
1761 emit_insn_before (seq, insn);
1762 }
1763
1764 *recog_data.operand_loc[i] = recog_data.operand[i] = x;
1765 any_change = true;
1766 }
1767
1768 if (any_change)
1769 {
1770 /* Propagate operand changes into the duplicates. */
1771 for (i = 0; i < recog_data.n_dups; ++i)
1772 *recog_data.dup_loc[i]
1773 = copy_rtx (recog_data.operand[(unsigned)recog_data.dup_num[i]]);
1774
1775 /* Force re-recognition of the instruction for validation. */
1776 INSN_CODE (insn) = -1;
1777 }
1778
1779 if (asm_noperands (PATTERN (insn)) >= 0)
1780 {
1781 if (!check_asm_operands (PATTERN (insn)))
1782 {
1783 error_for_asm (insn, "impossible constraint in %<asm%>");
1784 /* For asm goto, instead of fixing up all the edges
1785 just clear the template and clear input operands
1786 (asm goto doesn't have any output operands). */
1787 if (JUMP_P (insn))
1788 {
1789 rtx asm_op = extract_asm_operands (PATTERN (insn));
1790 ASM_OPERANDS_TEMPLATE (asm_op) = ggc_strdup ("");
1791 ASM_OPERANDS_INPUT_VEC (asm_op) = rtvec_alloc (0);
1792 ASM_OPERANDS_INPUT_CONSTRAINT_VEC (asm_op) = rtvec_alloc (0);
1793 }
1794 else
1795 delete_insn (insn);
1796 }
1797 }
1798 else
1799 {
1800 if (recog_memoized (insn) < 0)
1801 fatal_insn_not_found (insn);
1802 }
1803 }
1804
1805 /* Subroutine of instantiate_decls. Given RTL representing a decl,
1806 do any instantiation required. */
1807
1808 void
1809 instantiate_decl_rtl (rtx x)
1810 {
1811 rtx addr;
1812
1813 if (x == 0)
1814 return;
1815
1816 /* If this is a CONCAT, recurse for the pieces. */
1817 if (GET_CODE (x) == CONCAT)
1818 {
1819 instantiate_decl_rtl (XEXP (x, 0));
1820 instantiate_decl_rtl (XEXP (x, 1));
1821 return;
1822 }
1823
1824 /* If this is not a MEM, no need to do anything. Similarly if the
1825 address is a constant or a register that is not a virtual register. */
1826 if (!MEM_P (x))
1827 return;
1828
1829 addr = XEXP (x, 0);
1830 if (CONSTANT_P (addr)
1831 || (REG_P (addr)
1832 && (REGNO (addr) < FIRST_VIRTUAL_REGISTER
1833 || REGNO (addr) > LAST_VIRTUAL_REGISTER)))
1834 return;
1835
1836 instantiate_virtual_regs_in_rtx (&XEXP (x, 0));
1837 }
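/* As an illustration of the rewrite performed here (a sketch; the hard
   register and the final displacement are target- and frame-dependent),
   a local variable whose DECL_RTL is built around a virtual register,

     (mem:SI (plus:SI (reg:SI virtual-stack-vars) (const_int -8)))

   has its address rewritten by instantiate_virtual_regs_in_rtx into
   something of the form

     (mem:SI (plus:SI (reg:SI frame-pointer) (const_int -16)))

   where the virtual base register has been replaced by the corresponding
   hard register and the displacement adjusted by the offset computed in
   instantiate_virtual_regs below.  */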
1838
1839 /* Helper for instantiate_decls called via walk_tree: Process all decls
1840 in the given DECL_VALUE_EXPR. */
1841
1842 static tree
1843 instantiate_expr (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
1844 {
1845 tree t = *tp;
1846 if (! EXPR_P (t))
1847 {
1848 *walk_subtrees = 0;
1849 if (DECL_P (t))
1850 {
1851 if (DECL_RTL_SET_P (t))
1852 instantiate_decl_rtl (DECL_RTL (t));
1853 if (TREE_CODE (t) == PARM_DECL && DECL_NAMELESS (t)
1854 && DECL_INCOMING_RTL (t))
1855 instantiate_decl_rtl (DECL_INCOMING_RTL (t));
1856 if ((VAR_P (t) || TREE_CODE (t) == RESULT_DECL)
1857 && DECL_HAS_VALUE_EXPR_P (t))
1858 {
1859 tree v = DECL_VALUE_EXPR (t);
1860 walk_tree (&v, instantiate_expr, NULL, NULL);
1861 }
1862 }
1863 }
1864 return NULL;
1865 }
1866
1867 /* Subroutine of instantiate_decls: Process all decls in the given
1868 BLOCK node and all its subblocks. */
1869
1870 static void
1871 instantiate_decls_1 (tree let)
1872 {
1873 tree t;
1874
1875 for (t = BLOCK_VARS (let); t; t = DECL_CHAIN (t))
1876 {
1877 if (DECL_RTL_SET_P (t))
1878 instantiate_decl_rtl (DECL_RTL (t));
1879 if (VAR_P (t) && DECL_HAS_VALUE_EXPR_P (t))
1880 {
1881 tree v = DECL_VALUE_EXPR (t);
1882 walk_tree (&v, instantiate_expr, NULL, NULL);
1883 }
1884 }
1885
1886 /* Process all subblocks. */
1887 for (t = BLOCK_SUBBLOCKS (let); t; t = BLOCK_CHAIN (t))
1888 instantiate_decls_1 (t);
1889 }
1890
1891 /* Scan all decls in FNDECL (both variables and parameters) and instantiate
1892 all virtual registers in their DECL_RTL's. */
1893
1894 static void
1895 instantiate_decls (tree fndecl)
1896 {
1897 tree decl;
1898 unsigned ix;
1899
1900 /* Process all parameters of the function. */
1901 for (decl = DECL_ARGUMENTS (fndecl); decl; decl = DECL_CHAIN (decl))
1902 {
1903 instantiate_decl_rtl (DECL_RTL (decl));
1904 instantiate_decl_rtl (DECL_INCOMING_RTL (decl));
1905 if (DECL_HAS_VALUE_EXPR_P (decl))
1906 {
1907 tree v = DECL_VALUE_EXPR (decl);
1908 walk_tree (&v, instantiate_expr, NULL, NULL);
1909 }
1910 }
1911
1912 if ((decl = DECL_RESULT (fndecl))
1913 && TREE_CODE (decl) == RESULT_DECL)
1914 {
1915 if (DECL_RTL_SET_P (decl))
1916 instantiate_decl_rtl (DECL_RTL (decl));
1917 if (DECL_HAS_VALUE_EXPR_P (decl))
1918 {
1919 tree v = DECL_VALUE_EXPR (decl);
1920 walk_tree (&v, instantiate_expr, NULL, NULL);
1921 }
1922 }
1923
1924 /* Process the saved static chain if it exists. */
1925 decl = DECL_STRUCT_FUNCTION (fndecl)->static_chain_decl;
1926 if (decl && DECL_HAS_VALUE_EXPR_P (decl))
1927 instantiate_decl_rtl (DECL_RTL (DECL_VALUE_EXPR (decl)));
1928
1929 /* Now process all variables defined in the function or its subblocks. */
1930 if (DECL_INITIAL (fndecl))
1931 instantiate_decls_1 (DECL_INITIAL (fndecl));
1932
1933 FOR_EACH_LOCAL_DECL (cfun, ix, decl)
1934 if (DECL_RTL_SET_P (decl))
1935 instantiate_decl_rtl (DECL_RTL (decl));
1936 vec_free (cfun->local_decls);
1937 }
1938
1939 /* Pass through the INSNS of function FNDECL and convert virtual register
1940 references to hard register references. */
1941
1942 static unsigned int
1943 instantiate_virtual_regs (void)
1944 {
1945 rtx_insn *insn;
1946
1947 /* Compute the offsets to use for this function. */
1948 in_arg_offset = FIRST_PARM_OFFSET (current_function_decl);
1949 var_offset = targetm.starting_frame_offset ();
1950 dynamic_offset = STACK_DYNAMIC_OFFSET (current_function_decl);
1951 out_arg_offset = STACK_POINTER_OFFSET;
1952 #ifdef FRAME_POINTER_CFA_OFFSET
1953 cfa_offset = FRAME_POINTER_CFA_OFFSET (current_function_decl);
1954 #else
1955 cfa_offset = ARG_POINTER_CFA_OFFSET (current_function_decl);
1956 #endif
1957
1958 /* Initialize recognition, indicating that volatile is OK. */
1959 init_recog ();
1960
1961 /* Scan through all the insns, instantiating every virtual register still
1962 present. */
1963 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
1964 if (INSN_P (insn))
1965 {
1966 /* These patterns in the instruction stream can never be recognized.
1967 Fortunately, they shouldn't contain virtual registers either. */
1968 if (GET_CODE (PATTERN (insn)) == USE
1969 || GET_CODE (PATTERN (insn)) == CLOBBER
1970 || GET_CODE (PATTERN (insn)) == ASM_INPUT
1971 || DEBUG_MARKER_INSN_P (insn))
1972 continue;
1973 else if (DEBUG_BIND_INSN_P (insn))
1974 instantiate_virtual_regs_in_rtx (INSN_VAR_LOCATION_PTR (insn));
1975 else
1976 instantiate_virtual_regs_in_insn (insn);
1977
1978 if (insn->deleted ())
1979 continue;
1980
1981 instantiate_virtual_regs_in_rtx (&REG_NOTES (insn));
1982
1983 /* Instantiate any virtual registers in CALL_INSN_FUNCTION_USAGE. */
1984 if (CALL_P (insn))
1985 instantiate_virtual_regs_in_rtx (&CALL_INSN_FUNCTION_USAGE (insn));
1986 }
1987
1988 /* Instantiate the virtual registers in the DECLs for debugging purposes. */
1989 instantiate_decls (current_function_decl);
1990
1991 targetm.instantiate_decls ();
1992
1993 /* Indicate that, from now on, assign_stack_local should use
1994 frame_pointer_rtx. */
1995 virtuals_instantiated = 1;
1996
1997 return 0;
1998 }
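/* For reference, a sketch of the replacement applied by this pass (the
   substitution itself is done by instantiate_new_reg earlier in this
   file; which hard pointer register is used depends on the target and on
   whether a frame pointer is needed):

     virtual-incoming-args   becomes   arg pointer    + in_arg_offset
     virtual-stack-vars      becomes   frame pointer  + var_offset
     virtual-stack-dynamic   becomes   stack pointer  + dynamic_offset
     virtual-outgoing-args   becomes   stack pointer  + out_arg_offset
     virtual-cfa             becomes   CFA base       + cfa_offset  */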
1999
2000 namespace {
2001
2002 const pass_data pass_data_instantiate_virtual_regs =
2003 {
2004 RTL_PASS, /* type */
2005 "vregs", /* name */
2006 OPTGROUP_NONE, /* optinfo_flags */
2007 TV_NONE, /* tv_id */
2008 0, /* properties_required */
2009 0, /* properties_provided */
2010 0, /* properties_destroyed */
2011 0, /* todo_flags_start */
2012 0, /* todo_flags_finish */
2013 };
2014
2015 class pass_instantiate_virtual_regs : public rtl_opt_pass
2016 {
2017 public:
2018 pass_instantiate_virtual_regs (gcc::context *ctxt)
2019 : rtl_opt_pass (pass_data_instantiate_virtual_regs, ctxt)
2020 {}
2021
2022 /* opt_pass methods: */
2023 virtual unsigned int execute (function *)
2024 {
2025 return instantiate_virtual_regs ();
2026 }
2027
2028 }; // class pass_instantiate_virtual_regs
2029
2030 } // anon namespace
2031
2032 rtl_opt_pass *
2033 make_pass_instantiate_virtual_regs (gcc::context *ctxt)
2034 {
2035 return new pass_instantiate_virtual_regs (ctxt);
2036 }
2037
2038 \f
2039 /* Return 1 if EXP is an aggregate type (or a value with aggregate type).
2040 This means a type for which function calls must pass an address to the
2041 function or get an address back from the function.
2042 EXP may be a type node or an expression (whose type is tested). */
2043
2044 int
2045 aggregate_value_p (const_tree exp, const_tree fntype)
2046 {
2047 const_tree type = (TYPE_P (exp)) ? exp : TREE_TYPE (exp);
2048 int i, regno, nregs;
2049 rtx reg;
2050
2051 if (fntype)
2052 switch (TREE_CODE (fntype))
2053 {
2054 case CALL_EXPR:
2055 {
2056 tree fndecl = get_callee_fndecl (fntype);
2057 if (fndecl)
2058 fntype = TREE_TYPE (fndecl);
2059 else if (CALL_EXPR_FN (fntype))
2060 fntype = TREE_TYPE (TREE_TYPE (CALL_EXPR_FN (fntype)));
2061 else
2062 /* For internal functions, assume nothing needs to be
2063 returned in memory. */
2064 return 0;
2065 }
2066 break;
2067 case FUNCTION_DECL:
2068 fntype = TREE_TYPE (fntype);
2069 break;
2070 case FUNCTION_TYPE:
2071 case METHOD_TYPE:
2072 break;
2073 case IDENTIFIER_NODE:
2074 fntype = NULL_TREE;
2075 break;
2076 default:
2077 /* We don't expect other tree types here. */
2078 gcc_unreachable ();
2079 }
2080
2081 if (VOID_TYPE_P (type))
2082 return 0;
2083
2084 /* If a record should be passed the same as its first (and only) member,
2085 don't pass it as an aggregate. */
2086 if (TREE_CODE (type) == RECORD_TYPE && TYPE_TRANSPARENT_AGGR (type))
2087 return aggregate_value_p (first_field (type), fntype);
2088
2089 /* If the front end has decided that this needs to be passed by
2090 reference, do so. */
2091 if ((TREE_CODE (exp) == PARM_DECL || TREE_CODE (exp) == RESULT_DECL)
2092 && DECL_BY_REFERENCE (exp))
2093 return 1;
2094
2095 /* Function types that are TREE_ADDRESSABLE force return in memory. */
2096 if (fntype && TREE_ADDRESSABLE (fntype))
2097 return 1;
2098
2099 /* Types that are TREE_ADDRESSABLE must be constructed in memory,
2100 and thus can't be returned in registers. */
2101 if (TREE_ADDRESSABLE (type))
2102 return 1;
2103
2104 if (TYPE_EMPTY_P (type))
2105 return 0;
2106
2107 if (flag_pcc_struct_return && AGGREGATE_TYPE_P (type))
2108 return 1;
2109
2110 if (targetm.calls.return_in_memory (type, fntype))
2111 return 1;
2112
2113 /* Make sure we have suitable call-clobbered regs to return
2114 the value in; if not, we must return it in memory. */
2115 reg = hard_function_value (type, 0, fntype, 0);
2116
2117 /* If we have something other than a REG (e.g. a PARALLEL), then assume
2118 it is OK. */
2119 if (!REG_P (reg))
2120 return 0;
2121
2122 regno = REGNO (reg);
2123 nregs = hard_regno_nregs (regno, TYPE_MODE (type));
2124 for (i = 0; i < nregs; i++)
2125 if (! call_used_regs[regno + i])
2126 return 1;
2127
2128 return 0;
2129 }
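/* For example (a sketch; whether a particular type really ends up in
   memory is decided by the checks above and by the target hooks), a
   function returning a large aggregate,

     struct big { int v[16]; };
     struct big f (void);

   is effectively compiled as if its prototype were

     void f (struct big *hidden_return);

   where the parameter name is purely illustrative and the caller supplies
   the address that receives the result; that is the situation this
   predicate reports by returning 1.  */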
2130 \f
2131 /* Return true if we should assign DECL a pseudo register; false if it
2132 should live on the local stack. */
2133
2134 bool
2135 use_register_for_decl (const_tree decl)
2136 {
2137 if (TREE_CODE (decl) == SSA_NAME)
2138 {
2139 /* We often try to use the SSA_NAME, instead of its underlying
2140 decl, to get type information and guide decisions, to avoid
2141 differences of behavior between anonymous and named
2142 variables, but in this one case we have to go for the actual
2143 variable if there is one. The main reason is that, at least
2144 at -O0, we want to place user variables on the stack, but we
2145 don't mind using pseudos for anonymous or ignored temps.
2146 Should we take the SSA_NAME, we'd conclude all SSA_NAMEs
2147 should go in pseudos, whereas their corresponding variables
2148 might have to go on the stack. So, disregarding the decl
2149 here would negatively impact debug info at -O0, enable
2150 coalescing between SSA_NAMEs that ought to get different
2151 stack/pseudo assignments, and get the incoming argument
2152 processing thoroughly confused by PARM_DECLs expected to live
2153 in stack slots but assigned to pseudos. */
2154 if (!SSA_NAME_VAR (decl))
2155 return TYPE_MODE (TREE_TYPE (decl)) != BLKmode
2156 && !(flag_float_store && FLOAT_TYPE_P (TREE_TYPE (decl)));
2157
2158 decl = SSA_NAME_VAR (decl);
2159 }
2160
2161 /* Honor volatile. */
2162 if (TREE_SIDE_EFFECTS (decl))
2163 return false;
2164
2165 /* Honor addressability. */
2166 if (TREE_ADDRESSABLE (decl))
2167 return false;
2168
2169 /* RESULT_DECLs are a bit special in that they're assigned without
2170 regard to use_register_for_decl, but we generally only store in
2171 them. If we coalesce their SSA NAMEs, we'd better return a
2172 result that matches the assignment in expand_function_start. */
2173 if (TREE_CODE (decl) == RESULT_DECL)
2174 {
2175 /* If it's not an aggregate, we're going to use a REG or a
2176 PARALLEL containing a REG. */
2177 if (!aggregate_value_p (decl, current_function_decl))
2178 return true;
2179
2180 /* If expand_function_start determines the return value, we'll
2181 use MEM if it's not by reference. */
2182 if (cfun->returns_pcc_struct
2183 || (targetm.calls.struct_value_rtx
2184 (TREE_TYPE (current_function_decl), 1)))
2185 return DECL_BY_REFERENCE (decl);
2186
2187 /* Otherwise, we're taking an extra all.function_result_decl
2188 argument. It's set up in assign_parms_augmented_arg_list,
2189 under the (negated) conditions above, and then it's used to
2190 set up the RESULT_DECL rtl in assign_parms, after looping
2191 over all parameters. Now, if the RESULT_DECL is not by
2192 reference, we'll use a MEM either way. */
2193 if (!DECL_BY_REFERENCE (decl))
2194 return false;
2195
2196 /* Otherwise, if RESULT_DECL is DECL_BY_REFERENCE, it will take
2197 the function_result_decl's assignment. Since it's a pointer,
2198 we can short-circuit a number of the tests below, and we must
2199 duplicate them because we don't have the
2200 function_result_decl to test. */
2201 if (!targetm.calls.allocate_stack_slots_for_args ())
2202 return true;
2203 /* We don't set DECL_IGNORED_P for the function_result_decl. */
2204 if (optimize)
2205 return true;
2206 /* We don't set DECL_REGISTER for the function_result_decl. */
2207 return false;
2208 }
2209
2210 /* Only register-like things go in registers. */
2211 if (DECL_MODE (decl) == BLKmode)
2212 return false;
2213
2214 /* If -ffloat-store specified, don't put explicit float variables
2215 into registers. */
2216 /* ??? This should be checked after DECL_ARTIFICIAL, but tree-ssa
2217 propagates values across these stores, and it probably shouldn't. */
2218 if (flag_float_store && FLOAT_TYPE_P (TREE_TYPE (decl)))
2219 return false;
2220
2221 if (!targetm.calls.allocate_stack_slots_for_args ())
2222 return true;
2223
2224 /* If we're not interested in tracking debugging information for
2225 this decl, then we can certainly put it in a register. */
2226 if (DECL_IGNORED_P (decl))
2227 return true;
2228
2229 if (optimize)
2230 return true;
2231
2232 if (!DECL_REGISTER (decl))
2233 return false;
2234
2235 /* When not optimizing, disregard register keyword for types that
2236 could have methods, otherwise the methods won't be callable from
2237 the debugger. */
2238 if (RECORD_OR_UNION_TYPE_P (TREE_TYPE (decl)))
2239 return false;
2240
2241 return true;
2242 }
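/* Some source-level examples of the decision above, assuming -O0 and the
   default target hooks (a sketch; other targets or options can change the
   outcome):

     volatile int a;          TREE_SIDE_EFFECTS          -> stack
     int b; ...; use (&b);    TREE_ADDRESSABLE           -> stack
     struct S c;              BLKmode                    -> stack
     int d;                   plain user variable        -> stack
     register int e;          DECL_REGISTER              -> pseudo
     compiler temporaries     DECL_IGNORED_P             -> pseudo  */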
2243
2244 /* Structures to communicate between the subroutines of assign_parms.
2245 The first holds data persistent across all parameters, the second
2246 is cleared out for each parameter. */
2247
2248 struct assign_parm_data_all
2249 {
2250 /* When INIT_CUMULATIVE_ARGS gets revamped, allocating CUMULATIVE_ARGS
2251 should become a job of the target or be otherwise encapsulated. */
2252 CUMULATIVE_ARGS args_so_far_v;
2253 cumulative_args_t args_so_far;
2254 struct args_size stack_args_size;
2255 tree function_result_decl;
2256 tree orig_fnargs;
2257 rtx_insn *first_conversion_insn;
2258 rtx_insn *last_conversion_insn;
2259 HOST_WIDE_INT pretend_args_size;
2260 HOST_WIDE_INT extra_pretend_bytes;
2261 int reg_parm_stack_space;
2262 };
2263
2264 struct assign_parm_data_one
2265 {
2266 tree nominal_type;
2267 tree passed_type;
2268 rtx entry_parm;
2269 rtx stack_parm;
2270 machine_mode nominal_mode;
2271 machine_mode passed_mode;
2272 machine_mode promoted_mode;
2273 struct locate_and_pad_arg_data locate;
2274 int partial;
2275 BOOL_BITFIELD named_arg : 1;
2276 BOOL_BITFIELD passed_pointer : 1;
2277 };
2278
2279 /* A subroutine of assign_parms. Initialize ALL. */
2280
2281 static void
2282 assign_parms_initialize_all (struct assign_parm_data_all *all)
2283 {
2284 tree fntype ATTRIBUTE_UNUSED;
2285
2286 memset (all, 0, sizeof (*all));
2287
2288 fntype = TREE_TYPE (current_function_decl);
2289
2290 #ifdef INIT_CUMULATIVE_INCOMING_ARGS
2291 INIT_CUMULATIVE_INCOMING_ARGS (all->args_so_far_v, fntype, NULL_RTX);
2292 #else
2293 INIT_CUMULATIVE_ARGS (all->args_so_far_v, fntype, NULL_RTX,
2294 current_function_decl, -1);
2295 #endif
2296 all->args_so_far = pack_cumulative_args (&all->args_so_far_v);
2297
2298 #ifdef INCOMING_REG_PARM_STACK_SPACE
2299 all->reg_parm_stack_space
2300 = INCOMING_REG_PARM_STACK_SPACE (current_function_decl);
2301 #endif
2302 }
2303
2304 /* If ARGS contains entries with complex types, split each such entry into
2305 two entries of the component type. The vector is updated in place rather
2306 than a new list being returned. */
2307
2308 static void
2309 split_complex_args (vec<tree> *args)
2310 {
2311 unsigned i;
2312 tree p;
2313
2314 FOR_EACH_VEC_ELT (*args, i, p)
2315 {
2316 tree type = TREE_TYPE (p);
2317 if (TREE_CODE (type) == COMPLEX_TYPE
2318 && targetm.calls.split_complex_arg (type))
2319 {
2320 tree decl;
2321 tree subtype = TREE_TYPE (type);
2322 bool addressable = TREE_ADDRESSABLE (p);
2323
2324 /* Rewrite the PARM_DECL's type with its component. */
2325 p = copy_node (p);
2326 TREE_TYPE (p) = subtype;
2327 DECL_ARG_TYPE (p) = TREE_TYPE (DECL_ARG_TYPE (p));
2328 SET_DECL_MODE (p, VOIDmode);
2329 DECL_SIZE (p) = NULL;
2330 DECL_SIZE_UNIT (p) = NULL;
2331 /* If this arg must go in memory, put it in a pseudo here.
2332 We can't allow it to go in memory as per normal parms,
2333 because the usual place might not have the imag part
2334 adjacent to the real part. */
2335 DECL_ARTIFICIAL (p) = addressable;
2336 DECL_IGNORED_P (p) = addressable;
2337 TREE_ADDRESSABLE (p) = 0;
2338 layout_decl (p, 0);
2339 (*args)[i] = p;
2340
2341 /* Build a second synthetic decl. */
2342 decl = build_decl (EXPR_LOCATION (p),
2343 PARM_DECL, NULL_TREE, subtype);
2344 DECL_ARG_TYPE (decl) = DECL_ARG_TYPE (p);
2345 DECL_ARTIFICIAL (decl) = addressable;
2346 DECL_IGNORED_P (decl) = addressable;
2347 layout_decl (decl, 0);
2348 args->safe_insert (++i, decl);
2349 }
2350 }
2351 }
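/* As an illustration (a sketch; whether any splitting happens at all is
   up to targetm.calls.split_complex_arg), a parameter list such as

     void f (_Complex double z, int n);

   is rewritten here into the equivalent of

     void f (double z_re, double z_im, int n);

   where the names are purely illustrative: the original PARM_DECL is
   narrowed to the component type and a second, nameless synthetic
   PARM_DECL is inserted immediately after it.  The two halves are glued
   back together later by assign_parms_unsplit_complex.  */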
2352
2353 /* A subroutine of assign_parms. Adjust the parameter list to incorporate
2354 the hidden struct return argument, and (abi willing) complex args.
2355 Return the new parameter list. */
2356
2357 static vec<tree>
2358 assign_parms_augmented_arg_list (struct assign_parm_data_all *all)
2359 {
2360 tree fndecl = current_function_decl;
2361 tree fntype = TREE_TYPE (fndecl);
2362 vec<tree> fnargs = vNULL;
2363 tree arg;
2364
2365 for (arg = DECL_ARGUMENTS (fndecl); arg; arg = DECL_CHAIN (arg))
2366 fnargs.safe_push (arg);
2367
2368 all->orig_fnargs = DECL_ARGUMENTS (fndecl);
2369
2370 /* If struct value address is treated as the first argument, make it so. */
2371 if (aggregate_value_p (DECL_RESULT (fndecl), fndecl)
2372 && ! cfun->returns_pcc_struct
2373 && targetm.calls.struct_value_rtx (TREE_TYPE (fndecl), 1) == 0)
2374 {
2375 tree type = build_pointer_type (TREE_TYPE (fntype));
2376 tree decl;
2377
2378 decl = build_decl (DECL_SOURCE_LOCATION (fndecl),
2379 PARM_DECL, get_identifier (".result_ptr"), type);
2380 DECL_ARG_TYPE (decl) = type;
2381 DECL_ARTIFICIAL (decl) = 1;
2382 DECL_NAMELESS (decl) = 1;
2383 TREE_CONSTANT (decl) = 1;
2384 /* We don't set DECL_IGNORED_P or DECL_REGISTER here. If this
2385 changes, the end of the RESULT_DECL handling block in
2386 use_register_for_decl must be adjusted to match. */
2387
2388 DECL_CHAIN (decl) = all->orig_fnargs;
2389 all->orig_fnargs = decl;
2390 fnargs.safe_insert (0, decl);
2391
2392 all->function_result_decl = decl;
2393 }
2394
2395 /* If the target wants to split complex arguments into scalars, do so. */
2396 if (targetm.calls.split_complex_arg)
2397 split_complex_args (&fnargs);
2398
2399 return fnargs;
2400 }
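/* As an illustration of the struct-return handling above (a sketch; it
   only applies when the target reports no special struct_value_rtx and
   the result really must be returned in memory), a function

     struct big f (int n);

   is treated as if its parameter list were

     f (struct big *.result_ptr, int n)

   where ".result_ptr" is the artificial PARM_DECL built above and
   remembered in all->function_result_decl.  */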
2401
2402 /* A subroutine of assign_parms. Examine PARM and pull out type and mode
2403 data for the parameter. Incorporate ABI specifics such as pass-by-
2404 reference and type promotion. */
2405
2406 static void
2407 assign_parm_find_data_types (struct assign_parm_data_all *all, tree parm,
2408 struct assign_parm_data_one *data)
2409 {
2410 tree nominal_type, passed_type;
2411 machine_mode nominal_mode, passed_mode, promoted_mode;
2412 int unsignedp;
2413
2414 memset (data, 0, sizeof (*data));
2415
2416 /* NAMED_ARG is a misnomer. We really mean 'non-variadic'. */
2417 if (!cfun->stdarg)
2418 data->named_arg = 1; /* No variadic parms. */
2419 else if (DECL_CHAIN (parm))
2420 data->named_arg = 1; /* Not the last non-variadic parm. */
2421 else if (targetm.calls.strict_argument_naming (all->args_so_far))
2422 data->named_arg = 1; /* Only variadic ones are unnamed. */
2423 else
2424 data->named_arg = 0; /* Treat as variadic. */
2425
2426 nominal_type = TREE_TYPE (parm);
2427 passed_type = DECL_ARG_TYPE (parm);
2428
2429 /* Look out for errors propagating this far. Also, if the parameter's
2430 type is void then its value doesn't matter. */
2431 if (TREE_TYPE (parm) == error_mark_node
2432 /* This can happen after weird syntax errors
2433 or if an enum type is defined among the parms. */
2434 || TREE_CODE (parm) != PARM_DECL
2435 || passed_type == NULL
2436 || VOID_TYPE_P (nominal_type))
2437 {
2438 nominal_type = passed_type = void_type_node;
2439 nominal_mode = passed_mode = promoted_mode = VOIDmode;
2440 goto egress;
2441 }
2442
2443 /* Find mode of arg as it is passed, and mode of arg as it should be
2444 during execution of this function. */
2445 passed_mode = TYPE_MODE (passed_type);
2446 nominal_mode = TYPE_MODE (nominal_type);
2447
2448 /* If the parm is to be passed as a transparent union or record, use the
2449 type of the first field for the tests below. We have already verified
2450 that the modes are the same. */
2451 if ((TREE_CODE (passed_type) == UNION_TYPE
2452 || TREE_CODE (passed_type) == RECORD_TYPE)
2453 && TYPE_TRANSPARENT_AGGR (passed_type))
2454 passed_type = TREE_TYPE (first_field (passed_type));
2455
2456 /* See if this arg was passed by invisible reference. */
2457 if (pass_by_reference (&all->args_so_far_v, passed_mode,
2458 passed_type, data->named_arg))
2459 {
2460 passed_type = nominal_type = build_pointer_type (passed_type);
2461 data->passed_pointer = true;
2462 passed_mode = nominal_mode = TYPE_MODE (nominal_type);
2463 }
2464
2465 /* Find mode as it is passed by the ABI. */
2466 unsignedp = TYPE_UNSIGNED (passed_type);
2467 promoted_mode = promote_function_mode (passed_type, passed_mode, &unsignedp,
2468 TREE_TYPE (current_function_decl), 0);
2469
2470 egress:
2471 data->nominal_type = nominal_type;
2472 data->passed_type = passed_type;
2473 data->nominal_mode = nominal_mode;
2474 data->passed_mode = passed_mode;
2475 data->promoted_mode = promoted_mode;
2476 }
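/* Two sketches of what gets recorded here (the actual decisions are made
   by the pass_by_reference and promote_function_mode hooks, so the modes
   below are only illustrative):

     void f (short s);        nominal_mode is HImode; promoted_mode may be
                              SImode if the ABI extends small integers, so
                              the value arrives already widened.

     void g (struct big x);   if the ABI passes X by invisible reference,
                              passed_type and nominal_type both become
                              "struct big *", passed_pointer is set, and
                              the modes become the pointer mode.  */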
2477
2478 /* A subroutine of assign_parms. Invoke setup_incoming_varargs. */
2479
2480 static void
2481 assign_parms_setup_varargs (struct assign_parm_data_all *all,
2482 struct assign_parm_data_one *data, bool no_rtl)
2483 {
2484 int varargs_pretend_bytes = 0;
2485
2486 targetm.calls.setup_incoming_varargs (all->args_so_far,
2487 data->promoted_mode,
2488 data->passed_type,
2489 &varargs_pretend_bytes, no_rtl);
2490
2491 /* If the back-end has requested extra stack space, record how much is
2492 needed. Do not change pretend_args_size otherwise since it may be
2493 nonzero from an earlier partial argument. */
2494 if (varargs_pretend_bytes > 0)
2495 all->pretend_args_size = varargs_pretend_bytes;
2496 }
2497
2498 /* A subroutine of assign_parms. Set DATA->ENTRY_PARM corresponding to
2499 the incoming location of the current parameter. */
2500
2501 static void
2502 assign_parm_find_entry_rtl (struct assign_parm_data_all *all,
2503 struct assign_parm_data_one *data)
2504 {
2505 HOST_WIDE_INT pretend_bytes = 0;
2506 rtx entry_parm;
2507 bool in_regs;
2508
2509 if (data->promoted_mode == VOIDmode)
2510 {
2511 data->entry_parm = data->stack_parm = const0_rtx;
2512 return;
2513 }
2514
2515 targetm.calls.warn_parameter_passing_abi (all->args_so_far,
2516 data->passed_type);
2517
2518 entry_parm = targetm.calls.function_incoming_arg (all->args_so_far,
2519 data->promoted_mode,
2520 data->passed_type,
2521 data->named_arg);
2522
2523 if (entry_parm == 0)
2524 data->promoted_mode = data->passed_mode;
2525
2526 /* Determine parm's home in the stack, in case it arrives in the stack
2527 or we should pretend it did. Compute the stack position and rtx where
2528 the argument arrives and its size.
2529
2530 There is one complexity here: If this was a parameter that would
2531 have been passed in registers, but wasn't only because it is
2532 __builtin_va_alist, we want locate_and_pad_parm to treat it as if
2533 it came in a register so that REG_PARM_STACK_SPACE isn't skipped.
2534 In this case, we call FUNCTION_ARG with NAMED set to 1 instead of 0
2535 as it was the previous time. */
2536 in_regs = (entry_parm != 0);
2537 #ifdef STACK_PARMS_IN_REG_PARM_AREA
2538 in_regs = true;
2539 #endif
2540 if (!in_regs && !data->named_arg)
2541 {
2542 if (targetm.calls.pretend_outgoing_varargs_named (all->args_so_far))
2543 {
2544 rtx tem;
2545 tem = targetm.calls.function_incoming_arg (all->args_so_far,
2546 data->promoted_mode,
2547 data->passed_type, true);
2548 in_regs = tem != NULL;
2549 }
2550 }
2551
2552 /* If this parameter was passed both in registers and in the stack, use
2553 the copy on the stack. */
2554 if (targetm.calls.must_pass_in_stack (data->promoted_mode,
2555 data->passed_type))
2556 entry_parm = 0;
2557
2558 if (entry_parm)
2559 {
2560 int partial;
2561
2562 partial = targetm.calls.arg_partial_bytes (all->args_so_far,
2563 data->promoted_mode,
2564 data->passed_type,
2565 data->named_arg);
2566 data->partial = partial;
2567
2568 /* The caller might already have allocated stack space for the
2569 register parameters. */
2570 if (partial != 0 && all->reg_parm_stack_space == 0)
2571 {
2572 /* Part of this argument is passed in registers and part
2573 is passed on the stack. Ask the prologue code to extend
2574 the stack part so that we can recreate the full value.
2575
2576 PRETEND_BYTES is the size of the registers we need to store.
2577 CURRENT_FUNCTION_PRETEND_ARGS_SIZE is the amount of extra
2578 stack space that the prologue should allocate.
2579
2580 Internally, gcc assumes that the argument pointer is aligned
2581 to STACK_BOUNDARY bits. This is used both for alignment
2582 optimizations (see init_emit) and to locate arguments that are
2583 aligned to more than PARM_BOUNDARY bits. We must preserve this
2584 invariant by rounding CURRENT_FUNCTION_PRETEND_ARGS_SIZE up to
2585 a stack boundary. */
2586
2587 /* We assume at most one partial arg, and it must be the first
2588 argument on the stack. */
2589 gcc_assert (!all->extra_pretend_bytes && !all->pretend_args_size);
2590
2591 pretend_bytes = partial;
2592 all->pretend_args_size = CEIL_ROUND (pretend_bytes, STACK_BYTES);
2593
2594 /* We want to align relative to the actual stack pointer, so
2595 don't include this in the stack size until later. */
2596 all->extra_pretend_bytes = all->pretend_args_size;
2597 }
2598 }
2599
2600 locate_and_pad_parm (data->promoted_mode, data->passed_type, in_regs,
2601 all->reg_parm_stack_space,
2602 entry_parm ? data->partial : 0, current_function_decl,
2603 &all->stack_args_size, &data->locate);
2604
2605 /* Update parm_stack_boundary if this parameter is passed in the
2606 stack. */
2607 if (!in_regs && crtl->parm_stack_boundary < data->locate.boundary)
2608 crtl->parm_stack_boundary = data->locate.boundary;
2609
2610 /* Adjust offsets to include the pretend args. */
2611 pretend_bytes = all->extra_pretend_bytes - pretend_bytes;
2612 data->locate.slot_offset.constant += pretend_bytes;
2613 data->locate.offset.constant += pretend_bytes;
2614
2615 data->entry_parm = entry_parm;
2616 }
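/* A worked example of the pretend-args bookkeeping above (purely
   illustrative numbers, assuming STACK_BYTES == 16 and an ABI that splits
   a 24-byte argument as 16 bytes in registers plus 8 bytes on the
   stack):  arg_partial_bytes returns 16, so

     pretend_bytes          = 16
     all->pretend_args_size = CEIL_ROUND (16, 16) = 16

   and the prologue is asked to allocate those 16 bytes so that the
   register half can be stored next to the stack half and the full value
   recreated contiguously in memory.  */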
2617
2618 /* A subroutine of assign_parms. If there is actually space on the stack
2619 for this parm, count it in stack_args_size and return true. */
2620
2621 static bool
2622 assign_parm_is_stack_parm (struct assign_parm_data_all *all,
2623 struct assign_parm_data_one *data)
2624 {
2625 /* Trivially true if we've no incoming register. */
2626 if (data->entry_parm == NULL)
2627 ;
2628 /* Also true if we're partially in registers and partially not,
2629 since we've arranged to drop the entire argument on the stack. */
2630 else if (data->partial != 0)
2631 ;
2632 /* Also true if the target says that it's passed in both registers
2633 and on the stack. */
2634 else if (GET_CODE (data->entry_parm) == PARALLEL
2635 && XEXP (XVECEXP (data->entry_parm, 0, 0), 0) == NULL_RTX)
2636 ;
2637 /* Also true if the target says that there's stack allocated for
2638 all register parameters. */
2639 else if (all->reg_parm_stack_space > 0)
2640 ;
2641 /* Otherwise, no, this parameter has no ABI defined stack slot. */
2642 else
2643 return false;
2644
2645 all->stack_args_size.constant += data->locate.size.constant;
2646 if (data->locate.size.var)
2647 ADD_PARM_SIZE (all->stack_args_size, data->locate.size.var);
2648
2649 return true;
2650 }
2651
2652 /* A subroutine of assign_parms. Given that this parameter is allocated
2653 stack space by the ABI, find it. */
2654
2655 static void
2656 assign_parm_find_stack_rtl (tree parm, struct assign_parm_data_one *data)
2657 {
2658 rtx offset_rtx, stack_parm;
2659 unsigned int align, boundary;
2660
2661 /* If we're passing this arg using a reg, make its stack home the
2662 aligned stack slot. */
2663 if (data->entry_parm)
2664 offset_rtx = ARGS_SIZE_RTX (data->locate.slot_offset);
2665 else
2666 offset_rtx = ARGS_SIZE_RTX (data->locate.offset);
2667
2668 stack_parm = crtl->args.internal_arg_pointer;
2669 if (offset_rtx != const0_rtx)
2670 stack_parm = gen_rtx_PLUS (Pmode, stack_parm, offset_rtx);
2671 stack_parm = gen_rtx_MEM (data->promoted_mode, stack_parm);
2672
2673 if (!data->passed_pointer)
2674 {
2675 set_mem_attributes (stack_parm, parm, 1);
2676 /* set_mem_attributes could set MEM_SIZE to the passed mode's size,
2677 while promoted mode's size is needed. */
2678 if (data->promoted_mode != BLKmode
2679 && data->promoted_mode != DECL_MODE (parm))
2680 {
2681 set_mem_size (stack_parm, GET_MODE_SIZE (data->promoted_mode));
2682 if (MEM_EXPR (stack_parm) && MEM_OFFSET_KNOWN_P (stack_parm))
2683 {
2684 poly_int64 offset = subreg_lowpart_offset (DECL_MODE (parm),
2685 data->promoted_mode);
2686 if (maybe_ne (offset, 0))
2687 set_mem_offset (stack_parm, MEM_OFFSET (stack_parm) - offset);
2688 }
2689 }
2690 }
2691
2692 boundary = data->locate.boundary;
2693 align = BITS_PER_UNIT;
2694
2695 /* If we're padding upward, we know that the alignment of the slot
2696 is TARGET_FUNCTION_ARG_BOUNDARY. If we're using slot_offset, we're
2697 intentionally forcing upward padding. Otherwise we have to come
2698 up with a guess at the alignment based on OFFSET_RTX. */
2699 poly_int64 offset;
2700 if (data->locate.where_pad != PAD_DOWNWARD || data->entry_parm)
2701 align = boundary;
2702 else if (poly_int_rtx_p (offset_rtx, &offset))
2703 {
2704 align = least_bit_hwi (boundary);
2705 unsigned int offset_align = known_alignment (offset) * BITS_PER_UNIT;
2706 if (offset_align != 0)
2707 align = MIN (align, offset_align);
2708 }
2709 set_mem_align (stack_parm, align);
2710
2711 if (data->entry_parm)
2712 set_reg_attrs_for_parm (data->entry_parm, stack_parm);
2713
2714 data->stack_parm = stack_parm;
2715 }
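/* Schematically, the rtl built above is (a sketch; mode, offset and
   alignment depend on the parameter and the ABI)

     (mem:MODE (plus:P (reg internal-arg-pointer) (const_int OFFSET)))

   where OFFSET comes from data->locate and the internal argument pointer
   is normally still a virtual register here, to be replaced later by
   instantiate_virtual_regs.  */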
2716
2717 /* A subroutine of assign_parms. Adjust DATA->ENTRY_PARM such that it's
2718 always valid and contiguous. */
2719
2720 static void
2721 assign_parm_adjust_entry_rtl (struct assign_parm_data_one *data)
2722 {
2723 rtx entry_parm = data->entry_parm;
2724 rtx stack_parm = data->stack_parm;
2725
2726 /* If this parm was passed part in regs and part in memory, pretend it
2727 arrived entirely in memory by pushing the register-part onto the stack.
2728 In the special case of a DImode or DFmode that is split, we could put
2729 it together in a pseudoreg directly, but for now that's not worth
2730 bothering with. */
2731 if (data->partial != 0)
2732 {
2733 /* Handle calls that pass values in multiple non-contiguous
2734 locations. The Irix 6 ABI has examples of this. */
2735 if (GET_CODE (entry_parm) == PARALLEL)
2736 emit_group_store (validize_mem (copy_rtx (stack_parm)), entry_parm,
2737 data->passed_type,
2738 int_size_in_bytes (data->passed_type));
2739 else
2740 {
2741 gcc_assert (data->partial % UNITS_PER_WORD == 0);
2742 move_block_from_reg (REGNO (entry_parm),
2743 validize_mem (copy_rtx (stack_parm)),
2744 data->partial / UNITS_PER_WORD);
2745 }
2746
2747 entry_parm = stack_parm;
2748 }
2749
2750 /* If we didn't decide this parm came in a register, by default it came
2751 on the stack. */
2752 else if (entry_parm == NULL)
2753 entry_parm = stack_parm;
2754
2755 /* When an argument is passed in multiple locations, we can't make use
2756 of this information, but we can save some copying if the whole argument
2757 is passed in a single register. */
2758 else if (GET_CODE (entry_parm) == PARALLEL
2759 && data->nominal_mode != BLKmode
2760 && data->passed_mode != BLKmode)
2761 {
2762 size_t i, len = XVECLEN (entry_parm, 0);
2763
2764 for (i = 0; i < len; i++)
2765 if (XEXP (XVECEXP (entry_parm, 0, i), 0) != NULL_RTX
2766 && REG_P (XEXP (XVECEXP (entry_parm, 0, i), 0))
2767 && (GET_MODE (XEXP (XVECEXP (entry_parm, 0, i), 0))
2768 == data->passed_mode)
2769 && INTVAL (XEXP (XVECEXP (entry_parm, 0, i), 1)) == 0)
2770 {
2771 entry_parm = XEXP (XVECEXP (entry_parm, 0, i), 0);
2772 break;
2773 }
2774 }
2775
2776 data->entry_parm = entry_parm;
2777 }
2778
2779 /* A subroutine of assign_parms. Reconstitute any values which were
2780 passed in multiple registers and would fit in a single register. */
2781
2782 static void
2783 assign_parm_remove_parallels (struct assign_parm_data_one *data)
2784 {
2785 rtx entry_parm = data->entry_parm;
2786
2787 /* Convert the PARALLEL to a REG of the same mode as the parallel.
2788 This can be done with register operations rather than on the
2789 stack, even if we will store the reconstituted parameter on the
2790 stack later. */
2791 if (GET_CODE (entry_parm) == PARALLEL && GET_MODE (entry_parm) != BLKmode)
2792 {
2793 rtx parmreg = gen_reg_rtx (GET_MODE (entry_parm));
2794 emit_group_store (parmreg, entry_parm, data->passed_type,
2795 GET_MODE_SIZE (GET_MODE (entry_parm)));
2796 entry_parm = parmreg;
2797 }
2798
2799 data->entry_parm = entry_parm;
2800 }
2801
2802 /* A subroutine of assign_parms. Adjust DATA->STACK_PARM such that it's
2803 always valid and properly aligned. */
2804
2805 static void
2806 assign_parm_adjust_stack_rtl (struct assign_parm_data_one *data)
2807 {
2808 rtx stack_parm = data->stack_parm;
2809
2810 /* If we can't trust the parm stack slot to be aligned enough for its
2811 ultimate type, don't use that slot after entry. We'll make another
2812 stack slot, if we need one. */
2813 if (stack_parm
2814 && ((GET_MODE_ALIGNMENT (data->nominal_mode) > MEM_ALIGN (stack_parm)
2815 && targetm.slow_unaligned_access (data->nominal_mode,
2816 MEM_ALIGN (stack_parm)))
2817 || (data->nominal_type
2818 && TYPE_ALIGN (data->nominal_type) > MEM_ALIGN (stack_parm)
2819 && MEM_ALIGN (stack_parm) < PREFERRED_STACK_BOUNDARY)))
2820 stack_parm = NULL;
2821
2822 /* If parm was passed in memory, and we need to convert it on entry,
2823 don't store it back in that same slot. */
2824 else if (data->entry_parm == stack_parm
2825 && data->nominal_mode != BLKmode
2826 && data->nominal_mode != data->passed_mode)
2827 stack_parm = NULL;
2828
2829 /* If stack protection is in effect for this function, don't leave any
2830 pointers in their passed stack slots. */
2831 else if (crtl->stack_protect_guard
2832 && (flag_stack_protect == 2
2833 || data->passed_pointer
2834 || POINTER_TYPE_P (data->nominal_type)))
2835 stack_parm = NULL;
2836
2837 data->stack_parm = stack_parm;
2838 }
2839
2840 /* A subroutine of assign_parms. Return true if the current parameter
2841 should be stored as a BLKmode in the current frame. */
2842
2843 static bool
2844 assign_parm_setup_block_p (struct assign_parm_data_one *data)
2845 {
2846 if (data->nominal_mode == BLKmode)
2847 return true;
2848 if (GET_MODE (data->entry_parm) == BLKmode)
2849 return true;
2850
2851 #ifdef BLOCK_REG_PADDING
2852 /* Only assign_parm_setup_block knows how to deal with register arguments
2853 that are padded at the least significant end. */
2854 if (REG_P (data->entry_parm)
2855 && known_lt (GET_MODE_SIZE (data->promoted_mode), UNITS_PER_WORD)
2856 && (BLOCK_REG_PADDING (data->passed_mode, data->passed_type, 1)
2857 == (BYTES_BIG_ENDIAN ? PAD_UPWARD : PAD_DOWNWARD)))
2858 return true;
2859 #endif
2860
2861 return false;
2862 }
2863
2864 /* A subroutine of assign_parms. Arrange for the parameter to be
2865 present and valid in DATA->STACK_PARM. */
2866
2867 static void
2868 assign_parm_setup_block (struct assign_parm_data_all *all,
2869 tree parm, struct assign_parm_data_one *data)
2870 {
2871 rtx entry_parm = data->entry_parm;
2872 rtx stack_parm = data->stack_parm;
2873 rtx target_reg = NULL_RTX;
2874 bool in_conversion_seq = false;
2875 HOST_WIDE_INT size;
2876 HOST_WIDE_INT size_stored;
2877
2878 if (GET_CODE (entry_parm) == PARALLEL)
2879 entry_parm = emit_group_move_into_temps (entry_parm);
2880
2881 /* If we want the parameter in a pseudo, don't use a stack slot. */
2882 if (is_gimple_reg (parm) && use_register_for_decl (parm))
2883 {
2884 tree def = ssa_default_def (cfun, parm);
2885 gcc_assert (def);
2886 machine_mode mode = promote_ssa_mode (def, NULL);
2887 rtx reg = gen_reg_rtx (mode);
2888 if (GET_CODE (reg) != CONCAT)
2889 stack_parm = reg;
2890 else
2891 {
2892 target_reg = reg;
2893 /* Avoid allocating a stack slot, if there isn't one
2894 preallocated by the ABI. It might seem like we should
2895 always prefer a pseudo, but converting between
2896 floating-point and integer modes goes through the stack
2897 on various machines, so it's better to use the reserved
2898 stack slot than to risk wasting it and allocating more
2899 for the conversion. */
2900 if (stack_parm == NULL_RTX)
2901 {
2902 int save = generating_concat_p;
2903 generating_concat_p = 0;
2904 stack_parm = gen_reg_rtx (mode);
2905 generating_concat_p = save;
2906 }
2907 }
2908 data->stack_parm = NULL;
2909 }
2910
2911 size = int_size_in_bytes (data->passed_type);
2912 size_stored = CEIL_ROUND (size, UNITS_PER_WORD);
2913 if (stack_parm == 0)
2914 {
2915 HOST_WIDE_INT parm_align
2916 = (STRICT_ALIGNMENT
2917 ? MAX (DECL_ALIGN (parm), BITS_PER_WORD) : DECL_ALIGN (parm));
2918
2919 SET_DECL_ALIGN (parm, parm_align);
2920 if (DECL_ALIGN (parm) > MAX_SUPPORTED_STACK_ALIGNMENT)
2921 {
2922 rtx allocsize = gen_int_mode (size_stored, Pmode);
2923 get_dynamic_stack_size (&allocsize, 0, DECL_ALIGN (parm), NULL);
2924 stack_parm = assign_stack_local (BLKmode, UINTVAL (allocsize),
2925 MAX_SUPPORTED_STACK_ALIGNMENT);
2926 rtx addr = align_dynamic_address (XEXP (stack_parm, 0),
2927 DECL_ALIGN (parm));
2928 mark_reg_pointer (addr, DECL_ALIGN (parm));
2929 stack_parm = gen_rtx_MEM (GET_MODE (stack_parm), addr);
2930 MEM_NOTRAP_P (stack_parm) = 1;
2931 }
2932 else
2933 stack_parm = assign_stack_local (BLKmode, size_stored,
2934 DECL_ALIGN (parm));
2935 if (known_eq (GET_MODE_SIZE (GET_MODE (entry_parm)), size))
2936 PUT_MODE (stack_parm, GET_MODE (entry_parm));
2937 set_mem_attributes (stack_parm, parm, 1);
2938 }
2939
2940 /* If a BLKmode arrives in registers, copy it to a stack slot. Handle
2941 calls that pass values in multiple non-contiguous locations. */
2942 if (REG_P (entry_parm) || GET_CODE (entry_parm) == PARALLEL)
2943 {
2944 rtx mem;
2945
2946 /* Note that we will be storing an integral number of words.
2947 So we have to be careful to ensure that we allocate an
2948 integral number of words. We do this above when we call
2949 assign_stack_local if space was not allocated in the argument
2950 list. If it was, this will not work if PARM_BOUNDARY is not
2951 a multiple of BITS_PER_WORD. It isn't clear how to fix this
2952 if it becomes a problem. Exception is when BLKmode arrives
2953 with arguments not conforming to word_mode. */
2954
2955 if (data->stack_parm == 0)
2956 ;
2957 else if (GET_CODE (entry_parm) == PARALLEL)
2958 ;
2959 else
2960 gcc_assert (!size || !(PARM_BOUNDARY % BITS_PER_WORD));
2961
2962 mem = validize_mem (copy_rtx (stack_parm));
2963
2964 /* Handle values in multiple non-contiguous locations. */
2965 if (GET_CODE (entry_parm) == PARALLEL && !MEM_P (mem))
2966 emit_group_store (mem, entry_parm, data->passed_type, size);
2967 else if (GET_CODE (entry_parm) == PARALLEL)
2968 {
2969 push_to_sequence2 (all->first_conversion_insn,
2970 all->last_conversion_insn);
2971 emit_group_store (mem, entry_parm, data->passed_type, size);
2972 all->first_conversion_insn = get_insns ();
2973 all->last_conversion_insn = get_last_insn ();
2974 end_sequence ();
2975 in_conversion_seq = true;
2976 }
2977
2978 else if (size == 0)
2979 ;
2980
2981 /* If SIZE is that of a mode no bigger than a word, just use
2982 that mode's store operation. */
2983 else if (size <= UNITS_PER_WORD)
2984 {
2985 unsigned int bits = size * BITS_PER_UNIT;
2986 machine_mode mode = int_mode_for_size (bits, 0).else_blk ();
2987
2988 if (mode != BLKmode
2989 #ifdef BLOCK_REG_PADDING
2990 && (size == UNITS_PER_WORD
2991 || (BLOCK_REG_PADDING (mode, data->passed_type, 1)
2992 != (BYTES_BIG_ENDIAN ? PAD_UPWARD : PAD_DOWNWARD)))
2993 #endif
2994 )
2995 {
2996 rtx reg;
2997
2998 /* We are really truncating a word_mode value containing
2999 SIZE bytes into a value of mode MODE. If such an
3000 operation requires no actual instructions, we can refer
3001 to the value directly in mode MODE, otherwise we must
3002 start with the register in word_mode and explicitly
3003 convert it. */
3004 if (targetm.truly_noop_truncation (size * BITS_PER_UNIT,
3005 BITS_PER_WORD))
3006 reg = gen_rtx_REG (mode, REGNO (entry_parm));
3007 else
3008 {
3009 reg = gen_rtx_REG (word_mode, REGNO (entry_parm));
3010 reg = convert_to_mode (mode, copy_to_reg (reg), 1);
3011 }
3012 emit_move_insn (change_address (mem, mode, 0), reg);
3013 }
3014
3015 #ifdef BLOCK_REG_PADDING
3016 /* Storing the register in memory as a full word, as
3017 move_block_from_reg below would do, and then using the
3018 MEM in a smaller mode, has the effect of shifting right
3019 if BYTES_BIG_ENDIAN. If we're bypassing memory, the
3020 shifting must be explicit. */
3021 else if (!MEM_P (mem))
3022 {
3023 rtx x;
3024
3025 /* If the assert below fails, we should have taken the
3026 mode != BLKmode path above, unless we have downward
3027 padding of smaller-than-word arguments on a machine
3028 with little-endian bytes, which would likely require
3029 additional changes to work correctly. */
3030 gcc_checking_assert (BYTES_BIG_ENDIAN
3031 && (BLOCK_REG_PADDING (mode,
3032 data->passed_type, 1)
3033 == PAD_UPWARD));
3034
3035 int by = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
3036
3037 x = gen_rtx_REG (word_mode, REGNO (entry_parm));
3038 x = expand_shift (RSHIFT_EXPR, word_mode, x, by,
3039 NULL_RTX, 1);
3040 x = force_reg (word_mode, x);
3041 x = gen_lowpart_SUBREG (GET_MODE (mem), x);
3042
3043 emit_move_insn (mem, x);
3044 }
3045 #endif
3046
3047 /* Blocks smaller than a word on a BYTES_BIG_ENDIAN
3048 machine must be aligned to the left before storing
3049 to memory. Note that the previous test doesn't
3050 handle all cases (e.g. SIZE == 3). */
3051 else if (size != UNITS_PER_WORD
3052 #ifdef BLOCK_REG_PADDING
3053 && (BLOCK_REG_PADDING (mode, data->passed_type, 1)
3054 == PAD_DOWNWARD)
3055 #else
3056 && BYTES_BIG_ENDIAN
3057 #endif
3058 )
3059 {
3060 rtx tem, x;
3061 int by = (UNITS_PER_WORD - size) * BITS_PER_UNIT;
3062 rtx reg = gen_rtx_REG (word_mode, REGNO (entry_parm));
3063
3064 x = expand_shift (LSHIFT_EXPR, word_mode, reg, by, NULL_RTX, 1);
3065 tem = change_address (mem, word_mode, 0);
3066 emit_move_insn (tem, x);
3067 }
3068 else
3069 move_block_from_reg (REGNO (entry_parm), mem,
3070 size_stored / UNITS_PER_WORD);
3071 }
3072 else if (!MEM_P (mem))
3073 {
3074 gcc_checking_assert (size > UNITS_PER_WORD);
3075 #ifdef BLOCK_REG_PADDING
3076 gcc_checking_assert (BLOCK_REG_PADDING (GET_MODE (mem),
3077 data->passed_type, 0)
3078 == PAD_UPWARD);
3079 #endif
3080 emit_move_insn (mem, entry_parm);
3081 }
3082 else
3083 move_block_from_reg (REGNO (entry_parm), mem,
3084 size_stored / UNITS_PER_WORD);
3085 }
3086 else if (data->stack_parm == 0)
3087 {
3088 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
3089 emit_block_move (stack_parm, data->entry_parm, GEN_INT (size),
3090 BLOCK_OP_NORMAL);
3091 all->first_conversion_insn = get_insns ();
3092 all->last_conversion_insn = get_last_insn ();
3093 end_sequence ();
3094 in_conversion_seq = true;
3095 }
3096
3097 if (target_reg)
3098 {
3099 if (!in_conversion_seq)
3100 emit_move_insn (target_reg, stack_parm);
3101 else
3102 {
3103 push_to_sequence2 (all->first_conversion_insn,
3104 all->last_conversion_insn);
3105 emit_move_insn (target_reg, stack_parm);
3106 all->first_conversion_insn = get_insns ();
3107 all->last_conversion_insn = get_last_insn ();
3108 end_sequence ();
3109 }
3110 stack_parm = target_reg;
3111 }
3112
3113 data->stack_parm = stack_parm;
3114 set_parm_rtl (parm, stack_parm);
3115 }
3116
3117 /* A subroutine of assign_parms. Allocate a pseudo to hold the current
3118 parameter. Get it there. Perform all ABI specified conversions. */
3119
3120 static void
3121 assign_parm_setup_reg (struct assign_parm_data_all *all, tree parm,
3122 struct assign_parm_data_one *data)
3123 {
3124 rtx parmreg, validated_mem;
3125 rtx equiv_stack_parm;
3126 machine_mode promoted_nominal_mode;
3127 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (parm));
3128 bool did_conversion = false;
3129 bool need_conversion, moved;
3130 enum insn_code icode;
3131 rtx rtl;
3132
3133 /* Store the parm in a pseudoregister during the function, but we may
3134 need to do it in a wider mode. Using 2 here makes the result
3135 consistent with promote_decl_mode and thus expand_expr_real_1. */
3136 promoted_nominal_mode
3137 = promote_function_mode (data->nominal_type, data->nominal_mode, &unsignedp,
3138 TREE_TYPE (current_function_decl), 2);
3139
3140 parmreg = gen_reg_rtx (promoted_nominal_mode);
3141 if (!DECL_ARTIFICIAL (parm))
3142 mark_user_reg (parmreg);
3143
3144 /* If this was an item that we received a pointer to,
3145 set rtl appropriately. */
3146 if (data->passed_pointer)
3147 {
3148 rtl = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data->passed_type)), parmreg);
3149 set_mem_attributes (rtl, parm, 1);
3150 }
3151 else
3152 rtl = parmreg;
3153
3154 assign_parm_remove_parallels (data);
3155
3156 /* Copy the value into the register, thus bridging between
3157 assign_parm_find_data_types and expand_expr_real_1. */
3158
3159 equiv_stack_parm = data->stack_parm;
3160 validated_mem = validize_mem (copy_rtx (data->entry_parm));
3161
3162 need_conversion = (data->nominal_mode != data->passed_mode
3163 || promoted_nominal_mode != data->promoted_mode);
3164 moved = false;
3165
3166 if (need_conversion
3167 && GET_MODE_CLASS (data->nominal_mode) == MODE_INT
3168 && data->nominal_mode == data->passed_mode
3169 && data->nominal_mode == GET_MODE (data->entry_parm))
3170 {
3171 /* ENTRY_PARM has been converted to PROMOTED_MODE, its
3172 mode, by the caller. We now have to convert it to
3173 NOMINAL_MODE, if different. However, PARMREG may be in
3174 a different mode than NOMINAL_MODE if it is being stored
3175 promoted.
3176
3177 If ENTRY_PARM is a hard register, it might be in a register
3178 not valid for operating in its mode (e.g., an odd-numbered
3179 register for a DFmode). In that case, moves are the only
3180 thing valid, so we can't do a convert from there. This
3181 occurs when the calling sequence allow such misaligned
3182 usages.
3183
3184 In addition, the conversion may involve a call, which could
3185 clobber parameters which haven't been copied to pseudo
3186 registers yet.
3187
3188 First, we try to emit an insn which performs the necessary
3189 conversion. We verify that this insn does not clobber any
3190 hard registers. */
3191
3192 rtx op0, op1;
3193
3194 icode = can_extend_p (promoted_nominal_mode, data->passed_mode,
3195 unsignedp);
3196
3197 op0 = parmreg;
3198 op1 = validated_mem;
3199 if (icode != CODE_FOR_nothing
3200 && insn_operand_matches (icode, 0, op0)
3201 && insn_operand_matches (icode, 1, op1))
3202 {
3203 enum rtx_code code = unsignedp ? ZERO_EXTEND : SIGN_EXTEND;
3204 rtx_insn *insn, *insns;
3205 rtx t = op1;
3206 HARD_REG_SET hardregs;
3207
3208 start_sequence ();
3209 /* If op1 is a hard register that is likely spilled, first
3210 force it into a pseudo, otherwise combiner might extend
3211 its lifetime too much. */
3212 if (GET_CODE (t) == SUBREG)
3213 t = SUBREG_REG (t);
3214 if (REG_P (t)
3215 && HARD_REGISTER_P (t)
3216 && ! TEST_HARD_REG_BIT (fixed_reg_set, REGNO (t))
3217 && targetm.class_likely_spilled_p (REGNO_REG_CLASS (REGNO (t))))
3218 {
3219 t = gen_reg_rtx (GET_MODE (op1));
3220 emit_move_insn (t, op1);
3221 }
3222 else
3223 t = op1;
3224 rtx_insn *pat = gen_extend_insn (op0, t, promoted_nominal_mode,
3225 data->passed_mode, unsignedp);
3226 emit_insn (pat);
3227 insns = get_insns ();
3228
3229 moved = true;
3230 CLEAR_HARD_REG_SET (hardregs);
3231 for (insn = insns; insn && moved; insn = NEXT_INSN (insn))
3232 {
3233 if (INSN_P (insn))
3234 note_stores (PATTERN (insn), record_hard_reg_sets,
3235 &hardregs);
3236 if (!hard_reg_set_empty_p (hardregs))
3237 moved = false;
3238 }
3239
3240 end_sequence ();
3241
3242 if (moved)
3243 {
3244 emit_insn (insns);
3245 if (equiv_stack_parm != NULL_RTX)
3246 equiv_stack_parm = gen_rtx_fmt_e (code, GET_MODE (parmreg),
3247 equiv_stack_parm);
3248 }
3249 }
3250 }
3251
3252 if (moved)
3253 /* Nothing to do. */
3254 ;
3255 else if (need_conversion)
3256 {
3257 /* We did not have an insn to convert directly, or the sequence
3258 generated appeared unsafe. We must first copy the parm to a
3259 pseudo reg, and save the conversion until after all
3260 parameters have been moved. */
3261
3262 int save_tree_used;
3263 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
3264
3265 emit_move_insn (tempreg, validated_mem);
3266
3267 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
3268 tempreg = convert_to_mode (data->nominal_mode, tempreg, unsignedp);
3269
3270 if (partial_subreg_p (tempreg)
3271 && GET_MODE (tempreg) == data->nominal_mode
3272 && REG_P (SUBREG_REG (tempreg))
3273 && data->nominal_mode == data->passed_mode
3274 && GET_MODE (SUBREG_REG (tempreg)) == GET_MODE (data->entry_parm))
3275 {
3276 /* The argument is already sign/zero extended, so note it
3277 into the subreg. */
3278 SUBREG_PROMOTED_VAR_P (tempreg) = 1;
3279 SUBREG_PROMOTED_SET (tempreg, unsignedp);
3280 }
3281
3282 /* TREE_USED gets set erroneously during expand_assignment. */
3283 save_tree_used = TREE_USED (parm);
3284 SET_DECL_RTL (parm, rtl);
3285 expand_assignment (parm, make_tree (data->nominal_type, tempreg), false);
3286 SET_DECL_RTL (parm, NULL_RTX);
3287 TREE_USED (parm) = save_tree_used;
3288 all->first_conversion_insn = get_insns ();
3289 all->last_conversion_insn = get_last_insn ();
3290 end_sequence ();
3291
3292 did_conversion = true;
3293 }
3294 else if (MEM_P (data->entry_parm)
3295 && GET_MODE_ALIGNMENT (promoted_nominal_mode)
3296 > MEM_ALIGN (data->entry_parm)
3297 && (((icode = optab_handler (movmisalign_optab,
3298 promoted_nominal_mode))
3299 != CODE_FOR_nothing)
3300 || targetm.slow_unaligned_access (promoted_nominal_mode,
3301 MEM_ALIGN (data->entry_parm))))
3302 {
3303 if (icode != CODE_FOR_nothing)
3304 emit_insn (GEN_FCN (icode) (parmreg, validated_mem));
3305 else
3306 rtl = parmreg = extract_bit_field (validated_mem,
3307 GET_MODE_BITSIZE (promoted_nominal_mode), 0,
3308 unsignedp, parmreg,
3309 promoted_nominal_mode, VOIDmode, false, NULL);
3310 }
3311 else
3312 emit_move_insn (parmreg, validated_mem);
3313
3314 /* If we were passed a pointer but the actual value can safely live
3315 in a register, retrieve it and use it directly. */
3316 if (data->passed_pointer && TYPE_MODE (TREE_TYPE (parm)) != BLKmode)
3317 {
3318 /* We can't use nominal_mode, because it will have been set to
3319 Pmode above. We must use the actual mode of the parm. */
3320 if (use_register_for_decl (parm))
3321 {
3322 parmreg = gen_reg_rtx (TYPE_MODE (TREE_TYPE (parm)));
3323 mark_user_reg (parmreg);
3324 }
3325 else
3326 {
3327 int align = STACK_SLOT_ALIGNMENT (TREE_TYPE (parm),
3328 TYPE_MODE (TREE_TYPE (parm)),
3329 TYPE_ALIGN (TREE_TYPE (parm)));
3330 parmreg
3331 = assign_stack_local (TYPE_MODE (TREE_TYPE (parm)),
3332 GET_MODE_SIZE (TYPE_MODE (TREE_TYPE (parm))),
3333 align);
3334 set_mem_attributes (parmreg, parm, 1);
3335 }
3336
3337 /* We need to preserve an address based on VIRTUAL_STACK_VARS_REGNUM for
3338 the debug info in case it is not legitimate. */
3339 if (GET_MODE (parmreg) != GET_MODE (rtl))
3340 {
3341 rtx tempreg = gen_reg_rtx (GET_MODE (rtl));
3342 int unsigned_p = TYPE_UNSIGNED (TREE_TYPE (parm));
3343
3344 push_to_sequence2 (all->first_conversion_insn,
3345 all->last_conversion_insn);
3346 emit_move_insn (tempreg, rtl);
3347 tempreg = convert_to_mode (GET_MODE (parmreg), tempreg, unsigned_p);
3348 emit_move_insn (MEM_P (parmreg) ? copy_rtx (parmreg) : parmreg,
3349 tempreg);
3350 all->first_conversion_insn = get_insns ();
3351 all->last_conversion_insn = get_last_insn ();
3352 end_sequence ();
3353
3354 did_conversion = true;
3355 }
3356 else
3357 emit_move_insn (MEM_P (parmreg) ? copy_rtx (parmreg) : parmreg, rtl);
3358
3359 rtl = parmreg;
3360
3361 /* STACK_PARM is the pointer, not the parm, and PARMREG is
3362 now the parm. */
3363 data->stack_parm = NULL;
3364 }
3365
3366 set_parm_rtl (parm, rtl);
3367
3368 /* Mark the register as eliminable if we did no conversion and it was
3369 copied from memory at a fixed offset, and the arg pointer was not
3370 copied to a pseudo-reg. If the arg pointer is a pseudo reg or the
3371 offset formed an invalid address, such memory-equivalences as we
3372 make here would screw up life analysis for it. */
3373 if (data->nominal_mode == data->passed_mode
3374 && !did_conversion
3375 && data->stack_parm != 0
3376 && MEM_P (data->stack_parm)
3377 && data->locate.offset.var == 0
3378 && reg_mentioned_p (virtual_incoming_args_rtx,
3379 XEXP (data->stack_parm, 0)))
3380 {
3381 rtx_insn *linsn = get_last_insn ();
3382 rtx_insn *sinsn;
3383 rtx set;
3384
3385 /* Mark complex types separately. */
3386 if (GET_CODE (parmreg) == CONCAT)
3387 {
3388 scalar_mode submode = GET_MODE_INNER (GET_MODE (parmreg));
3389 int regnor = REGNO (XEXP (parmreg, 0));
3390 int regnoi = REGNO (XEXP (parmreg, 1));
3391 rtx stackr = adjust_address_nv (data->stack_parm, submode, 0);
3392 rtx stacki = adjust_address_nv (data->stack_parm, submode,
3393 GET_MODE_SIZE (submode));
3394
3395 /* Scan backwards for the set of the real and
3396 imaginary parts. */
3397 for (sinsn = linsn; sinsn != 0;
3398 sinsn = prev_nonnote_insn (sinsn))
3399 {
3400 set = single_set (sinsn);
3401 if (set == 0)
3402 continue;
3403
3404 if (SET_DEST (set) == regno_reg_rtx [regnoi])
3405 set_unique_reg_note (sinsn, REG_EQUIV, stacki);
3406 else if (SET_DEST (set) == regno_reg_rtx [regnor])
3407 set_unique_reg_note (sinsn, REG_EQUIV, stackr);
3408 }
3409 }
3410 else
3411 set_dst_reg_note (linsn, REG_EQUIV, equiv_stack_parm, parmreg);
3412 }
3413
3414 /* For pointer data type, suggest pointer register. */
3415 if (POINTER_TYPE_P (TREE_TYPE (parm)))
3416 mark_reg_pointer (parmreg,
3417 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
3418 }
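/* A sketch of the common promotion case handled above (modes and register
   numbers are illustrative; the real choice is made by
   promote_function_mode): a parameter that arrives in its narrow nominal
   mode but whose pseudo is kept in a wider promoted mode, e.g.

     incoming value:      (reg:HI 0)
     promoted pseudo:     (reg:SI 90)
     insn tried first:    (set (reg:SI 90) (sign_extend:SI (reg:HI 0)))

   The single extend insn is used only if the generated sequence clobbers
   no hard registers; otherwise the value is copied to a temporary and the
   conversion is queued on all->first/last_conversion_insn so it is
   emitted after every parameter has been moved.  */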
3419
3420 /* A subroutine of assign_parms. Allocate stack space to hold the current
3421 parameter. Get it there. Perform all ABI specified conversions. */
3422
3423 static void
3424 assign_parm_setup_stack (struct assign_parm_data_all *all, tree parm,
3425 struct assign_parm_data_one *data)
3426 {
3427 /* Value must be stored in the stack slot STACK_PARM during function
3428 execution. */
3429 bool to_conversion = false;
3430
3431 assign_parm_remove_parallels (data);
3432
3433 if (data->promoted_mode != data->nominal_mode)
3434 {
3435 /* Conversion is required. */
3436 rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm));
3437
3438 emit_move_insn (tempreg, validize_mem (copy_rtx (data->entry_parm)));
3439
3440 push_to_sequence2 (all->first_conversion_insn, all->last_conversion_insn);
3441 to_conversion = true;
3442
3443 data->entry_parm = convert_to_mode (data->nominal_mode, tempreg,
3444 TYPE_UNSIGNED (TREE_TYPE (parm)));
3445
3446 if (data->stack_parm)
3447 {
3448 poly_int64 offset
3449 = subreg_lowpart_offset (data->nominal_mode,
3450 GET_MODE (data->stack_parm));
3451 /* ??? This may need a big-endian conversion on sparc64. */
3452 data->stack_parm
3453 = adjust_address (data->stack_parm, data->nominal_mode, 0);
3454 if (maybe_ne (offset, 0) && MEM_OFFSET_KNOWN_P (data->stack_parm))
3455 set_mem_offset (data->stack_parm,
3456 MEM_OFFSET (data->stack_parm) + offset);
3457 }
3458 }
3459
3460 if (data->entry_parm != data->stack_parm)
3461 {
3462 rtx src, dest;
3463
3464 if (data->stack_parm == 0)
3465 {
3466 int align = STACK_SLOT_ALIGNMENT (data->passed_type,
3467 GET_MODE (data->entry_parm),
3468 TYPE_ALIGN (data->passed_type));
3469 data->stack_parm
3470 = assign_stack_local (GET_MODE (data->entry_parm),
3471 GET_MODE_SIZE (GET_MODE (data->entry_parm)),
3472 align);
3473 set_mem_attributes (data->stack_parm, parm, 1);
3474 }
3475
3476 dest = validize_mem (copy_rtx (data->stack_parm));
3477 src = validize_mem (copy_rtx (data->entry_parm));
3478
3479 if (MEM_P (src))
3480 {
3481 /* Use a block move to handle potentially misaligned entry_parm. */
3482 if (!to_conversion)
3483 push_to_sequence2 (all->first_conversion_insn,
3484 all->last_conversion_insn);
3485 to_conversion = true;
3486
3487 emit_block_move (dest, src,
3488 GEN_INT (int_size_in_bytes (data->passed_type)),
3489 BLOCK_OP_NORMAL);
3490 }
3491 else
3492 {
3493 if (!REG_P (src))
3494 src = force_reg (GET_MODE (src), src);
3495 emit_move_insn (dest, src);
3496 }
3497 }
3498
3499 if (to_conversion)
3500 {
3501 all->first_conversion_insn = get_insns ();
3502 all->last_conversion_insn = get_last_insn ();
3503 end_sequence ();
3504 }
3505
3506 set_parm_rtl (parm, data->stack_parm);
3507 }
3508
3509 /* A subroutine of assign_parms. If the ABI splits complex arguments, then
3510 undo the frobbing that we did in assign_parms_augmented_arg_list. */
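
/* Illustrative example: if the ABI splits a `_Complex double' parameter C
   into two `double' pieces, fnargs holds two synthetic decls whose
   DECL_RTLs carry the real and imaginary parts.  The loop below
   reassembles them, conceptually

     rtx real = DECL_RTL (fnargs[i]);        // DFmode piece
     rtx imag = DECL_RTL (fnargs[i + 1]);    // DFmode piece
     set_parm_rtl (C, gen_rtx_CONCAT (DCmode, real, imag));

   unless C is addressable, in which case both pieces are spilled into a
   freshly allocated stack slot instead.  The mode names above describe
   only one possible target configuration.  */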
3511
3512 static void
3513 assign_parms_unsplit_complex (struct assign_parm_data_all *all,
3514 vec<tree> fnargs)
3515 {
3516 tree parm;
3517 tree orig_fnargs = all->orig_fnargs;
3518 unsigned i = 0;
3519
3520 for (parm = orig_fnargs; parm; parm = TREE_CHAIN (parm), ++i)
3521 {
3522 if (TREE_CODE (TREE_TYPE (parm)) == COMPLEX_TYPE
3523 && targetm.calls.split_complex_arg (TREE_TYPE (parm)))
3524 {
3525 rtx tmp, real, imag;
3526 scalar_mode inner = GET_MODE_INNER (DECL_MODE (parm));
3527
3528 real = DECL_RTL (fnargs[i]);
3529 imag = DECL_RTL (fnargs[i + 1]);
3530 if (inner != GET_MODE (real))
3531 {
3532 real = gen_lowpart_SUBREG (inner, real);
3533 imag = gen_lowpart_SUBREG (inner, imag);
3534 }
3535
3536 if (TREE_ADDRESSABLE (parm))
3537 {
3538 rtx rmem, imem;
3539 HOST_WIDE_INT size = int_size_in_bytes (TREE_TYPE (parm));
3540 int align = STACK_SLOT_ALIGNMENT (TREE_TYPE (parm),
3541 DECL_MODE (parm),
3542 TYPE_ALIGN (TREE_TYPE (parm)));
3543
3544 /* split_complex_arg put the real and imag parts in
3545 pseudos. Move them to memory. */
3546 tmp = assign_stack_local (DECL_MODE (parm), size, align);
3547 set_mem_attributes (tmp, parm, 1);
3548 rmem = adjust_address_nv (tmp, inner, 0);
3549 imem = adjust_address_nv (tmp, inner, GET_MODE_SIZE (inner));
3550 push_to_sequence2 (all->first_conversion_insn,
3551 all->last_conversion_insn);
3552 emit_move_insn (rmem, real);
3553 emit_move_insn (imem, imag);
3554 all->first_conversion_insn = get_insns ();
3555 all->last_conversion_insn = get_last_insn ();
3556 end_sequence ();
3557 }
3558 else
3559 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
3560 set_parm_rtl (parm, tmp);
3561
3562 real = DECL_INCOMING_RTL (fnargs[i]);
3563 imag = DECL_INCOMING_RTL (fnargs[i + 1]);
3564 if (inner != GET_MODE (real))
3565 {
3566 real = gen_lowpart_SUBREG (inner, real);
3567 imag = gen_lowpart_SUBREG (inner, imag);
3568 }
3569 tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag);
3570 set_decl_incoming_rtl (parm, tmp, false);
3571 i++;
3572 }
3573 }
3574 }
3575
3576 /* Assign RTL expressions to the function's parameters. This may involve
3577 copying them into registers and using those registers as the DECL_RTL. */
3578
3579 static void
3580 assign_parms (tree fndecl)
3581 {
3582 struct assign_parm_data_all all;
3583 tree parm;
3584 vec<tree> fnargs;
3585 unsigned i;
3586
3587 crtl->args.internal_arg_pointer
3588 = targetm.calls.internal_arg_pointer ();
3589
3590 assign_parms_initialize_all (&all);
3591 fnargs = assign_parms_augmented_arg_list (&all);
3592
3593 FOR_EACH_VEC_ELT (fnargs, i, parm)
3594 {
3595 struct assign_parm_data_one data;
3596
3597 /* Extract the type of PARM; adjust it according to ABI. */
3598 assign_parm_find_data_types (&all, parm, &data);
3599
3600 /* Early out for errors and void parameters. */
3601 if (data.passed_mode == VOIDmode)
3602 {
3603 SET_DECL_RTL (parm, const0_rtx);
3604 DECL_INCOMING_RTL (parm) = DECL_RTL (parm);
3605 continue;
3606 }
3607
3608 /* Estimate stack alignment from parameter alignment. */
3609 if (SUPPORTS_STACK_ALIGNMENT)
3610 {
3611 unsigned int align
3612 = targetm.calls.function_arg_boundary (data.promoted_mode,
3613 data.passed_type);
3614 align = MINIMUM_ALIGNMENT (data.passed_type, data.promoted_mode,
3615 align);
3616 if (TYPE_ALIGN (data.nominal_type) > align)
3617 align = MINIMUM_ALIGNMENT (data.nominal_type,
3618 TYPE_MODE (data.nominal_type),
3619 TYPE_ALIGN (data.nominal_type));
3620 if (crtl->stack_alignment_estimated < align)
3621 {
3622 gcc_assert (!crtl->stack_realign_processed);
3623 crtl->stack_alignment_estimated = align;
3624 }
3625 }
3626
3627 /* Find out where the parameter arrives in this function. */
3628 assign_parm_find_entry_rtl (&all, &data);
3629
3630 /* Find out where stack space for this parameter might be. */
3631 if (assign_parm_is_stack_parm (&all, &data))
3632 {
3633 assign_parm_find_stack_rtl (parm, &data);
3634 assign_parm_adjust_entry_rtl (&data);
3635 }
3636 /* Record permanently how this parm was passed. */
3637 if (data.passed_pointer)
3638 {
3639 rtx incoming_rtl
3640 = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data.passed_type)),
3641 data.entry_parm);
3642 set_decl_incoming_rtl (parm, incoming_rtl, true);
3643 }
3644 else
3645 set_decl_incoming_rtl (parm, data.entry_parm, false);
3646
3647 assign_parm_adjust_stack_rtl (&data);
3648
3649 if (assign_parm_setup_block_p (&data))
3650 assign_parm_setup_block (&all, parm, &data);
3651 else if (data.passed_pointer || use_register_for_decl (parm))
3652 assign_parm_setup_reg (&all, parm, &data);
3653 else
3654 assign_parm_setup_stack (&all, parm, &data);
3655
3656 if (cfun->stdarg && !DECL_CHAIN (parm))
3657 assign_parms_setup_varargs (&all, &data, false);
3658
3659 /* Update info on where next arg arrives in registers. */
3660 targetm.calls.function_arg_advance (all.args_so_far, data.promoted_mode,
3661 data.passed_type, data.named_arg);
3662 }
3663
3664 if (targetm.calls.split_complex_arg)
3665 assign_parms_unsplit_complex (&all, fnargs);
3666
3667 fnargs.release ();
3668
3669 /* Output all parameter conversion instructions (possibly including calls)
3670 now that all parameters have been copied out of hard registers. */
3671 emit_insn (all.first_conversion_insn);
3672
3673 /* Estimate reload stack alignment from scalar return mode. */
3674 if (SUPPORTS_STACK_ALIGNMENT)
3675 {
3676 if (DECL_RESULT (fndecl))
3677 {
3678 tree type = TREE_TYPE (DECL_RESULT (fndecl));
3679 machine_mode mode = TYPE_MODE (type);
3680
3681 if (mode != BLKmode
3682 && mode != VOIDmode
3683 && !AGGREGATE_TYPE_P (type))
3684 {
3685 unsigned int align = GET_MODE_ALIGNMENT (mode);
3686 if (crtl->stack_alignment_estimated < align)
3687 {
3688 gcc_assert (!crtl->stack_realign_processed);
3689 crtl->stack_alignment_estimated = align;
3690 }
3691 }
3692 }
3693 }
3694
3695 /* If we are receiving a struct value address as the first argument, set up
3696 the RTL for the function result. As this might require code to convert
3697 the transmitted address to Pmode, we do this here to ensure that possible
3698 preliminary conversions of the address have been emitted already. */
3699 if (all.function_result_decl)
3700 {
3701 tree result = DECL_RESULT (current_function_decl);
3702 rtx addr = DECL_RTL (all.function_result_decl);
3703 rtx x;
3704
3705 if (DECL_BY_REFERENCE (result))
3706 {
3707 SET_DECL_VALUE_EXPR (result, all.function_result_decl);
3708 x = addr;
3709 }
3710 else
3711 {
3712 SET_DECL_VALUE_EXPR (result,
3713 build1 (INDIRECT_REF, TREE_TYPE (result),
3714 all.function_result_decl));
3715 addr = convert_memory_address (Pmode, addr);
3716 x = gen_rtx_MEM (DECL_MODE (result), addr);
3717 set_mem_attributes (x, result, 1);
3718 }
3719
3720 DECL_HAS_VALUE_EXPR_P (result) = 1;
3721
3722 set_parm_rtl (result, x);
3723 }
3724
3725 /* We have aligned all the args, so add space for the pretend args. */
3726 crtl->args.pretend_args_size = all.pretend_args_size;
3727 all.stack_args_size.constant += all.extra_pretend_bytes;
3728 crtl->args.size = all.stack_args_size.constant;
3729
3730 /* Adjust function incoming argument size for alignment and
3731 minimum length. */
3732
3733 crtl->args.size = upper_bound (crtl->args.size, all.reg_parm_stack_space);
3734 crtl->args.size = aligned_upper_bound (crtl->args.size,
3735 PARM_BOUNDARY / BITS_PER_UNIT);
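/* For example (hypothetical numbers): with 14 bytes of stack arguments,
   no reserved register-parm stack space and PARM_BOUNDARY == 64, this
   computes upper_bound (14, 0) == 14 and then rounds it up to 16.  */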
3736
3737 if (ARGS_GROW_DOWNWARD)
3738 {
3739 crtl->args.arg_offset_rtx
3740 = (all.stack_args_size.var == 0
3741 ? gen_int_mode (-all.stack_args_size.constant, Pmode)
3742 : expand_expr (size_diffop (all.stack_args_size.var,
3743 size_int (-all.stack_args_size.constant)),
3744 NULL_RTX, VOIDmode, EXPAND_NORMAL));
3745 }
3746 else
3747 crtl->args.arg_offset_rtx = ARGS_SIZE_RTX (all.stack_args_size);
3748
3749 /* See how many bytes, if any, of its args a function should try to pop
3750 on return. */
3751
3752 crtl->args.pops_args = targetm.calls.return_pops_args (fndecl,
3753 TREE_TYPE (fndecl),
3754 crtl->args.size);
3755
3756 /* For a stdarg function, save info about the
3757 regs and stack space used by the named args. */
3758
3759 crtl->args.info = all.args_so_far_v;
3760
3761 /* Set the rtx used for the function return value. Put this in its
3762 own variable so any optimizers that need this information don't have
3763 to include tree.h. Do this here so it gets done when an inlined
3764 function gets output. */
3765
3766 crtl->return_rtx
3767 = (DECL_RTL_SET_P (DECL_RESULT (fndecl))
3768 ? DECL_RTL (DECL_RESULT (fndecl)) : NULL_RTX);
3769
3770 /* If scalar return value was computed in a pseudo-reg, or was a named
3771 return value that got dumped to the stack, copy that to the hard
3772 return register. */
3773 if (DECL_RTL_SET_P (DECL_RESULT (fndecl)))
3774 {
3775 tree decl_result = DECL_RESULT (fndecl);
3776 rtx decl_rtl = DECL_RTL (decl_result);
3777
3778 if (REG_P (decl_rtl)
3779 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
3780 : DECL_REGISTER (decl_result))
3781 {
3782 rtx real_decl_rtl;
3783
3784 real_decl_rtl = targetm.calls.function_value (TREE_TYPE (decl_result),
3785 fndecl, true);
3786 REG_FUNCTION_VALUE_P (real_decl_rtl) = 1;
3787 /* The delay slot scheduler assumes that crtl->return_rtx
3788 holds the hard register containing the return value, not a
3789 temporary pseudo. */
3790 crtl->return_rtx = real_decl_rtl;
3791 }
3792 }
3793 }
3794
3795 /* A subroutine of gimplify_parameters, invoked via walk_tree.
3796 For all seen types, gimplify their sizes. */
3797
3798 static tree
3799 gimplify_parm_type (tree *tp, int *walk_subtrees, void *data)
3800 {
3801 tree t = *tp;
3802
3803 *walk_subtrees = 0;
3804 if (TYPE_P (t))
3805 {
3806 if (POINTER_TYPE_P (t))
3807 *walk_subtrees = 1;
3808 else if (TYPE_SIZE (t) && !TREE_CONSTANT (TYPE_SIZE (t))
3809 && !TYPE_SIZES_GIMPLIFIED (t))
3810 {
3811 gimplify_type_sizes (t, (gimple_seq *) data);
3812 *walk_subtrees = 1;
3813 }
3814 }
3815
3816 return NULL;
3817 }
3818
3819 /* Gimplify the parameter list for current_function_decl. This involves
3820 evaluating SAVE_EXPRs of variable sized parameters and generating code
3821 to implement callee-copies reference parameters. Returns a sequence of
3822 statements to add to the beginning of the function. */
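
/* Illustrative sketch of the callee-copy case handled below: for a
   callee-copied reference parameter PARM of fixed-size type T, the
   statements generated amount to

     T local;
     local = PARM;        // copy the object the caller passed by reference
     // ... the body then accesses `local' via DECL_VALUE_EXPR (PARM) ...
     local = {CLOBBER};   // appended to *CLEANUP when stack reuse is on

   For variable-sized T, `local' instead lives in memory obtained from an
   alloca-style builtin call (CALL_ALLOCA_FOR_VAR_P is set on it).  This
   is a sketch of the emitted GIMPLE, not literal source.  */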
3823
3824 gimple_seq
3825 gimplify_parameters (gimple_seq *cleanup)
3826 {
3827 struct assign_parm_data_all all;
3828 tree parm;
3829 gimple_seq stmts = NULL;
3830 vec<tree> fnargs;
3831 unsigned i;
3832
3833 assign_parms_initialize_all (&all);
3834 fnargs = assign_parms_augmented_arg_list (&all);
3835
3836 FOR_EACH_VEC_ELT (fnargs, i, parm)
3837 {
3838 struct assign_parm_data_one data;
3839
3840 /* Extract the type of PARM; adjust it according to ABI. */
3841 assign_parm_find_data_types (&all, parm, &data);
3842
3843 /* Early out for errors and void parameters. */
3844 if (data.passed_mode == VOIDmode || DECL_SIZE (parm) == NULL)
3845 continue;
3846
3847 /* Update info on where next arg arrives in registers. */
3848 targetm.calls.function_arg_advance (all.args_so_far, data.promoted_mode,
3849 data.passed_type, data.named_arg);
3850
3851 /* ??? Once upon a time variable_size stuffed parameter list
3852 SAVE_EXPRs (amongst others) onto a pending sizes list. This
3853 turned out to be less than manageable in the gimple world.
3854 Now we have to hunt them down ourselves. */
3855 walk_tree_without_duplicates (&data.passed_type,
3856 gimplify_parm_type, &stmts);
3857
3858 if (TREE_CODE (DECL_SIZE_UNIT (parm)) != INTEGER_CST)
3859 {
3860 gimplify_one_sizepos (&DECL_SIZE (parm), &stmts);
3861 gimplify_one_sizepos (&DECL_SIZE_UNIT (parm), &stmts);
3862 }
3863
3864 if (data.passed_pointer)
3865 {
3866 tree type = TREE_TYPE (data.passed_type);
3867 if (reference_callee_copied (&all.args_so_far_v, TYPE_MODE (type),
3868 type, data.named_arg))
3869 {
3870 tree local, t;
3871
3872 /* For constant-sized objects, this is trivial; for
3873 variable-sized objects, we have to play games. */
3874 if (TREE_CODE (DECL_SIZE_UNIT (parm)) == INTEGER_CST
3875 && !(flag_stack_check == GENERIC_STACK_CHECK
3876 && compare_tree_int (DECL_SIZE_UNIT (parm),
3877 STACK_CHECK_MAX_VAR_SIZE) > 0))
3878 {
3879 local = create_tmp_var (type, get_name (parm));
3880 DECL_IGNORED_P (local) = 0;
3881 /* If PARM was addressable, move that flag over
3882 to the local copy, as its address will be taken,
3883 not the PARM's. Keep the parm's address-taken flag
3884 as well, since we'll query it during gimplification. */
3885 if (TREE_ADDRESSABLE (parm))
3886 TREE_ADDRESSABLE (local) = 1;
3887 else if (TREE_CODE (type) == COMPLEX_TYPE
3888 || TREE_CODE (type) == VECTOR_TYPE)
3889 DECL_GIMPLE_REG_P (local) = 1;
3890
3891 if (!is_gimple_reg (local)
3892 && flag_stack_reuse != SR_NONE)
3893 {
3894 tree clobber = build_constructor (type, NULL);
3895 gimple *clobber_stmt;
3896 TREE_THIS_VOLATILE (clobber) = 1;
3897 clobber_stmt = gimple_build_assign (local, clobber);
3898 gimple_seq_add_stmt (cleanup, clobber_stmt);
3899 }
3900 }
3901 else
3902 {
3903 tree ptr_type, addr;
3904
3905 ptr_type = build_pointer_type (type);
3906 addr = create_tmp_reg (ptr_type, get_name (parm));
3907 DECL_IGNORED_P (addr) = 0;
3908 local = build_fold_indirect_ref (addr);
3909
3910 t = build_alloca_call_expr (DECL_SIZE_UNIT (parm),
3911 DECL_ALIGN (parm),
3912 max_int_size_in_bytes (type));
3913 /* The call has been built for a variable-sized object. */
3914 CALL_ALLOCA_FOR_VAR_P (t) = 1;
3915 t = fold_convert (ptr_type, t);
3916 t = build2 (MODIFY_EXPR, TREE_TYPE (addr), addr, t);
3917 gimplify_and_add (t, &stmts);
3918 }
3919
3920 gimplify_assign (local, parm, &stmts);
3921
3922 SET_DECL_VALUE_EXPR (parm, local);
3923 DECL_HAS_VALUE_EXPR_P (parm) = 1;
3924 }
3925 }
3926 }
3927
3928 fnargs.release ();
3929
3930 return stmts;
3931 }
3932 \f
3933 /* Compute the size and offset from the start of the stacked arguments for a
3934 parm passed in mode PASSED_MODE and with type TYPE.
3935
3936 INITIAL_OFFSET_PTR points to the current offset into the stacked
3937 arguments.
3938
3939 The starting offset and size for this parm are returned in
3940 LOCATE->OFFSET and LOCATE->SIZE, respectively. When IN_REGS is
3941 nonzero, the offset is that of the stack slot, which is returned in
3942 LOCATE->SLOT_OFFSET. LOCATE->ALIGNMENT_PAD is the amount of
3943 padding required from the initial offset ptr to the stack slot.
3944
3945 IN_REGS is nonzero if the argument will be passed in registers. It will
3946 never be set if REG_PARM_STACK_SPACE is not defined.
3947
3948 REG_PARM_STACK_SPACE is the number of bytes of stack space reserved
3949 for arguments which are passed in registers.
3950
3951 FNDECL is the function in which the argument was defined.
3952
3953 There are two types of rounding that are done. The first, controlled by
3954 TARGET_FUNCTION_ARG_BOUNDARY, forces the offset from the start of the
3955 argument list to be aligned to the specific boundary (in bits). This
3956 rounding affects the initial and starting offsets, but not the argument
3957 size.
3958
3959 The second, controlled by TARGET_FUNCTION_ARG_PADDING and PARM_BOUNDARY,
3960 optionally rounds the size of the parm to PARM_BOUNDARY. The
3961 initial offset is not affected by this rounding, while the size always
3962 is and the starting offset may be. */
3963
3964 /* LOCATE->OFFSET will be negative for ARGS_GROW_DOWNWARD case;
3965 INITIAL_OFFSET_PTR is positive because locate_and_pad_parm's
3966 callers pass in the total size of args so far as
3967 INITIAL_OFFSET_PTR. LOCATE->SIZE is always positive. */
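
/* Worked example with made-up ABI numbers: for a 13-byte BLKmode argument
   with TARGET_FUNCTION_ARG_BOUNDARY returning 64, PARM_BOUNDARY == 32 and
   *INITIAL_OFFSET_PTR == 20 (args growing upward):

     - the first rounding aligns the slot offset up to 8 bytes,
       20 -> 24, so LOCATE->ALIGNMENT_PAD is 4;
     - the second rounding pads the size up to a multiple of 4 bytes,
       13 -> 16, so LOCATE->SIZE is 16.

   With ARGS_GROW_DOWNWARD the offsets come out negative instead.  */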
3968
3969 void
3970 locate_and_pad_parm (machine_mode passed_mode, tree type, int in_regs,
3971 int reg_parm_stack_space, int partial,
3972 tree fndecl ATTRIBUTE_UNUSED,
3973 struct args_size *initial_offset_ptr,
3974 struct locate_and_pad_arg_data *locate)
3975 {
3976 tree sizetree;
3977 pad_direction where_pad;
3978 unsigned int boundary, round_boundary;
3979 int part_size_in_regs;
3980
3981 /* If we have found a stack parm before we reach the end of the
3982 area reserved for registers, skip that area. */
3983 if (! in_regs)
3984 {
3985 if (reg_parm_stack_space > 0)
3986 {
3987 if (initial_offset_ptr->var
3988 || !ordered_p (initial_offset_ptr->constant,
3989 reg_parm_stack_space))
3990 {
3991 initial_offset_ptr->var
3992 = size_binop (MAX_EXPR, ARGS_SIZE_TREE (*initial_offset_ptr),
3993 ssize_int (reg_parm_stack_space));
3994 initial_offset_ptr->constant = 0;
3995 }
3996 else
3997 initial_offset_ptr->constant
3998 = ordered_max (initial_offset_ptr->constant,
3999 reg_parm_stack_space);
4000 }
4001 }
4002
4003 part_size_in_regs = (reg_parm_stack_space == 0 ? partial : 0);
4004
4005 sizetree = (type
4006 ? arg_size_in_bytes (type)
4007 : size_int (GET_MODE_SIZE (passed_mode)));
4008 where_pad = targetm.calls.function_arg_padding (passed_mode, type);
4009 boundary = targetm.calls.function_arg_boundary (passed_mode, type);
4010 round_boundary = targetm.calls.function_arg_round_boundary (passed_mode,
4011 type);
4012 locate->where_pad = where_pad;
4013
4014 /* Alignment can't exceed MAX_SUPPORTED_STACK_ALIGNMENT. */
4015 if (boundary > MAX_SUPPORTED_STACK_ALIGNMENT)
4016 boundary = MAX_SUPPORTED_STACK_ALIGNMENT;
4017
4018 locate->boundary = boundary;
4019
4020 if (SUPPORTS_STACK_ALIGNMENT)
4021 {
4022 /* stack_alignment_estimated can't change after stack has been
4023 realigned. */
4024 if (crtl->stack_alignment_estimated < boundary)
4025 {
4026 if (!crtl->stack_realign_processed)
4027 crtl->stack_alignment_estimated = boundary;
4028 else
4029 {
4030 /* If the stack is realigned and the stack alignment value
4031 hasn't been finalized, it is OK not to increase
4032 stack_alignment_estimated. The bigger alignment
4033 requirement is recorded in stack_alignment_needed
4034 below. */
4035 gcc_assert (!crtl->stack_realign_finalized
4036 && crtl->stack_realign_needed);
4037 }
4038 }
4039 }
4040
4041 if (ARGS_GROW_DOWNWARD)
4042 {
4043 locate->slot_offset.constant = -initial_offset_ptr->constant;
4044 if (initial_offset_ptr->var)
4045 locate->slot_offset.var = size_binop (MINUS_EXPR, ssize_int (0),
4046 initial_offset_ptr->var);
4047
4048 {
4049 tree s2 = sizetree;
4050 if (where_pad != PAD_NONE
4051 && (!tree_fits_uhwi_p (sizetree)
4052 || (tree_to_uhwi (sizetree) * BITS_PER_UNIT) % round_boundary))
4053 s2 = round_up (s2, round_boundary / BITS_PER_UNIT);
4054 SUB_PARM_SIZE (locate->slot_offset, s2);
4055 }
4056
4057 locate->slot_offset.constant += part_size_in_regs;
4058
4059 if (!in_regs || reg_parm_stack_space > 0)
4060 pad_to_arg_alignment (&locate->slot_offset, boundary,
4061 &locate->alignment_pad);
4062
4063 locate->size.constant = (-initial_offset_ptr->constant
4064 - locate->slot_offset.constant);
4065 if (initial_offset_ptr->var)
4066 locate->size.var = size_binop (MINUS_EXPR,
4067 size_binop (MINUS_EXPR,
4068 ssize_int (0),
4069 initial_offset_ptr->var),
4070 locate->slot_offset.var);
4071
4072 /* Pad_below needs the pre-rounded size to know how much to pad
4073 below. */
4074 locate->offset = locate->slot_offset;
4075 if (where_pad == PAD_DOWNWARD)
4076 pad_below (&locate->offset, passed_mode, sizetree);
4077
4078 }
4079 else
4080 {
4081 if (!in_regs || reg_parm_stack_space > 0)
4082 pad_to_arg_alignment (initial_offset_ptr, boundary,
4083 &locate->alignment_pad);
4084 locate->slot_offset = *initial_offset_ptr;
4085
4086 #ifdef PUSH_ROUNDING
4087 if (passed_mode != BLKmode)
4088 sizetree = size_int (PUSH_ROUNDING (TREE_INT_CST_LOW (sizetree)));
4089 #endif
4090
4091 /* Pad_below needs the pre-rounded size to know how much to pad below
4092 so this must be done before rounding up. */
4093 locate->offset = locate->slot_offset;
4094 if (where_pad == PAD_DOWNWARD)
4095 pad_below (&locate->offset, passed_mode, sizetree);
4096
4097 if (where_pad != PAD_NONE
4098 && (!tree_fits_uhwi_p (sizetree)
4099 || (tree_to_uhwi (sizetree) * BITS_PER_UNIT) % round_boundary))
4100 sizetree = round_up (sizetree, round_boundary / BITS_PER_UNIT);
4101
4102 ADD_PARM_SIZE (locate->size, sizetree);
4103
4104 locate->size.constant -= part_size_in_regs;
4105 }
4106
4107 locate->offset.constant
4108 += targetm.calls.function_arg_offset (passed_mode, type);
4109 }
4110
4111 /* Round the stack offset in *OFFSET_PTR up to a multiple of BOUNDARY.
4112 BOUNDARY is measured in bits, but must be a multiple of a storage unit. */
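
/* For instance (illustrative numbers only): with BOUNDARY == 64, i.e. 8
   bytes, STACK_POINTER_OFFSET == 0 and a constant offset of 20, the
   misalignment is 4, so the offset becomes 24 when arguments grow upward
   or 16 when ARGS_GROW_DOWNWARD.  */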
4113
4114 static void
4115 pad_to_arg_alignment (struct args_size *offset_ptr, int boundary,
4116 struct args_size *alignment_pad)
4117 {
4118 tree save_var = NULL_TREE;
4119 poly_int64 save_constant = 0;
4120 int boundary_in_bytes = boundary / BITS_PER_UNIT;
4121 poly_int64 sp_offset = STACK_POINTER_OFFSET;
4122
4123 #ifdef SPARC_STACK_BOUNDARY_HACK
4124 /* ??? The SPARC port may claim a STACK_BOUNDARY higher than
4125 the real alignment of %sp. However, when it does this, the
4126 alignment of %sp+STACK_POINTER_OFFSET is STACK_BOUNDARY. */
4127 if (SPARC_STACK_BOUNDARY_HACK)
4128 sp_offset = 0;
4129 #endif
4130
4131 if (boundary > PARM_BOUNDARY)
4132 {
4133 save_var = offset_ptr->var;
4134 save_constant = offset_ptr->constant;
4135 }
4136
4137 alignment_pad->var = NULL_TREE;
4138 alignment_pad->constant = 0;
4139
4140 if (boundary > BITS_PER_UNIT)
4141 {
4142 int misalign;
4143 if (offset_ptr->var
4144 || !known_misalignment (offset_ptr->constant + sp_offset,
4145 boundary_in_bytes, &misalign))
4146 {
4147 tree sp_offset_tree = ssize_int (sp_offset);
4148 tree offset = size_binop (PLUS_EXPR,
4149 ARGS_SIZE_TREE (*offset_ptr),
4150 sp_offset_tree);
4151 tree rounded;
4152 if (ARGS_GROW_DOWNWARD)
4153 rounded = round_down (offset, boundary / BITS_PER_UNIT);
4154 else
4155 rounded = round_up (offset, boundary / BITS_PER_UNIT);
4156
4157 offset_ptr->var = size_binop (MINUS_EXPR, rounded, sp_offset_tree);
4158 /* ARGS_SIZE_TREE includes constant term. */
4159 offset_ptr->constant = 0;
4160 if (boundary > PARM_BOUNDARY)
4161 alignment_pad->var = size_binop (MINUS_EXPR, offset_ptr->var,
4162 save_var);
4163 }
4164 else
4165 {
4166 if (ARGS_GROW_DOWNWARD)
4167 offset_ptr->constant -= misalign;
4168 else
4169 offset_ptr->constant += -misalign & (boundary_in_bytes - 1);
4170
4171 if (boundary > PARM_BOUNDARY)
4172 alignment_pad->constant = offset_ptr->constant - save_constant;
4173 }
4174 }
4175 }
4176
4177 static void
4178 pad_below (struct args_size *offset_ptr, machine_mode passed_mode, tree sizetree)
4179 {
4180 unsigned int align = PARM_BOUNDARY / BITS_PER_UNIT;
4181 int misalign;
4182 if (passed_mode != BLKmode
4183 && known_misalignment (GET_MODE_SIZE (passed_mode), align, &misalign))
4184 offset_ptr->constant += -misalign & (align - 1);
4185 else
4186 {
4187 if (TREE_CODE (sizetree) != INTEGER_CST
4188 || (TREE_INT_CST_LOW (sizetree) & (align - 1)) != 0)
4189 {
4190 /* Round the size up to multiple of PARM_BOUNDARY bits. */
4191 tree s2 = round_up (sizetree, align);
4192 /* Add it in. */
4193 ADD_PARM_SIZE (*offset_ptr, s2);
4194 SUB_PARM_SIZE (*offset_ptr, sizetree);
4195 }
4196 }
4197 }
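
/* E.g. pad_below with passed_mode == HImode (2 bytes) and PARM_BOUNDARY
   == 32 adds 2 bytes of padding below the value within its 4-byte slot.
   (Illustrative numbers; BLKmode sizes go through the tree-level
   rounding above instead.)  */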
4198 \f
4199
4200 /* True if register REGNO was alive at a place where `setjmp' was
4201 called and was set more than once or is an argument. Such regs may
4202 be clobbered by `longjmp'. */
4203
4204 static bool
4205 regno_clobbered_at_setjmp (bitmap setjmp_crosses, int regno)
4206 {
4207 /* There appear to be cases where some local vars never reach the
4208 backend but have bogus regnos. */
4209 if (regno >= max_reg_num ())
4210 return false;
4211
4212 return ((REG_N_SETS (regno) > 1
4213 || REGNO_REG_SET_P (df_get_live_out (ENTRY_BLOCK_PTR_FOR_FN (cfun)),
4214 regno))
4215 && REGNO_REG_SET_P (setjmp_crosses, regno));
4216 }
4217
4218 /* Walk the tree of blocks describing the binding levels within a
4219 function and warn about variables that might be clobbered by setjmp
4220 or vfork. This is done after flow analysis but before register
4221 allocation, since register allocation replaces the pseudo-regs with
4222 hard regs. */
4223
4224 static void
4225 setjmp_vars_warning (bitmap setjmp_crosses, tree block)
4226 {
4227 tree decl, sub;
4228
4229 for (decl = BLOCK_VARS (block); decl; decl = DECL_CHAIN (decl))
4230 {
4231 if (VAR_P (decl)
4232 && DECL_RTL_SET_P (decl)
4233 && REG_P (DECL_RTL (decl))
4234 && regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
4235 warning (OPT_Wclobbered, "variable %q+D might be clobbered by"
4236 " %<longjmp%> or %<vfork%>", decl);
4237 }
4238
4239 for (sub = BLOCK_SUBBLOCKS (block); sub; sub = BLOCK_CHAIN (sub))
4240 setjmp_vars_warning (setjmp_crosses, sub);
4241 }
4242
4243 /* Do the appropriate part of setjmp_vars_warning
4244 but for arguments instead of local variables. */
4245
4246 static void
4247 setjmp_args_warning (bitmap setjmp_crosses)
4248 {
4249 tree decl;
4250 for (decl = DECL_ARGUMENTS (current_function_decl);
4251 decl; decl = DECL_CHAIN (decl))
4252 if (DECL_RTL (decl) != 0
4253 && REG_P (DECL_RTL (decl))
4254 && regno_clobbered_at_setjmp (setjmp_crosses, REGNO (DECL_RTL (decl))))
4255 warning (OPT_Wclobbered,
4256 "argument %q+D might be clobbered by %<longjmp%> or %<vfork%>",
4257 decl);
4258 }
4259
4260 /* Generate warning messages for variables live across setjmp. */
4261
4262 void
4263 generate_setjmp_warnings (void)
4264 {
4265 bitmap setjmp_crosses = regstat_get_setjmp_crosses ();
4266
4267 if (n_basic_blocks_for_fn (cfun) == NUM_FIXED_BLOCKS
4268 || bitmap_empty_p (setjmp_crosses))
4269 return;
4270
4271 setjmp_vars_warning (setjmp_crosses, DECL_INITIAL (current_function_decl));
4272 setjmp_args_warning (setjmp_crosses);
4273 }
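
/* Illustrative source-level example of the diagnostic generated above
   (assuming -Wclobbered and enough optimization for V to live in a
   register):

     #include <setjmp.h>
     jmp_buf env;
     int f (void)
     {
       int v = 1;           // set more than once and live across setjmp
       if (setjmp (env) == 0)
         v = 2;
       return v;
     }

   This warns that variable 'v' might be clobbered by 'longjmp' or
   'vfork'.  */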
4274
4275 \f
4276 /* Reverse the order of elements in the fragment chain T of blocks,
4277 and return the new head of the chain (old last element).
4278 In addition to that clear BLOCK_SAME_RANGE flags when needed
4279 and adjust BLOCK_SUPERCONTEXT from the super fragment to
4280 its super fragment origin. */
4281
4282 static tree
4283 block_fragments_nreverse (tree t)
4284 {
4285 tree prev = 0, block, next, prev_super = 0;
4286 tree super = BLOCK_SUPERCONTEXT (t);
4287 if (BLOCK_FRAGMENT_ORIGIN (super))
4288 super = BLOCK_FRAGMENT_ORIGIN (super);
4289 for (block = t; block; block = next)
4290 {
4291 next = BLOCK_FRAGMENT_CHAIN (block);
4292 BLOCK_FRAGMENT_CHAIN (block) = prev;
4293 if ((prev && !BLOCK_SAME_RANGE (prev))
4294 || (BLOCK_FRAGMENT_CHAIN (BLOCK_SUPERCONTEXT (block))
4295 != prev_super))
4296 BLOCK_SAME_RANGE (block) = 0;
4297 prev_super = BLOCK_SUPERCONTEXT (block);
4298 BLOCK_SUPERCONTEXT (block) = super;
4299 prev = block;
4300 }
4301 t = BLOCK_FRAGMENT_ORIGIN (t);
4302 if (BLOCK_FRAGMENT_CHAIN (BLOCK_SUPERCONTEXT (t))
4303 != prev_super)
4304 BLOCK_SAME_RANGE (t) = 0;
4305 BLOCK_SUPERCONTEXT (t) = super;
4306 return prev;
4307 }
4308
4309 /* Reverse the order of elements in the chain T of blocks,
4310 and return the new head of the chain (old last element).
4311 Also do the same on subblocks and reverse the order of elements
4312 in BLOCK_FRAGMENT_CHAIN as well. */
4313
4314 static tree
4315 blocks_nreverse_all (tree t)
4316 {
4317 tree prev = 0, block, next;
4318 for (block = t; block; block = next)
4319 {
4320 next = BLOCK_CHAIN (block);
4321 BLOCK_CHAIN (block) = prev;
4322 if (BLOCK_FRAGMENT_CHAIN (block)
4323 && BLOCK_FRAGMENT_ORIGIN (block) == NULL_TREE)
4324 {
4325 BLOCK_FRAGMENT_CHAIN (block)
4326 = block_fragments_nreverse (BLOCK_FRAGMENT_CHAIN (block));
4327 if (!BLOCK_SAME_RANGE (BLOCK_FRAGMENT_CHAIN (block)))
4328 BLOCK_SAME_RANGE (block) = 0;
4329 }
4330 BLOCK_SUBBLOCKS (block) = blocks_nreverse_all (BLOCK_SUBBLOCKS (block));
4331 prev = block;
4332 }
4333 return prev;
4334 }
4335
4336
4337 /* Identify BLOCKs referenced by more than one NOTE_INSN_BLOCK_{BEG,END},
4338 and create duplicate blocks. */
4339 /* ??? Need an option to either create block fragments or to create
4340 abstract origin duplicates of a source block. It really depends
4341 on what optimization has been performed. */
4342
4343 void
4344 reorder_blocks (void)
4345 {
4346 tree block = DECL_INITIAL (current_function_decl);
4347
4348 if (block == NULL_TREE)
4349 return;
4350
4351 auto_vec<tree, 10> block_stack;
4352
4353 /* Reset the TREE_ASM_WRITTEN bit for all blocks. */
4354 clear_block_marks (block);
4355
4356 /* Prune the old trees away, so that they don't get in the way. */
4357 BLOCK_SUBBLOCKS (block) = NULL_TREE;
4358 BLOCK_CHAIN (block) = NULL_TREE;
4359
4360 /* Recreate the block tree from the note nesting. */
4361 reorder_blocks_1 (get_insns (), block, &block_stack);
4362 BLOCK_SUBBLOCKS (block) = blocks_nreverse_all (BLOCK_SUBBLOCKS (block));
4363 }
4364
4365 /* Helper function for reorder_blocks. Reset TREE_ASM_WRITTEN. */
4366
4367 void
4368 clear_block_marks (tree block)
4369 {
4370 while (block)
4371 {
4372 TREE_ASM_WRITTEN (block) = 0;
4373 clear_block_marks (BLOCK_SUBBLOCKS (block));
4374 block = BLOCK_CHAIN (block);
4375 }
4376 }
4377
4378 static void
4379 reorder_blocks_1 (rtx_insn *insns, tree current_block,
4380 vec<tree> *p_block_stack)
4381 {
4382 rtx_insn *insn;
4383 tree prev_beg = NULL_TREE, prev_end = NULL_TREE;
4384
4385 for (insn = insns; insn; insn = NEXT_INSN (insn))
4386 {
4387 if (NOTE_P (insn))
4388 {
4389 if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_BEG)
4390 {
4391 tree block = NOTE_BLOCK (insn);
4392 tree origin;
4393
4394 gcc_assert (BLOCK_FRAGMENT_ORIGIN (block) == NULL_TREE);
4395 origin = block;
4396
4397 if (prev_end)
4398 BLOCK_SAME_RANGE (prev_end) = 0;
4399 prev_end = NULL_TREE;
4400
4401 /* If we have seen this block before, that means it now
4402 spans multiple address regions. Create a new fragment. */
4403 if (TREE_ASM_WRITTEN (block))
4404 {
4405 tree new_block = copy_node (block);
4406
4407 BLOCK_SAME_RANGE (new_block) = 0;
4408 BLOCK_FRAGMENT_ORIGIN (new_block) = origin;
4409 BLOCK_FRAGMENT_CHAIN (new_block)
4410 = BLOCK_FRAGMENT_CHAIN (origin);
4411 BLOCK_FRAGMENT_CHAIN (origin) = new_block;
4412
4413 NOTE_BLOCK (insn) = new_block;
4414 block = new_block;
4415 }
4416
4417 if (prev_beg == current_block && prev_beg)
4418 BLOCK_SAME_RANGE (block) = 1;
4419
4420 prev_beg = origin;
4421
4422 BLOCK_SUBBLOCKS (block) = 0;
4423 TREE_ASM_WRITTEN (block) = 1;
4424 /* When there's only one block for the entire function,
4425 current_block == block and we mustn't do this; it
4426 would cause infinite recursion. */
4427 if (block != current_block)
4428 {
4429 tree super;
4430 if (block != origin)
4431 gcc_assert (BLOCK_SUPERCONTEXT (origin) == current_block
4432 || BLOCK_FRAGMENT_ORIGIN (BLOCK_SUPERCONTEXT
4433 (origin))
4434 == current_block);
4435 if (p_block_stack->is_empty ())
4436 super = current_block;
4437 else
4438 {
4439 super = p_block_stack->last ();
4440 gcc_assert (super == current_block
4441 || BLOCK_FRAGMENT_ORIGIN (super)
4442 == current_block);
4443 }
4444 BLOCK_SUPERCONTEXT (block) = super;
4445 BLOCK_CHAIN (block) = BLOCK_SUBBLOCKS (current_block);
4446 BLOCK_SUBBLOCKS (current_block) = block;
4447 current_block = origin;
4448 }
4449 p_block_stack->safe_push (block);
4450 }
4451 else if (NOTE_KIND (insn) == NOTE_INSN_BLOCK_END)
4452 {
4453 NOTE_BLOCK (insn) = p_block_stack->pop ();
4454 current_block = BLOCK_SUPERCONTEXT (current_block);
4455 if (BLOCK_FRAGMENT_ORIGIN (current_block))
4456 current_block = BLOCK_FRAGMENT_ORIGIN (current_block);
4457 prev_beg = NULL_TREE;
4458 prev_end = BLOCK_SAME_RANGE (NOTE_BLOCK (insn))
4459 ? NOTE_BLOCK (insn) : NULL_TREE;
4460 }
4461 }
4462 else
4463 {
4464 prev_beg = NULL_TREE;
4465 if (prev_end)
4466 BLOCK_SAME_RANGE (prev_end) = 0;
4467 prev_end = NULL_TREE;
4468 }
4469 }
4470 }
4471
4472 /* Reverse the order of elements in the chain T of blocks,
4473 and return the new head of the chain (old last element). */
4474
4475 tree
4476 blocks_nreverse (tree t)
4477 {
4478 tree prev = 0, block, next;
4479 for (block = t; block; block = next)
4480 {
4481 next = BLOCK_CHAIN (block);
4482 BLOCK_CHAIN (block) = prev;
4483 prev = block;
4484 }
4485 return prev;
4486 }
4487
4488 /* Concatenate two chains of blocks (chained through BLOCK_CHAIN)
4489 by modifying the last node in chain 1 to point to chain 2. */
4490
4491 tree
4492 block_chainon (tree op1, tree op2)
4493 {
4494 tree t1;
4495
4496 if (!op1)
4497 return op2;
4498 if (!op2)
4499 return op1;
4500
4501 for (t1 = op1; BLOCK_CHAIN (t1); t1 = BLOCK_CHAIN (t1))
4502 continue;
4503 BLOCK_CHAIN (t1) = op2;
4504
4505 #ifdef ENABLE_TREE_CHECKING
4506 {
4507 tree t2;
4508 for (t2 = op2; t2; t2 = BLOCK_CHAIN (t2))
4509 gcc_assert (t2 != t1);
4510 }
4511 #endif
4512
4513 return op1;
4514 }
4515
4516 /* Count the subblocks of the list starting with BLOCK. If VECTOR is
4517 non-NULL, list them all into VECTOR, in a depth-first preorder
4518 traversal of the block tree. Also clear TREE_ASM_WRITTEN in all
4519 blocks. */
4520
4521 static int
4522 all_blocks (tree block, tree *vector)
4523 {
4524 int n_blocks = 0;
4525
4526 while (block)
4527 {
4528 TREE_ASM_WRITTEN (block) = 0;
4529
4530 /* Record this block. */
4531 if (vector)
4532 vector[n_blocks] = block;
4533
4534 ++n_blocks;
4535
4536 /* Record the subblocks, and their subblocks... */
4537 n_blocks += all_blocks (BLOCK_SUBBLOCKS (block),
4538 vector ? vector + n_blocks : 0);
4539 block = BLOCK_CHAIN (block);
4540 }
4541
4542 return n_blocks;
4543 }
4544
4545 /* Return a vector containing all the blocks rooted at BLOCK. The
4546 number of elements in the vector is stored in N_BLOCKS_P. The
4547 vector is dynamically allocated; it is the caller's responsibility
4548 to call `free' on the pointer returned. */
4549
4550 static tree *
4551 get_block_vector (tree block, int *n_blocks_p)
4552 {
4553 tree *block_vector;
4554
4555 *n_blocks_p = all_blocks (block, NULL);
4556 block_vector = XNEWVEC (tree, *n_blocks_p);
4557 all_blocks (block, block_vector);
4558
4559 return block_vector;
4560 }
4561
4562 static GTY(()) int next_block_index = 2;
4563
4564 /* Set BLOCK_NUMBER for all the blocks in FN. */
4565
4566 void
4567 number_blocks (tree fn)
4568 {
4569 int i;
4570 int n_blocks;
4571 tree *block_vector;
4572
4573 /* For XCOFF debugging output, we start numbering the blocks
4574 from 1 within each function, rather than keeping a running
4575 count. */
4576 #if defined (XCOFF_DEBUGGING_INFO)
4577 if (write_symbols == XCOFF_DEBUG)
4578 next_block_index = 1;
4579 #endif
4580
4581 block_vector = get_block_vector (DECL_INITIAL (fn), &n_blocks);
4582
4583 /* The top-level BLOCK isn't numbered at all. */
4584 for (i = 1; i < n_blocks; ++i)
4585 /* We number the blocks from two. */
4586 BLOCK_NUMBER (block_vector[i]) = next_block_index++;
4587
4588 free (block_vector);
4589
4590 return;
4591 }
4592
4593 /* If VAR is present in a subblock of BLOCK, return the subblock. */
4594
4595 DEBUG_FUNCTION tree
4596 debug_find_var_in_block_tree (tree var, tree block)
4597 {
4598 tree t;
4599
4600 for (t = BLOCK_VARS (block); t; t = TREE_CHAIN (t))
4601 if (t == var)
4602 return block;
4603
4604 for (t = BLOCK_SUBBLOCKS (block); t; t = TREE_CHAIN (t))
4605 {
4606 tree ret = debug_find_var_in_block_tree (var, t);
4607 if (ret)
4608 return ret;
4609 }
4610
4611 return NULL_TREE;
4612 }
4613 \f
4614 /* Keep track of whether we're in a dummy function context. If we are,
4615 we don't want to invoke the set_current_function hook, because we'll
4616 get into trouble if the hook calls target_reinit () recursively or
4617 when the initial initialization is not yet complete. */
4618
4619 static bool in_dummy_function;
4620
4621 /* Invoke the target hook when setting cfun. Update the optimization options
4622 if the function uses different options than the default. */
4623
4624 static void
4625 invoke_set_current_function_hook (tree fndecl)
4626 {
4627 if (!in_dummy_function)
4628 {
4629 tree opts = ((fndecl)
4630 ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (fndecl)
4631 : optimization_default_node);
4632
4633 if (!opts)
4634 opts = optimization_default_node;
4635
4636 /* Change optimization options if needed. */
4637 if (optimization_current_node != opts)
4638 {
4639 optimization_current_node = opts;
4640 cl_optimization_restore (&global_options, TREE_OPTIMIZATION (opts));
4641 }
4642
4643 targetm.set_current_function (fndecl);
4644 this_fn_optabs = this_target_optabs;
4645
4646 /* Initialize global alignment variables after options have been processed. */
4647 parse_alignment_opts ();
4648
4649 if (opts != optimization_default_node)
4650 {
4651 init_tree_optimization_optabs (opts);
4652 if (TREE_OPTIMIZATION_OPTABS (opts))
4653 this_fn_optabs = (struct target_optabs *)
4654 TREE_OPTIMIZATION_OPTABS (opts);
4655 }
4656 }
4657 }
4658
4659 /* cfun should never be set directly; use this function. */
4660
4661 void
4662 set_cfun (struct function *new_cfun, bool force)
4663 {
4664 if (cfun != new_cfun || force)
4665 {
4666 cfun = new_cfun;
4667 invoke_set_current_function_hook (new_cfun ? new_cfun->decl : NULL_TREE);
4668 redirect_edge_var_map_empty ();
4669 }
4670 }
4671
4672 /* Initialized with NOGC, making this poisonous to the garbage collector. */
4673
4674 static vec<function *> cfun_stack;
4675
4676 /* Push the current cfun onto the stack, and set cfun to new_cfun. Also set
4677 current_function_decl accordingly. */
4678
4679 void
4680 push_cfun (struct function *new_cfun)
4681 {
4682 gcc_assert ((!cfun && !current_function_decl)
4683 || (cfun && current_function_decl == cfun->decl));
4684 cfun_stack.safe_push (cfun);
4685 current_function_decl = new_cfun ? new_cfun->decl : NULL_TREE;
4686 set_cfun (new_cfun);
4687 }
4688
4689 /* Pop cfun from the stack. Also set current_function_decl accordingly. */
4690
4691 void
4692 pop_cfun (void)
4693 {
4694 struct function *new_cfun = cfun_stack.pop ();
4695 /* When in_dummy_function, we do have a cfun but current_function_decl is
4696 NULL. We also allow pushing NULL cfun and subsequently changing
4697 current_function_decl to something else and have both restored by
4698 pop_cfun. */
4699 gcc_checking_assert (in_dummy_function
4700 || !cfun
4701 || current_function_decl == cfun->decl);
4702 set_cfun (new_cfun);
4703 current_function_decl = new_cfun ? new_cfun->decl : NULL_TREE;
4704 }
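
/* Typical usage (illustrative): code that needs to examine another
   function temporarily switches context with

     push_cfun (DECL_STRUCT_FUNCTION (other_fndecl));
     ... inspect or modify the other function ...
     pop_cfun ();

   which keeps cfun and current_function_decl consistent across the
   switch.  */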
4705
4706 /* Return the current value of funcdef_no and increment it. */
4707 int
4708 get_next_funcdef_no (void)
4709 {
4710 return funcdef_no++;
4711 }
4712
4713 /* Return the current value of funcdef_no. */
4714 int
4715 get_last_funcdef_no (void)
4716 {
4717 return funcdef_no;
4718 }
4719
4720 /* Allocate a function structure for FNDECL and set its contents
4721 to the defaults. Set cfun to the newly-allocated object.
4722 Some of the helper functions invoked during initialization assume
4723 that cfun has already been set. Therefore, assign the new object
4724 directly into cfun and invoke the back end hook explicitly at the
4725 very end, rather than initializing a temporary and calling set_cfun
4726 on it.
4727
4728 ABSTRACT_P is true if this is a function that will never be seen by
4729 the middle-end. Such functions are front-end concepts (like C++
4730 function templates) that do not correspond directly to functions
4731 placed in object files. */
4732
4733 void
4734 allocate_struct_function (tree fndecl, bool abstract_p)
4735 {
4736 tree fntype = fndecl ? TREE_TYPE (fndecl) : NULL_TREE;
4737
4738 cfun = ggc_cleared_alloc<function> ();
4739
4740 init_eh_for_function ();
4741
4742 if (init_machine_status)
4743 cfun->machine = (*init_machine_status) ();
4744
4745 #ifdef OVERRIDE_ABI_FORMAT
4746 OVERRIDE_ABI_FORMAT (fndecl);
4747 #endif
4748
4749 if (fndecl != NULL_TREE)
4750 {
4751 DECL_STRUCT_FUNCTION (fndecl) = cfun;
4752 cfun->decl = fndecl;
4753 current_function_funcdef_no = get_next_funcdef_no ();
4754 }
4755
4756 invoke_set_current_function_hook (fndecl);
4757
4758 if (fndecl != NULL_TREE)
4759 {
4760 tree result = DECL_RESULT (fndecl);
4761
4762 if (!abstract_p)
4763 {
4764 /* Now that we have activated any function-specific attributes
4765 that might affect layout, particularly vector modes, relayout
4766 each of the parameters and the result. */
4767 relayout_decl (result);
4768 for (tree parm = DECL_ARGUMENTS (fndecl); parm;
4769 parm = DECL_CHAIN (parm))
4770 relayout_decl (parm);
4771
4772 /* Similarly relayout the function decl. */
4773 targetm.target_option.relayout_function (fndecl);
4774 }
4775
4776 if (!abstract_p && aggregate_value_p (result, fndecl))
4777 {
4778 #ifdef PCC_STATIC_STRUCT_RETURN
4779 cfun->returns_pcc_struct = 1;
4780 #endif
4781 cfun->returns_struct = 1;
4782 }
4783
4784 cfun->stdarg = stdarg_p (fntype);
4785
4786 /* Assume all registers in stdarg functions need to be saved. */
4787 cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
4788 cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
4789
4790 /* ??? This could be set on a per-function basis by the front-end
4791 but is this worth the hassle? */
4792 cfun->can_throw_non_call_exceptions = flag_non_call_exceptions;
4793 cfun->can_delete_dead_exceptions = flag_delete_dead_exceptions;
4794
4795 if (!profile_flag && !flag_instrument_function_entry_exit)
4796 DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (fndecl) = 1;
4797 }
4798
4799 /* Don't enable begin stmt markers if var-tracking at assignments is
4800 disabled. The markers make little sense without the variable
4801 binding annotations among them. */
4802 cfun->debug_nonbind_markers = lang_hooks.emits_begin_stmt
4803 && MAY_HAVE_DEBUG_MARKER_STMTS;
4804 }
4805
4806 /* This is like allocate_struct_function, but pushes a new cfun for FNDECL
4807 instead of just setting it. */
4808
4809 void
4810 push_struct_function (tree fndecl)
4811 {
4812 /* When in_dummy_function we might be in the middle of a pop_cfun and
4813 current_function_decl and cfun may not match. */
4814 gcc_assert (in_dummy_function
4815 || (!cfun && !current_function_decl)
4816 || (cfun && current_function_decl == cfun->decl));
4817 cfun_stack.safe_push (cfun);
4818 current_function_decl = fndecl;
4819 allocate_struct_function (fndecl, false);
4820 }
4821
4822 /* Reset crtl and other non-struct-function variables to defaults as
4823 appropriate for emitting rtl at the start of a function. */
4824
4825 static void
4826 prepare_function_start (void)
4827 {
4828 gcc_assert (!get_last_insn ());
4829 init_temp_slots ();
4830 init_emit ();
4831 init_varasm_status ();
4832 init_expr ();
4833 default_rtl_profile ();
4834
4835 if (flag_stack_usage_info)
4836 {
4837 cfun->su = ggc_cleared_alloc<stack_usage> ();
4838 cfun->su->static_stack_size = -1;
4839 }
4840
4841 cse_not_expected = ! optimize;
4842
4843 /* Caller save not needed yet. */
4844 caller_save_needed = 0;
4845
4846 /* We haven't done register allocation yet. */
4847 reg_renumber = 0;
4848
4849 /* Indicate that we have not instantiated virtual registers yet. */
4850 virtuals_instantiated = 0;
4851
4852 /* Indicate that we want CONCATs now. */
4853 generating_concat_p = 1;
4854
4855 /* Indicate we have no need of a frame pointer yet. */
4856 frame_pointer_needed = 0;
4857 }
4858
4859 void
4860 push_dummy_function (bool with_decl)
4861 {
4862 tree fn_decl, fn_type, fn_result_decl;
4863
4864 gcc_assert (!in_dummy_function);
4865 in_dummy_function = true;
4866
4867 if (with_decl)
4868 {
4869 fn_type = build_function_type_list (void_type_node, NULL_TREE);
4870 fn_decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL, NULL_TREE,
4871 fn_type);
4872 fn_result_decl = build_decl (UNKNOWN_LOCATION, RESULT_DECL,
4873 NULL_TREE, void_type_node);
4874 DECL_RESULT (fn_decl) = fn_result_decl;
4875 }
4876 else
4877 fn_decl = NULL_TREE;
4878
4879 push_struct_function (fn_decl);
4880 }
4881
4882 /* Initialize the rtl expansion mechanism so that we can do simple things
4883 like generate sequences. This is used to provide a context during global
4884 initialization of some passes. You must call expand_dummy_function_end
4885 to exit this context. */
4886
4887 void
4888 init_dummy_function_start (void)
4889 {
4890 push_dummy_function (false);
4891 prepare_function_start ();
4892 }
4893
4894 /* Generate RTL for the start of the function SUBR (a FUNCTION_DECL tree node)
4895 and initialize static variables for generating RTL for the statements
4896 of the function. */
4897
4898 void
4899 init_function_start (tree subr)
4900 {
4901 /* Initialize backend, if needed. */
4902 initialize_rtl ();
4903
4904 prepare_function_start ();
4905 decide_function_section (subr);
4906
4907 /* Warn if the return value is an aggregate type,
4908 regardless of which calling convention we are using for it. */
4909 if (AGGREGATE_TYPE_P (TREE_TYPE (DECL_RESULT (subr))))
4910 warning (OPT_Waggregate_return, "function returns an aggregate");
4911 }
4912
4913 /* Expand code to verify the stack_protect_guard. This is invoked at
4914 the end of a function to be protected. */
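
/* Conceptually the sequence emitted below is

     x = <canary stored in this frame>;
     y = <reference guard value>;            // e.g. from GUARD_DECL
     if (x == y) goto ok;
     targetm.stack_protect_fail ();          // typically __stack_chk_fail
   ok:

   This is only a sketch; many targets provide a combined compare-and-jump
   pattern so that the guard value never leaks into a register.  */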
4915
4916 void
4917 stack_protect_epilogue (void)
4918 {
4919 tree guard_decl = crtl->stack_protect_guard_decl;
4920 rtx_code_label *label = gen_label_rtx ();
4921 rtx x, y;
4922 rtx_insn *seq = NULL;
4923
4924 x = expand_normal (crtl->stack_protect_guard);
4925
4926 if (targetm.have_stack_protect_combined_test () && guard_decl)
4927 {
4928 gcc_assert (DECL_P (guard_decl));
4929 y = DECL_RTL (guard_decl);
4930 /* Allow the target to compute the address of Y and compare it with X
4931 without leaking Y into a register. This combined address + compare
4932 pattern allows the target to prevent spilling of any intermediate
4933 results by splitting the pattern after register allocation. */
4934 seq = targetm.gen_stack_protect_combined_test (x, y, label);
4935 }
4936 else
4937 {
4938 if (guard_decl)
4939 y = expand_normal (guard_decl);
4940 else
4941 y = const0_rtx;
4942
4943 /* Allow the target to compare Y with X without leaking either into
4944 a register. */
4945 if (targetm.have_stack_protect_test ())
4946 seq = targetm.gen_stack_protect_test (x, y, label);
4947 }
4948
4949 if (seq)
4950 emit_insn (seq);
4951 else
4952 emit_cmp_and_jump_insns (x, y, EQ, NULL_RTX, ptr_mode, 1, label);
4953
4954 /* The noreturn predictor has been moved to the tree level. The rtl-level
4955 predictors estimate this branch at about 20%, which isn't enough to get
4956 things moved out of line. Since this is the only extant case of adding
4957 a noreturn function at the rtl level, it doesn't seem worth doing anything
4958 except adding the prediction by hand. */
4959 rtx_insn *tmp = get_last_insn ();
4960 if (JUMP_P (tmp))
4961 predict_insn_def (tmp, PRED_NORETURN, TAKEN);
4962
4963 expand_call (targetm.stack_protect_fail (), NULL_RTX, /*ignore=*/true);
4964 free_temp_slots ();
4965 emit_label (label);
4966 }
4967 \f
4968 /* Start the RTL for a new function, and set variables used for
4969 emitting RTL.
4970 SUBR is the FUNCTION_DECL node.
4971 PARMS_HAVE_CLEANUPS is nonzero if there are cleanups associated with
4972 the function's parameters, which must be run at any return statement. */
4973
4974 void
4975 expand_function_start (tree subr)
4976 {
4977 /* Make sure volatile mem refs aren't considered
4978 valid operands of arithmetic insns. */
4979 init_recog_no_volatile ();
4980
4981 crtl->profile
4982 = (profile_flag
4983 && ! DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (subr));
4984
4985 crtl->limit_stack
4986 = (stack_limit_rtx != NULL_RTX && ! DECL_NO_LIMIT_STACK (subr));
4987
4988 /* Make the label for return statements to jump to. Do not special
4989 case machines with special return instructions -- they will be
4990 handled later during jump, ifcvt, or epilogue creation. */
4991 return_label = gen_label_rtx ();
4992
4993 /* Initialize rtx used to return the value. */
4994 /* Do this before assign_parms so that we copy the struct value address
4995 before any library calls that assign parms might generate. */
4996
4997 /* Decide whether to return the value in memory or in a register. */
4998 tree res = DECL_RESULT (subr);
4999 if (aggregate_value_p (res, subr))
5000 {
5001 /* Returning something that won't go in a register. */
5002 rtx value_address = 0;
5003
5004 #ifdef PCC_STATIC_STRUCT_RETURN
5005 if (cfun->returns_pcc_struct)
5006 {
5007 int size = int_size_in_bytes (TREE_TYPE (res));
5008 value_address = assemble_static_space (size);
5009 }
5010 else
5011 #endif
5012 {
5013 rtx sv = targetm.calls.struct_value_rtx (TREE_TYPE (subr), 2);
5014 /* Expect to be passed the address of a place to store the value.
5015 If it is passed as an argument, assign_parms will take care of
5016 it. */
5017 if (sv)
5018 {
5019 value_address = gen_reg_rtx (Pmode);
5020 emit_move_insn (value_address, sv);
5021 }
5022 }
5023 if (value_address)
5024 {
5025 rtx x = value_address;
5026 if (!DECL_BY_REFERENCE (res))
5027 {
5028 x = gen_rtx_MEM (DECL_MODE (res), x);
5029 set_mem_attributes (x, res, 1);
5030 }
5031 set_parm_rtl (res, x);
5032 }
5033 }
5034 else if (DECL_MODE (res) == VOIDmode)
5035 /* If return mode is void, this decl rtl should not be used. */
5036 set_parm_rtl (res, NULL_RTX);
5037 else
5038 {
5039 /* Compute the return values into a pseudo reg, which we will copy
5040 into the true return register after the cleanups are done. */
5041 tree return_type = TREE_TYPE (res);
5042
5043 /* If we may coalesce this result, make sure it has the expected mode
5044 in case it was promoted. But we need not bother about BLKmode. */
5045 machine_mode promoted_mode
5046 = flag_tree_coalesce_vars && is_gimple_reg (res)
5047 ? promote_ssa_mode (ssa_default_def (cfun, res), NULL)
5048 : BLKmode;
5049
5050 if (promoted_mode != BLKmode)
5051 set_parm_rtl (res, gen_reg_rtx (promoted_mode));
5052 else if (TYPE_MODE (return_type) != BLKmode
5053 && targetm.calls.return_in_msb (return_type))
5054 /* expand_function_end will insert the appropriate padding in
5055 this case. Use the return value's natural (unpadded) mode
5056 within the function proper. */
5057 set_parm_rtl (res, gen_reg_rtx (TYPE_MODE (return_type)));
5058 else
5059 {
5060 /* In order to figure out what mode to use for the pseudo, we
5061 figure out what the mode of the eventual return register will
5062 actually be, and use that. */
5063 rtx hard_reg = hard_function_value (return_type, subr, 0, 1);
5064
5065 /* Structures that are returned in registers are not
5066 aggregate_value_p, so we may see a PARALLEL or a REG. */
5067 if (REG_P (hard_reg))
5068 set_parm_rtl (res, gen_reg_rtx (GET_MODE (hard_reg)));
5069 else
5070 {
5071 gcc_assert (GET_CODE (hard_reg) == PARALLEL);
5072 set_parm_rtl (res, gen_group_rtx (hard_reg));
5073 }
5074 }
5075
5076 /* Set DECL_REGISTER flag so that expand_function_end will copy the
5077 result to the real return register(s). */
5078 DECL_REGISTER (res) = 1;
5079 }
5080
5081 /* Initialize rtx for parameters and local variables.
5082 In some cases this requires emitting insns. */
5083 assign_parms (subr);
5084
5085 /* If function gets a static chain arg, store it. */
5086 if (cfun->static_chain_decl)
5087 {
5088 tree parm = cfun->static_chain_decl;
5089 rtx local, chain;
5090 rtx_insn *insn;
5091 int unsignedp;
5092
5093 local = gen_reg_rtx (promote_decl_mode (parm, &unsignedp));
5094 chain = targetm.calls.static_chain (current_function_decl, true);
5095
5096 set_decl_incoming_rtl (parm, chain, false);
5097 set_parm_rtl (parm, local);
5098 mark_reg_pointer (local, TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm))));
5099
5100 if (GET_MODE (local) != GET_MODE (chain))
5101 {
5102 convert_move (local, chain, unsignedp);
5103 insn = get_last_insn ();
5104 }
5105 else
5106 insn = emit_move_insn (local, chain);
5107
5108 /* Mark the register as eliminable, similar to parameters. */
5109 if (MEM_P (chain)
5110 && reg_mentioned_p (arg_pointer_rtx, XEXP (chain, 0)))
5111 set_dst_reg_note (insn, REG_EQUIV, chain, local);
5112
5113 /* If we aren't optimizing, save the static chain onto the stack. */
5114 if (!optimize)
5115 {
5116 tree saved_static_chain_decl
5117 = build_decl (DECL_SOURCE_LOCATION (parm), VAR_DECL,
5118 DECL_NAME (parm), TREE_TYPE (parm));
5119 rtx saved_static_chain_rtx
5120 = assign_stack_local (Pmode, GET_MODE_SIZE (Pmode), 0);
5121 SET_DECL_RTL (saved_static_chain_decl, saved_static_chain_rtx);
5122 emit_move_insn (saved_static_chain_rtx, chain);
5123 SET_DECL_VALUE_EXPR (parm, saved_static_chain_decl);
5124 DECL_HAS_VALUE_EXPR_P (parm) = 1;
5125 }
5126 }
5127
5128 /* The following was moved from init_function_start.
5129 The move was supposed to make sdb output more accurate. */
5130 /* Indicate the beginning of the function body,
5131 as opposed to parm setup. */
5132 emit_note (NOTE_INSN_FUNCTION_BEG);
5133
5134 gcc_assert (NOTE_P (get_last_insn ()));
5135
5136 parm_birth_insn = get_last_insn ();
5137
5138 /* If the function receives a non-local goto, then store the
5139 bits we need to restore the frame pointer. */
5140 if (cfun->nonlocal_goto_save_area)
5141 {
5142 tree t_save;
5143 rtx r_save;
5144
5145 tree var = TREE_OPERAND (cfun->nonlocal_goto_save_area, 0);
5146 gcc_assert (DECL_RTL_SET_P (var));
5147
5148 t_save = build4 (ARRAY_REF,
5149 TREE_TYPE (TREE_TYPE (cfun->nonlocal_goto_save_area)),
5150 cfun->nonlocal_goto_save_area,
5151 integer_zero_node, NULL_TREE, NULL_TREE);
5152 r_save = expand_expr (t_save, NULL_RTX, VOIDmode, EXPAND_WRITE);
5153 gcc_assert (GET_MODE (r_save) == Pmode);
5154
5155 emit_move_insn (r_save, hard_frame_pointer_rtx);
5156 update_nonlocal_goto_save_area ();
5157 }
5158
5159 if (crtl->profile)
5160 {
5161 #ifdef PROFILE_HOOK
5162 PROFILE_HOOK (current_function_funcdef_no);
5163 #endif
5164 }
5165
5166 /* If we are doing generic stack checking, the probe should go here. */
5167 if (flag_stack_check == GENERIC_STACK_CHECK)
5168 stack_check_probe_note = emit_note (NOTE_INSN_DELETED);
5169 }
5170 \f
5171 void
5172 pop_dummy_function (void)
5173 {
5174 pop_cfun ();
5175 in_dummy_function = false;
5176 }
5177
5178 /* Undo the effects of init_dummy_function_start. */
5179 void
5180 expand_dummy_function_end (void)
5181 {
5182 gcc_assert (in_dummy_function);
5183
5184 /* End any sequences that failed to be closed due to syntax errors. */
5185 while (in_sequence_p ())
5186 end_sequence ();
5187
5188 /* Outside function body, can't compute type's actual size
5189 until next function's body starts. */
5190
5191 free_after_parsing (cfun);
5192 free_after_compilation (cfun);
5193 pop_dummy_function ();
5194 }
5195
5196 /* Helper for diddle_return_value. */
5197
5198 void
5199 diddle_return_value_1 (void (*doit) (rtx, void *), void *arg, rtx outgoing)
5200 {
5201 if (! outgoing)
5202 return;
5203
5204 if (REG_P (outgoing))
5205 (*doit) (outgoing, arg);
5206 else if (GET_CODE (outgoing) == PARALLEL)
5207 {
5208 int i;
5209
5210 for (i = 0; i < XVECLEN (outgoing, 0); i++)
5211 {
5212 rtx x = XEXP (XVECEXP (outgoing, 0, i), 0);
5213
5214 if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER)
5215 (*doit) (x, arg);
5216 }
5217 }
5218 }
5219
5220 /* Call DOIT for each hard register used as a return value from
5221 the current function. */
5222
5223 void
5224 diddle_return_value (void (*doit) (rtx, void *), void *arg)
5225 {
5226 diddle_return_value_1 (doit, arg, crtl->return_rtx);
5227 }
5228
5229 static void
5230 do_clobber_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
5231 {
5232 emit_clobber (reg);
5233 }
5234
5235 void
5236 clobber_return_register (void)
5237 {
5238 diddle_return_value (do_clobber_return_reg, NULL);
5239
5240 /* If we use a pseudo to return the value, clobber it too. */
5241 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
5242 {
5243 tree decl_result = DECL_RESULT (current_function_decl);
5244 rtx decl_rtl = DECL_RTL (decl_result);
5245 if (REG_P (decl_rtl) && REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER)
5246 {
5247 do_clobber_return_reg (decl_rtl, NULL);
5248 }
5249 }
5250 }
5251
5252 static void
5253 do_use_return_reg (rtx reg, void *arg ATTRIBUTE_UNUSED)
5254 {
5255 emit_use (reg);
5256 }
5257
5258 static void
5259 use_return_register (void)
5260 {
5261 diddle_return_value (do_use_return_reg, NULL);
5262 }
5263
5264 /* Generate RTL for the end of the current function. */
5265
5266 void
5267 expand_function_end (void)
5268 {
5269 /* If arg_pointer_save_area was referenced only from a nested
5270 function, we will not have initialized it yet. Do that now. */
5271 if (arg_pointer_save_area && ! crtl->arg_pointer_save_area_init)
5272 get_arg_pointer_save_area ();
5273
5274 /* If we are doing generic stack checking and this function makes calls,
5275 do a stack probe at the start of the function to ensure we have enough
5276 space for another stack frame. */
5277 if (flag_stack_check == GENERIC_STACK_CHECK)
5278 {
5279 rtx_insn *insn, *seq;
5280
5281 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5282 if (CALL_P (insn))
5283 {
5284 rtx max_frame_size = GEN_INT (STACK_CHECK_MAX_FRAME_SIZE);
5285 start_sequence ();
5286 if (STACK_CHECK_MOVING_SP)
5287 anti_adjust_stack_and_probe (max_frame_size, true);
5288 else
5289 probe_stack_range (STACK_OLD_CHECK_PROTECT, max_frame_size);
5290 seq = get_insns ();
5291 end_sequence ();
5292 set_insn_locations (seq, prologue_location);
5293 emit_insn_before (seq, stack_check_probe_note);
5294 break;
5295 }
5296 }
5297
5298 /* End any sequences that failed to be closed due to syntax errors. */
5299 while (in_sequence_p ())
5300 end_sequence ();
5301
5302 clear_pending_stack_adjust ();
5303 do_pending_stack_adjust ();
5304
5305 /* Output a line number for the end of the function.
5306 SDB depended on this. */
5307 set_curr_insn_location (input_location);
5308
5309 /* Before the return label (if any), clobber the return
5310 registers so that they are not propagated live to the rest of
5311 the function. This can only happen with functions that drop
5312 through; if there had been a return statement, there would
5313 have either been a return rtx, or a jump to the return label.
5314
5315 We delay the actual code generation until after
5316 current_function_value_rtx is computed. */
5317 rtx_insn *clobber_after = get_last_insn ();
5318
5319 /* Output the label for the actual return from the function. */
5320 emit_label (return_label);
5321
5322 if (targetm_common.except_unwind_info (&global_options) == UI_SJLJ)
5323 {
5324 /* Let except.c know where it should emit the call to unregister
5325 the function context for sjlj exceptions. */
5326 if (flag_exceptions)
5327 sjlj_emit_function_exit_after (get_last_insn ());
5328 }
5329
5330 /* If this is an implementation of throw, do what's necessary to
5331 communicate between __builtin_eh_return and the epilogue. */
5332 expand_eh_return ();
5333
5334 /* If stack protection is enabled for this function, check the guard. */
5335 if (crtl->stack_protect_guard
5336 && targetm.stack_protect_runtime_enabled_p ()
5337 && naked_return_label == NULL_RTX)
5338 stack_protect_epilogue ();
5339
5340 /* If the scalar return value was computed in a pseudo-reg, or was a named
5341 return value that got dumped to the stack, copy it to the hard
5342 return register. */
5343 if (DECL_RTL_SET_P (DECL_RESULT (current_function_decl)))
5344 {
5345 tree decl_result = DECL_RESULT (current_function_decl);
5346 rtx decl_rtl = DECL_RTL (decl_result);
5347
5348 if (REG_P (decl_rtl)
5349 ? REGNO (decl_rtl) >= FIRST_PSEUDO_REGISTER
5350 : DECL_REGISTER (decl_result))
5351 {
5352 rtx real_decl_rtl = crtl->return_rtx;
5353 complex_mode cmode;
5354
5355 /* This should be set in assign_parms. */
5356 gcc_assert (REG_FUNCTION_VALUE_P (real_decl_rtl));
5357
5358 /* If this is a BLKmode structure being returned in registers,
5359 then use the mode computed in expand_return. Note that if
5360 decl_rtl is memory, then its mode may have been changed,
5361 but that of crtl->return_rtx has not. */
5362 if (GET_MODE (real_decl_rtl) == BLKmode)
5363 PUT_MODE (real_decl_rtl, GET_MODE (decl_rtl));
5364
5365 /* If a non-BLKmode return value should be padded at the least
5366 significant end of the register, shift it left by the appropriate
5367 amount. BLKmode results are handled using the group load/store
5368 machinery. */
5369 if (TYPE_MODE (TREE_TYPE (decl_result)) != BLKmode
5370 && REG_P (real_decl_rtl)
5371 && targetm.calls.return_in_msb (TREE_TYPE (decl_result)))
5372 {
5373 emit_move_insn (gen_rtx_REG (GET_MODE (decl_rtl),
5374 REGNO (real_decl_rtl)),
5375 decl_rtl);
5376 shift_return_value (GET_MODE (decl_rtl), true, real_decl_rtl);
5377 }
5378 else if (GET_CODE (real_decl_rtl) == PARALLEL)
5379 {
5380 /* If expand_function_start has created a PARALLEL for decl_rtl,
5381 move the result to the real return registers. Otherwise, do
5382 a group load from decl_rtl for a named return. */
5383 if (GET_CODE (decl_rtl) == PARALLEL)
5384 emit_group_move (real_decl_rtl, decl_rtl);
5385 else
5386 emit_group_load (real_decl_rtl, decl_rtl,
5387 TREE_TYPE (decl_result),
5388 int_size_in_bytes (TREE_TYPE (decl_result)));
5389 }
5390 /* In the case of complex integer modes smaller than a word, we'll
5391 need to generate some non-trivial bitfield insertions. Do that
5392 on a pseudo and not the hard register. */
5393 else if (GET_CODE (decl_rtl) == CONCAT
5394 && is_complex_int_mode (GET_MODE (decl_rtl), &cmode)
5395 && GET_MODE_BITSIZE (cmode) <= BITS_PER_WORD)
5396 {
5397 int old_generating_concat_p;
5398 rtx tmp;
5399
5400 old_generating_concat_p = generating_concat_p;
5401 generating_concat_p = 0;
5402 tmp = gen_reg_rtx (GET_MODE (decl_rtl));
5403 generating_concat_p = old_generating_concat_p;
5404
5405 emit_move_insn (tmp, decl_rtl);
5406 emit_move_insn (real_decl_rtl, tmp);
5407 }
5408 /* If a named return value dumped decl_result to memory, then
5409 we may need to re-do the PROMOTE_MODE signed/unsigned
5410 extension. */
5411 else if (GET_MODE (real_decl_rtl) != GET_MODE (decl_rtl))
5412 {
5413 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (decl_result));
5414 promote_function_mode (TREE_TYPE (decl_result),
5415 GET_MODE (decl_rtl), &unsignedp,
5416 TREE_TYPE (current_function_decl), 1);
5417
5418 convert_move (real_decl_rtl, decl_rtl, unsignedp);
5419 }
5420 else
5421 emit_move_insn (real_decl_rtl, decl_rtl);
5422 }
5423 }
5424
5425 /* If returning a structure, arrange to return the address of the value
5426 in a place where debuggers expect to find it.
5427
5428 If returning a structure PCC style,
5429 the caller also depends on this value.
5430 And cfun->returns_pcc_struct is not necessarily set. */
5431 if ((cfun->returns_struct || cfun->returns_pcc_struct)
5432 && !targetm.calls.omit_struct_return_reg)
5433 {
5434 rtx value_address = DECL_RTL (DECL_RESULT (current_function_decl));
5435 tree type = TREE_TYPE (DECL_RESULT (current_function_decl));
5436 rtx outgoing;
5437
5438 if (DECL_BY_REFERENCE (DECL_RESULT (current_function_decl)))
5439 type = TREE_TYPE (type);
5440 else
5441 value_address = XEXP (value_address, 0);
5442
5443 outgoing = targetm.calls.function_value (build_pointer_type (type),
5444 current_function_decl, true);
5445
5446 /* Mark this as a function return value so integrate will delete the
5447 assignment and USE below when inlining this function. */
5448 REG_FUNCTION_VALUE_P (outgoing) = 1;
5449
5450 /* The address may be ptr_mode and OUTGOING may be Pmode. */
5451 scalar_int_mode mode = as_a <scalar_int_mode> (GET_MODE (outgoing));
5452 value_address = convert_memory_address (mode, value_address);
5453
5454 emit_move_insn (outgoing, value_address);
5455
5456 /* Show the return register used to hold the result (in this case
5457 the address of the result). */
5458 crtl->return_rtx = outgoing;
5459 }
5460
5461 /* Emit the actual code to clobber the return register. Don't emit
5462 it if clobber_after is a barrier; in that case the previous basic
5463 block certainly doesn't fall through into the exit block. */
5464 if (!BARRIER_P (clobber_after))
5465 {
5466 start_sequence ();
5467 clobber_return_register ();
5468 rtx_insn *seq = get_insns ();
5469 end_sequence ();
5470
5471 emit_insn_after (seq, clobber_after);
5472 }
5473
5474 /* Output the label for the naked return from the function. */
5475 if (naked_return_label)
5476 emit_label (naked_return_label);
5477
5478 /* @@@ This is a kludge. We want to ensure that instructions that
5479 may trap are not moved into the epilogue by scheduling, because
5480 we don't always emit unwind information for the epilogue. */
5481 if (cfun->can_throw_non_call_exceptions
5482 && targetm_common.except_unwind_info (&global_options) != UI_SJLJ)
5483 emit_insn (gen_blockage ());
5484
5485 /* If stack protection is enabled for this function, check the guard. */
5486 if (crtl->stack_protect_guard
5487 && targetm.stack_protect_runtime_enabled_p ()
5488 && naked_return_label)
5489 stack_protect_epilogue ();
5490
5491 /* If we had calls to alloca, and this machine needs
5492 an accurate stack pointer to exit the function,
5493 insert some code to save and restore the stack pointer. */
5494 if (! EXIT_IGNORE_STACK
5495 && cfun->calls_alloca)
5496 {
5497 rtx tem = 0;
5498
5499 start_sequence ();
5500 emit_stack_save (SAVE_FUNCTION, &tem);
5501 rtx_insn *seq = get_insns ();
5502 end_sequence ();
5503 emit_insn_before (seq, parm_birth_insn);
5504
5505 emit_stack_restore (SAVE_FUNCTION, tem);
5506 }
5507
5508 /* ??? This should no longer be necessary since stupid is no longer with
5509 us, but there are some parts of the compiler (e.g. reload_combine and
5510 sh mach_dep_reorg) that still try to compute their own lifetime info
5511 instead of using the general framework. */
5512 use_return_register ();
5513 }
5514
5515 rtx
5516 get_arg_pointer_save_area (void)
5517 {
5518 rtx ret = arg_pointer_save_area;
5519
5520 if (! ret)
5521 {
5522 ret = assign_stack_local (Pmode, GET_MODE_SIZE (Pmode), 0);
5523 arg_pointer_save_area = ret;
5524 }
5525
5526 if (! crtl->arg_pointer_save_area_init)
5527 {
5528 /* Save the arg pointer at the beginning of the function. The
5529 generated stack slot may not be a valid memory address, so we
5530 have to check it and fix it if necessary. */
5531 start_sequence ();
5532 emit_move_insn (validize_mem (copy_rtx (ret)),
5533 crtl->args.internal_arg_pointer);
5534 rtx_insn *seq = get_insns ();
5535 end_sequence ();
5536
5537 push_topmost_sequence ();
5538 emit_insn_after (seq, entry_of_function ());
5539 pop_topmost_sequence ();
5540
5541 crtl->arg_pointer_save_area_init = true;
5542 }
5543
5544 return ret;
5545 }
5546 \f
5547
5548 /* If debugging dumps are requested, dump information about how the
5549 target handled -fstack-clash-protection for the prologue.
5550
5551 PROBES describes what if any probes were emitted.
5552
5553 RESIDUALS indicates if the prologue had any residual allocation
5554 (i.e. total allocation was not a multiple of PROBE_INTERVAL). */
5555
5556 void
5557 dump_stack_clash_frame_info (enum stack_clash_probes probes, bool residuals)
5558 {
5559 if (!dump_file)
5560 return;
5561
5562 switch (probes)
5563 {
5564 case NO_PROBE_NO_FRAME:
5565 fprintf (dump_file,
5566 "Stack clash no probe no stack adjustment in prologue.\n");
5567 break;
5568 case NO_PROBE_SMALL_FRAME:
5569 fprintf (dump_file,
5570 "Stack clash no probe small stack adjustment in prologue.\n");
5571 break;
5572 case PROBE_INLINE:
5573 fprintf (dump_file, "Stack clash inline probes in prologue.\n");
5574 break;
5575 case PROBE_LOOP:
5576 fprintf (dump_file, "Stack clash probe loop in prologue.\n");
5577 break;
5578 }
5579
5580 if (residuals)
5581 fprintf (dump_file, "Stack clash residual allocation in prologue.\n");
5582 else
5583 fprintf (dump_file, "Stack clash no residual allocation in prologue.\n");
5584
5585 if (frame_pointer_needed)
5586 fprintf (dump_file, "Stack clash frame pointer needed.\n");
5587 else
5588 fprintf (dump_file, "Stack clash no frame pointer needed.\n");
5589
5590 if (TREE_THIS_VOLATILE (cfun->decl))
5591 fprintf (dump_file,
5592 "Stack clash noreturn prologue, assuming no implicit"
5593 " probes in caller.\n");
5594 else
5595 fprintf (dump_file,
5596 "Stack clash not noreturn prologue.\n");
5597 }
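/* Editorial note (an illustration, assuming a target whose prologue
   expander calls this hook and that a dump file is active): a function
   compiled with -fstack-clash-protection whose frame needed inline
   probing plus a residual allocation would be recorded as

     Stack clash inline probes in prologue.
     Stack clash residual allocation in prologue.
     Stack clash no frame pointer needed.
     Stack clash not noreturn prologue.

   in the dump.  */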
5598
5599 /* Add a list of INSNS to the hash HASHP, possibly allocating HASHP
5600 for the first time. */
5601
5602 static void
5603 record_insns (rtx_insn *insns, rtx end, hash_table<insn_cache_hasher> **hashp)
5604 {
5605 rtx_insn *tmp;
5606 hash_table<insn_cache_hasher> *hash = *hashp;
5607
5608 if (hash == NULL)
5609 *hashp = hash = hash_table<insn_cache_hasher>::create_ggc (17);
5610
5611 for (tmp = insns; tmp != end; tmp = NEXT_INSN (tmp))
5612 {
5613 rtx *slot = hash->find_slot (tmp, INSERT);
5614 gcc_assert (*slot == NULL);
5615 *slot = tmp;
5616 }
5617 }
5618
5619 /* INSN has been duplicated or replaced as COPY, perhaps by duplicating a
5620 basic block, by splitting, or by peepholes. If INSN is a prologue or
5621 epilogue insn, then record COPY as well. */
5622
5623 void
5624 maybe_copy_prologue_epilogue_insn (rtx insn, rtx copy)
5625 {
5626 hash_table<insn_cache_hasher> *hash;
5627 rtx *slot;
5628
5629 hash = epilogue_insn_hash;
5630 if (!hash || !hash->find (insn))
5631 {
5632 hash = prologue_insn_hash;
5633 if (!hash || !hash->find (insn))
5634 return;
5635 }
5636
5637 slot = hash->find_slot (copy, INSERT);
5638 gcc_assert (*slot == NULL);
5639 *slot = copy;
5640 }
5641
5642 /* Determine if any INSNs in HASH are, or are part of, INSN. Because
5643 we can be running after reorg, SEQUENCE rtl is possible. */
5644
5645 static bool
5646 contains (const rtx_insn *insn, hash_table<insn_cache_hasher> *hash)
5647 {
5648 if (hash == NULL)
5649 return false;
5650
5651 if (NONJUMP_INSN_P (insn) && GET_CODE (PATTERN (insn)) == SEQUENCE)
5652 {
5653 rtx_sequence *seq = as_a <rtx_sequence *> (PATTERN (insn));
5654 int i;
5655 for (i = seq->len () - 1; i >= 0; i--)
5656 if (hash->find (seq->element (i)))
5657 return true;
5658 return false;
5659 }
5660
5661 return hash->find (const_cast<rtx_insn *> (insn)) != NULL;
5662 }
5663
5664 int
5665 prologue_contains (const rtx_insn *insn)
5666 {
5667 return contains (insn, prologue_insn_hash);
5668 }
5669
5670 int
5671 epilogue_contains (const rtx_insn *insn)
5672 {
5673 return contains (insn, epilogue_insn_hash);
5674 }
5675
5676 int
5677 prologue_epilogue_contains (const rtx_insn *insn)
5678 {
5679 if (contains (insn, prologue_insn_hash))
5680 return 1;
5681 if (contains (insn, epilogue_insn_hash))
5682 return 1;
5683 return 0;
5684 }
5685
5686 void
5687 record_prologue_seq (rtx_insn *seq)
5688 {
5689 record_insns (seq, NULL, &prologue_insn_hash);
5690 }
5691
5692 void
5693 record_epilogue_seq (rtx_insn *seq)
5694 {
5695 record_insns (seq, NULL, &epilogue_insn_hash);
5696 }
5697
5698 /* Set JUMP_LABEL for a return insn. */
5699
5700 void
5701 set_return_jump_label (rtx_insn *returnjump)
5702 {
5703 rtx pat = PATTERN (returnjump);
5704 if (GET_CODE (pat) == PARALLEL)
5705 pat = XVECEXP (pat, 0, 0);
5706 if (ANY_RETURN_P (pat))
5707 JUMP_LABEL (returnjump) = pat;
5708 else
5709 JUMP_LABEL (returnjump) = ret_rtx;
5710 }
5711
5712 /* Return a sequence to be used as the split prologue for the current
5713 function, or NULL. */
5714
5715 static rtx_insn *
5716 make_split_prologue_seq (void)
5717 {
5718 if (!flag_split_stack
5719 || lookup_attribute ("no_split_stack", DECL_ATTRIBUTES (cfun->decl)))
5720 return NULL;
5721
5722 start_sequence ();
5723 emit_insn (targetm.gen_split_stack_prologue ());
5724 rtx_insn *seq = get_insns ();
5725 end_sequence ();
5726
5727 record_insns (seq, NULL, &prologue_insn_hash);
5728 set_insn_locations (seq, prologue_location);
5729
5730 return seq;
5731 }
5732
5733 /* Return a sequence to be used as the prologue for the current function,
5734 or NULL. */
5735
5736 static rtx_insn *
5737 make_prologue_seq (void)
5738 {
5739 if (!targetm.have_prologue ())
5740 return NULL;
5741
5742 start_sequence ();
5743 rtx_insn *seq = targetm.gen_prologue ();
5744 emit_insn (seq);
5745
5746 /* Insert an explicit USE for the frame pointer
5747 if profiling is on and the frame pointer is required. */
5748 if (crtl->profile && frame_pointer_needed)
5749 emit_use (hard_frame_pointer_rtx);
5750
5751 /* Retain a map of the prologue insns. */
5752 record_insns (seq, NULL, &prologue_insn_hash);
5753 emit_note (NOTE_INSN_PROLOGUE_END);
5754
5755 /* Ensure that instructions are not moved into the prologue when
5756 profiling is on. The call to the profiling routine can be
5757 emitted within the live range of a call-clobbered register. */
5758 if (!targetm.profile_before_prologue () && crtl->profile)
5759 emit_insn (gen_blockage ());
5760
5761 seq = get_insns ();
5762 end_sequence ();
5763 set_insn_locations (seq, prologue_location);
5764
5765 return seq;
5766 }
5767
5768 /* Return a sequence to be used as the epilogue for the current function,
5769 or NULL. */
5770
5771 static rtx_insn *
5772 make_epilogue_seq (void)
5773 {
5774 if (!targetm.have_epilogue ())
5775 return NULL;
5776
5777 start_sequence ();
5778 emit_note (NOTE_INSN_EPILOGUE_BEG);
5779 rtx_insn *seq = targetm.gen_epilogue ();
5780 if (seq)
5781 emit_jump_insn (seq);
5782
5783 /* Retain a map of the epilogue insns. */
5784 record_insns (seq, NULL, &epilogue_insn_hash);
5785 set_insn_locations (seq, epilogue_location);
5786
5787 seq = get_insns ();
5788 rtx_insn *returnjump = get_last_insn ();
5789 end_sequence ();
5790
5791 if (JUMP_P (returnjump))
5792 set_return_jump_label (returnjump);
5793
5794 return seq;
5795 }
5796
5797
5798 /* Generate the prologue and epilogue RTL if the machine supports it. Thread
5799 this into place with notes indicating where the prologue ends and where
5800 the epilogue begins. Update the basic block information when possible.
5801
5802 Notes on epilogue placement:
5803 There are several kinds of edges to the exit block:
5804 * a single fallthru edge from LAST_BB
5805 * possibly, edges from blocks containing sibcalls
5806 * possibly, fake edges from infinite loops
5807
5808 The epilogue is always emitted on the fallthru edge from the last basic
5809 block in the function, LAST_BB, into the exit block.
5810
5811 If LAST_BB is empty except for a label, it is the target of every
5812 other basic block in the function that ends in a return. If a
5813 target has a return or simple_return pattern (possibly with
5814 conditional variants), these basic blocks can be changed so that a
5815 return insn is emitted into them, and their target is adjusted to
5816 the real exit block.
5817
5818 Notes on shrink wrapping: We implement a fairly conservative
5819 version of shrink-wrapping rather than the textbook one. We only
5820 generate a single prologue and a single epilogue. This is
5821 sufficient to catch a number of interesting cases involving early
5822 exits.
5823
5824 First, we identify the blocks that require the prologue to occur before
5825 them. These are the ones that modify a call-saved register, or reference
5826 any of the stack or frame pointer registers. To simplify things, we then
5827 mark everything reachable from these blocks as also requiring a prologue.
5828 This takes care of loops automatically, and avoids the need to examine
5829 whether MEMs reference the frame, since it is sufficient to check for
5830 occurrences of the stack or frame pointer.
5831
5832 We then compute the set of blocks for which the need for a prologue
5833 is anticipatable (borrowing terminology from the shrink-wrapping
5834 description in Muchnick's book). These are the blocks which either
5835 require a prologue themselves, or those that have only successors
5836 where the prologue is anticipatable. The prologue needs to be
5837 inserted on all edges from BB1->BB2 where BB2 is in ANTIC and BB1
5838 is not. For the moment, we ensure that only one such edge exists.
5839
5840 The epilogue is placed as described above, but we make a
5841 distinction between inserting return and simple_return patterns
5842 when modifying other blocks that end in a return. Blocks that end
5843 in a sibcall omit the sibcall_epilogue if the block is not in
5844 ANTIC. */
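/* Editorial note (an illustrative sketch, not from the original source;
   `g' is a hypothetical external function):

     int
     f (int *p)
     {
       if (!p)
	 return -1;
       return g (p) + p[0];
     }

   Only the block containing the call to g needs a call-saved register
   (P must live across the call) and hence the prologue, so the prologue
   is inserted on the edge into that block and the early-return path
   runs without it.  */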
5845
5846 void
5847 thread_prologue_and_epilogue_insns (void)
5848 {
5849 df_analyze ();
5850
5851 /* We can't deal with multiple successors of the entry block at the
5852 moment. A function should always have at least one entry
5853 point. */
5854 gcc_assert (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
5855
5856 edge entry_edge = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5857 edge orig_entry_edge = entry_edge;
5858
5859 rtx_insn *split_prologue_seq = make_split_prologue_seq ();
5860 rtx_insn *prologue_seq = make_prologue_seq ();
5861 rtx_insn *epilogue_seq = make_epilogue_seq ();
5862
5863 /* Try to perform a kind of shrink-wrapping, making sure the
5864 prologue/epilogue is emitted only around those parts of the
5865 function that require it. */
5866 try_shrink_wrapping (&entry_edge, prologue_seq);
5867
5868 /* If the target can handle splitting the prologue/epilogue into separate
5869 components, try to shrink-wrap these components separately. */
5870 try_shrink_wrapping_separate (entry_edge->dest);
5871
5872 /* If that did anything for any component, we now need to generate the
5873 "main" prologue again. Because some targets require some of these
5874 to be called in a specific order (i386 requires the split prologue
5875 to be first, for example), we create all three sequences again here.
5876 If this does not work for some target, that target should not enable
5877 separate shrink-wrapping. */
5878 if (crtl->shrink_wrapped_separate)
5879 {
5880 split_prologue_seq = make_split_prologue_seq ();
5881 prologue_seq = make_prologue_seq ();
5882 epilogue_seq = make_epilogue_seq ();
5883 }
5884
5885 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5886
5887 /* A small fib -- epilogue is not yet completed, but we wish to re-use
5888 this marker for the splits of EH_RETURN patterns, and nothing else
5889 uses the flag in the meantime. */
5890 epilogue_completed = 1;
5891
5892 /* Find non-fallthru edges that end with EH_RETURN instructions. On
5893 some targets, these get split to a special version of the epilogue
5894 code. In order to be able to properly annotate these with unwind
5895 info, try to split them now. If we get a valid split, drop an
5896 EPILOGUE_BEG note and mark the insns as epilogue insns. */
5897 edge e;
5898 edge_iterator ei;
5899 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5900 {
5901 rtx_insn *prev, *last, *trial;
5902
5903 if (e->flags & EDGE_FALLTHRU)
5904 continue;
5905 last = BB_END (e->src);
5906 if (!eh_returnjump_p (last))
5907 continue;
5908
5909 prev = PREV_INSN (last);
5910 trial = try_split (PATTERN (last), last, 1);
5911 if (trial == last)
5912 continue;
5913
5914 record_insns (NEXT_INSN (prev), NEXT_INSN (trial), &epilogue_insn_hash);
5915 emit_note_after (NOTE_INSN_EPILOGUE_BEG, prev);
5916 }
5917
5918 edge exit_fallthru_edge = find_fallthru_edge (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds);
5919
5920 if (exit_fallthru_edge)
5921 {
5922 if (epilogue_seq)
5923 {
5924 insert_insn_on_edge (epilogue_seq, exit_fallthru_edge);
5925 commit_edge_insertions ();
5926
5927 /* The epilogue insns we inserted may cause the exit edge to no longer
5928 be fallthru. */
5929 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5930 {
5931 if (((e->flags & EDGE_FALLTHRU) != 0)
5932 && returnjump_p (BB_END (e->src)))
5933 e->flags &= ~EDGE_FALLTHRU;
5934 }
5935 }
5936 else if (next_active_insn (BB_END (exit_fallthru_edge->src)))
5937 {
5938 /* We have a fall-through edge to the exit block, the source is not
5939 at the end of the function, and there will be an assembler epilogue
5940 at the end of the function.
5941 We can't use force_nonfallthru here, because that would try to
5942 use return. Inserting a jump 'by hand' is extremely messy, so
5943 we take advantage of cfg_layout_finalize using
5944 fixup_fallthru_exit_predecessor. */
5945 cfg_layout_initialize (0);
5946 basic_block cur_bb;
5947 FOR_EACH_BB_FN (cur_bb, cfun)
5948 if (cur_bb->index >= NUM_FIXED_BLOCKS
5949 && cur_bb->next_bb->index >= NUM_FIXED_BLOCKS)
5950 cur_bb->aux = cur_bb->next_bb;
5951 cfg_layout_finalize ();
5952 }
5953 }
5954
5955 /* Insert the prologue. */
5956
5957 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5958
5959 if (split_prologue_seq || prologue_seq)
5960 {
5961 rtx_insn *split_prologue_insn = split_prologue_seq;
5962 if (split_prologue_seq)
5963 {
5964 while (split_prologue_insn && !NONDEBUG_INSN_P (split_prologue_insn))
5965 split_prologue_insn = NEXT_INSN (split_prologue_insn);
5966 insert_insn_on_edge (split_prologue_seq, orig_entry_edge);
5967 }
5968
5969 rtx_insn *prologue_insn = prologue_seq;
5970 if (prologue_seq)
5971 {
5972 while (prologue_insn && !NONDEBUG_INSN_P (prologue_insn))
5973 prologue_insn = NEXT_INSN (prologue_insn);
5974 insert_insn_on_edge (prologue_seq, entry_edge);
5975 }
5976
5977 commit_edge_insertions ();
5978
5979 /* Look for basic blocks within the prologue insns. */
5980 if (split_prologue_insn
5981 && BLOCK_FOR_INSN (split_prologue_insn) == NULL)
5982 split_prologue_insn = NULL;
5983 if (prologue_insn
5984 && BLOCK_FOR_INSN (prologue_insn) == NULL)
5985 prologue_insn = NULL;
5986 if (split_prologue_insn || prologue_insn)
5987 {
5988 auto_sbitmap blocks (last_basic_block_for_fn (cfun));
5989 bitmap_clear (blocks);
5990 if (split_prologue_insn)
5991 bitmap_set_bit (blocks,
5992 BLOCK_FOR_INSN (split_prologue_insn)->index);
5993 if (prologue_insn)
5994 bitmap_set_bit (blocks, BLOCK_FOR_INSN (prologue_insn)->index);
5995 find_many_sub_basic_blocks (blocks);
5996 }
5997 }
5998
5999 default_rtl_profile ();
6000
6001 /* Emit sibling epilogues before any sibling call sites. */
6002 for (ei = ei_start (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds);
6003 (e = ei_safe_edge (ei));
6004 ei_next (&ei))
6005 {
6006 /* Skip edges already handled, i.e. those that run without the prologue. */
6007 if (e->flags & EDGE_IGNORE)
6008 {
6009 e->flags &= ~EDGE_IGNORE;
6010 continue;
6011 }
6012
6013 rtx_insn *insn = BB_END (e->src);
6014
6015 if (!(CALL_P (insn) && SIBLING_CALL_P (insn)))
6016 continue;
6017
6018 if (rtx_insn *ep_seq = targetm.gen_sibcall_epilogue ())
6019 {
6020 start_sequence ();
6021 emit_note (NOTE_INSN_EPILOGUE_BEG);
6022 emit_insn (ep_seq);
6023 rtx_insn *seq = get_insns ();
6024 end_sequence ();
6025
6026 /* Retain a map of the epilogue insns. Used in life analysis to
6027 avoid getting rid of sibcall epilogue insns. Do this before we
6028 actually emit the sequence. */
6029 record_insns (seq, NULL, &epilogue_insn_hash);
6030 set_insn_locations (seq, epilogue_location);
6031
6032 emit_insn_before (seq, insn);
6033 }
6034 }
6035
6036 if (epilogue_seq)
6037 {
6038 rtx_insn *insn, *next;
6039
6040 /* Similarly, move any line notes that appear after the epilogue.
6041 There is no need, however, to be quite so anal about the existence
6042 of such a note. Also possibly move
6043 NOTE_INSN_FUNCTION_BEG notes, as those can be relevant for debug
6044 info generation. */
6045 for (insn = epilogue_seq; insn; insn = next)
6046 {
6047 next = NEXT_INSN (insn);
6048 if (NOTE_P (insn)
6049 && (NOTE_KIND (insn) == NOTE_INSN_FUNCTION_BEG))
6050 reorder_insns (insn, insn, PREV_INSN (epilogue_seq));
6051 }
6052 }
6053
6054 /* Threading the prologue and epilogue changes the artificial refs
6055 in the entry and exit blocks. */
6056 epilogue_completed = 1;
6057 df_update_entry_exit_and_calls ();
6058 }
6059
6060 /* Reposition the prologue-end and epilogue-begin notes after
6061 instruction scheduling. */
6062
6063 void
6064 reposition_prologue_and_epilogue_notes (void)
6065 {
6066 if (!targetm.have_prologue ()
6067 && !targetm.have_epilogue ()
6068 && !targetm.have_sibcall_epilogue ())
6069 return;
6070
6071 /* Since the hash table is created on demand, the fact that it is
6072 non-null is a signal that it is non-empty. */
6073 if (prologue_insn_hash != NULL)
6074 {
6075 size_t len = prologue_insn_hash->elements ();
6076 rtx_insn *insn, *last = NULL, *note = NULL;
6077
6078 /* Scan from the beginning until we reach the last prologue insn. */
6079 /* ??? While we do have the CFG intact, there are two problems:
6080 (1) The prologue can contain loops (typically probing the stack),
6081 which means that the end of the prologue isn't in the first bb.
6082 (2) Sometimes the PROLOGUE_END note gets pushed into the next bb. */
6083 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
6084 {
6085 if (NOTE_P (insn))
6086 {
6087 if (NOTE_KIND (insn) == NOTE_INSN_PROLOGUE_END)
6088 note = insn;
6089 }
6090 else if (contains (insn, prologue_insn_hash))
6091 {
6092 last = insn;
6093 if (--len == 0)
6094 break;
6095 }
6096 }
6097
6098 if (last)
6099 {
6100 if (note == NULL)
6101 {
6102 /* Scan forward looking for the PROLOGUE_END note. It should
6103 be right at the beginning of the block, possibly with other
6104 insn notes that got moved there. */
6105 for (note = NEXT_INSN (last); ; note = NEXT_INSN (note))
6106 {
6107 if (NOTE_P (note)
6108 && NOTE_KIND (note) == NOTE_INSN_PROLOGUE_END)
6109 break;
6110 }
6111 }
6112
6113 /* Avoid placing note between CODE_LABEL and BASIC_BLOCK note. */
6114 if (LABEL_P (last))
6115 last = NEXT_INSN (last);
6116 reorder_insns (note, note, last);
6117 }
6118 }
6119
6120 if (epilogue_insn_hash != NULL)
6121 {
6122 edge_iterator ei;
6123 edge e;
6124
6125 FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6126 {
6127 rtx_insn *insn, *first = NULL, *note = NULL;
6128 basic_block bb = e->src;
6129
6130 /* Scan from the beginning until we reach the first epilogue insn. */
6131 FOR_BB_INSNS (bb, insn)
6132 {
6133 if (NOTE_P (insn))
6134 {
6135 if (NOTE_KIND (insn) == NOTE_INSN_EPILOGUE_BEG)
6136 {
6137 note = insn;
6138 if (first != NULL)
6139 break;
6140 }
6141 }
6142 else if (first == NULL && contains (insn, epilogue_insn_hash))
6143 {
6144 first = insn;
6145 if (note != NULL)
6146 break;
6147 }
6148 }
6149
6150 if (note)
6151 {
6152 /* If the function has a single basic block, and no real
6153 epilogue insns (e.g. sibcall with no cleanup), the
6154 epilogue note can get scheduled before the prologue
6155 note. If we have frame related prologue insns, having
6156 them scanned during the epilogue will result in a crash.
6157 In this case re-order the epilogue note to just before
6158 the last insn in the block. */
6159 if (first == NULL)
6160 first = BB_END (bb);
6161
6162 if (PREV_INSN (first) != note)
6163 reorder_insns (note, note, PREV_INSN (first));
6164 }
6165 }
6166 }
6167 }
6168
6169 /* Returns the name of the function declared by FNDECL. */
6170 const char *
6171 fndecl_name (tree fndecl)
6172 {
6173 if (fndecl == NULL)
6174 return "(nofn)";
6175 return lang_hooks.decl_printable_name (fndecl, 1);
6176 }
6177
6178 /* Returns the name of function FN. */
6179 const char *
6180 function_name (struct function *fn)
6181 {
6182 tree fndecl = (fn == NULL) ? NULL : fn->decl;
6183 return fndecl_name (fndecl);
6184 }
6185
6186 /* Returns the name of the current function. */
6187 const char *
6188 current_function_name (void)
6189 {
6190 return function_name (cfun);
6191 }
6192 \f
6193
6194 static unsigned int
6195 rest_of_handle_check_leaf_regs (void)
6196 {
6197 #ifdef LEAF_REGISTERS
6198 crtl->uses_only_leaf_regs
6199 = optimize > 0 && only_leaf_regs_used () && leaf_function_p ();
6200 #endif
6201 return 0;
6202 }
6203
6204 /* Insert TYPE into the used-types hash table of FUNC. */
6205
6206 static void
6207 used_types_insert_helper (tree type, struct function *func)
6208 {
6209 if (type != NULL && func != NULL)
6210 {
6211 if (func->used_types_hash == NULL)
6212 func->used_types_hash = hash_set<tree>::create_ggc (37);
6213
6214 func->used_types_hash->add (type);
6215 }
6216 }
6217
6218 /* Given a type T, insert it into the used-types hash table of cfun. */
6219 void
6220 used_types_insert (tree t)
6221 {
6222 while (POINTER_TYPE_P (t) || TREE_CODE (t) == ARRAY_TYPE)
6223 if (TYPE_NAME (t))
6224 break;
6225 else
6226 t = TREE_TYPE (t);
6227 if (TREE_CODE (t) == ERROR_MARK)
6228 return;
6229 if (TYPE_NAME (t) == NULL_TREE
6230 || TYPE_NAME (t) == TYPE_NAME (TYPE_MAIN_VARIANT (t)))
6231 t = TYPE_MAIN_VARIANT (t);
6232 if (debug_info_level > DINFO_LEVEL_NONE)
6233 {
6234 if (cfun)
6235 used_types_insert_helper (t, cfun);
6236 else
6237 {
6238 /* So this might be a type referenced by a global variable.
6239 Record that type so that we can later decide to emit its
6240 debug information. */
6241 vec_safe_push (types_used_by_cur_var_decl, t);
6242 }
6243 }
6244 }
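/* Editorial note (a small worked example of the stripping loop above):
   for a declaration such as

     int **p;

   the two unnamed pointer types are stripped because their TYPE_NAME is
   null, and the named type `int' is what ends up recorded; by contrast,
   a typedef'd pointer, e.g.

     typedef int *intp;
     intp *q;

   stops the walk at `intp', since that pointer type carries a TYPE_NAME
   (the typedef).  */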
6245
6246 /* Helper to hash a struct types_used_by_vars_entry. */
6247
6248 static hashval_t
6249 hash_types_used_by_vars_entry (const struct types_used_by_vars_entry *entry)
6250 {
6251 gcc_assert (entry && entry->var_decl && entry->type);
6252
6253 return iterative_hash_object (entry->type,
6254 iterative_hash_object (entry->var_decl, 0));
6255 }
6256
6257 /* Hash function of the types_used_by_vars_entry hash table. */
6258
6259 hashval_t
6260 used_type_hasher::hash (types_used_by_vars_entry *entry)
6261 {
6262 return hash_types_used_by_vars_entry (entry);
6263 }
6264
6265 /* Equality function of the types_used_by_vars_entry hash table. */
6266
6267 bool
6268 used_type_hasher::equal (types_used_by_vars_entry *e1,
6269 types_used_by_vars_entry *e2)
6270 {
6271 return (e1->var_decl == e2->var_decl && e1->type == e2->type);
6272 }
6273
6274 /* Inserts an entry into the types_used_by_vars_hash hash table. */
6275
6276 void
6277 types_used_by_var_decl_insert (tree type, tree var_decl)
6278 {
6279 if (type != NULL && var_decl != NULL)
6280 {
6281 types_used_by_vars_entry **slot;
6282 struct types_used_by_vars_entry e;
6283 e.var_decl = var_decl;
6284 e.type = type;
6285 if (types_used_by_vars_hash == NULL)
6286 types_used_by_vars_hash
6287 = hash_table<used_type_hasher>::create_ggc (37);
6288
6289 slot = types_used_by_vars_hash->find_slot (&e, INSERT);
6290 if (*slot == NULL)
6291 {
6292 struct types_used_by_vars_entry *entry;
6293 entry = ggc_alloc<types_used_by_vars_entry> ();
6294 entry->type = type;
6295 entry->var_decl = var_decl;
6296 *slot = entry;
6297 }
6298 }
6299 }
6300
6301 namespace {
6302
6303 const pass_data pass_data_leaf_regs =
6304 {
6305 RTL_PASS, /* type */
6306 "*leaf_regs", /* name */
6307 OPTGROUP_NONE, /* optinfo_flags */
6308 TV_NONE, /* tv_id */
6309 0, /* properties_required */
6310 0, /* properties_provided */
6311 0, /* properties_destroyed */
6312 0, /* todo_flags_start */
6313 0, /* todo_flags_finish */
6314 };
6315
6316 class pass_leaf_regs : public rtl_opt_pass
6317 {
6318 public:
6319 pass_leaf_regs (gcc::context *ctxt)
6320 : rtl_opt_pass (pass_data_leaf_regs, ctxt)
6321 {}
6322
6323 /* opt_pass methods: */
6324 virtual unsigned int execute (function *)
6325 {
6326 return rest_of_handle_check_leaf_regs ();
6327 }
6328
6329 }; // class pass_leaf_regs
6330
6331 } // anon namespace
6332
6333 rtl_opt_pass *
6334 make_pass_leaf_regs (gcc::context *ctxt)
6335 {
6336 return new pass_leaf_regs (ctxt);
6337 }
6338
6339 static unsigned int
6340 rest_of_handle_thread_prologue_and_epilogue (void)
6341 {
6342 /* prepare_shrink_wrap is sensitive to the block structure of the control
6343 flow graph, so clean it up first. */
6344 if (optimize)
6345 cleanup_cfg (0);
6346
6347 /* On some machines, the prologue and epilogue code, or parts thereof,
6348 can be represented as RTL. Doing so lets us schedule insns between
6349 it and the rest of the code and also allows delayed branch
6350 scheduling to operate in the epilogue. */
6351 thread_prologue_and_epilogue_insns ();
6352
6353 /* Some non-cold blocks may now be only reachable from cold blocks.
6354 Fix that up. */
6355 fixup_partitions ();
6356
6357 /* Shrink-wrapping can result in unreachable edges in the epilogue,
6358 see PR57320. */
6359 cleanup_cfg (optimize ? CLEANUP_EXPENSIVE : 0);
6360
6361 /* The stack usage info is finalized during prologue expansion. */
6362 if (flag_stack_usage_info)
6363 output_stack_usage ();
6364
6365 return 0;
6366 }
6367
6368 namespace {
6369
6370 const pass_data pass_data_thread_prologue_and_epilogue =
6371 {
6372 RTL_PASS, /* type */
6373 "pro_and_epilogue", /* name */
6374 OPTGROUP_NONE, /* optinfo_flags */
6375 TV_THREAD_PROLOGUE_AND_EPILOGUE, /* tv_id */
6376 0, /* properties_required */
6377 0, /* properties_provided */
6378 0, /* properties_destroyed */
6379 0, /* todo_flags_start */
6380 ( TODO_df_verify | TODO_df_finish ), /* todo_flags_finish */
6381 };
6382
6383 class pass_thread_prologue_and_epilogue : public rtl_opt_pass
6384 {
6385 public:
6386 pass_thread_prologue_and_epilogue (gcc::context *ctxt)
6387 : rtl_opt_pass (pass_data_thread_prologue_and_epilogue, ctxt)
6388 {}
6389
6390 /* opt_pass methods: */
6391 virtual unsigned int execute (function *)
6392 {
6393 return rest_of_handle_thread_prologue_and_epilogue ();
6394 }
6395
6396 }; // class pass_thread_prologue_and_epilogue
6397
6398 } // anon namespace
6399
6400 rtl_opt_pass *
6401 make_pass_thread_prologue_and_epilogue (gcc::context *ctxt)
6402 {
6403 return new pass_thread_prologue_and_epilogue (ctxt);
6404 }
6405 \f
6406
6407 /* If CONSTRAINT is a matching constraint, then return its number.
6408 Otherwise, return -1. */
6409
6410 static int
6411 matching_constraint_num (const char *constraint)
6412 {
6413 if (*constraint == '%')
6414 constraint++;
6415
6416 if (IN_RANGE (*constraint, '0', '9'))
6417 return strtoul (constraint, NULL, 10);
6418
6419 return -1;
6420 }
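/* Editorial note: for example, matching_constraint_num ("0") and
   matching_constraint_num ("%0") both return 0, while non-matching
   constraints such as "r" or "=m" yield -1.  */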
6421
6422 /* This mini-pass fixes fall-out from SSA in asm statements that have
6423 in-out constraints. Say you start with
6424
6425 orig = inout;
6426 asm ("": "+mr" (inout));
6427 use (orig);
6428
6429 which is transformed very early to use explicit output and match operands:
6430
6431 orig = inout;
6432 asm ("": "=mr" (inout) : "0" (inout));
6433 use (orig);
6434
6435 Or, after SSA and copyprop,
6436
6437 asm ("": "=mr" (inout_2) : "0" (inout_1));
6438 use (inout_1);
6439
6440 Clearly inout_2 and inout_1 can't be coalesced easily anymore, as
6441 they represent two separate values, so they will get different pseudo
6442 registers during expansion. Then, since the two operands need to match
6443 per the constraints, but use different pseudo registers, reload can
6444 only register a reload for these operands. But reloads can only be
6445 satisfied by hardregs, not by memory, so we need a register for this
6446 reload, just because we are presented with non-matching operands.
6447 So, even though we allow memory for this operand, no memory can be
6448 used for it, just because the two operands don't match. This can
6449 cause reload failures on register-starved targets.
6450
6451 So it's a symptom of reload not being able to use memory for reloads
6452 or, alternatively, it's also a symptom of both operands not coming into
6453 reload as matching (in which case the pseudo could go to memory just
6454 fine, as the alternative allows it, and no reload would be necessary).
6455 We fix the latter problem here, by transforming
6456
6457 asm ("": "=mr" (inout_2) : "0" (inout_1));
6458
6459 back to
6460
6461 inout_2 = inout_1;
6462 asm ("": "=mr" (inout_2) : "0" (inout_2)); */
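/* Editorial note (a minimal source-level sketch of the situation above;
   the function and variable names are made up):

     int
     foo (int x)
     {
       int orig = x;
       asm ("" : "+mr" (x));
       return orig + x;
     }

   The "+mr" operand is split into an "=mr" output plus a matching "0"
   input early on, and after SSA and copy propagation the two operands
   can end up referring to different pseudos; this pass re-links them by
   emitting the copy described above.  */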
6463
6464 static void
6465 match_asm_constraints_1 (rtx_insn *insn, rtx *p_sets, int noutputs)
6466 {
6467 int i;
6468 bool changed = false;
6469 rtx op = SET_SRC (p_sets[0]);
6470 int ninputs = ASM_OPERANDS_INPUT_LENGTH (op);
6471 rtvec inputs = ASM_OPERANDS_INPUT_VEC (op);
6472 bool *output_matched = XALLOCAVEC (bool, noutputs);
6473
6474 memset (output_matched, 0, noutputs * sizeof (bool));
6475 for (i = 0; i < ninputs; i++)
6476 {
6477 rtx input, output;
6478 rtx_insn *insns;
6479 const char *constraint = ASM_OPERANDS_INPUT_CONSTRAINT (op, i);
6480 int match, j;
6481
6482 match = matching_constraint_num (constraint);
6483 if (match < 0)
6484 continue;
6485
6486 gcc_assert (match < noutputs);
6487 output = SET_DEST (p_sets[match]);
6488 input = RTVEC_ELT (inputs, i);
6489 /* Only do the transformation for pseudos. */
6490 if (! REG_P (output)
6491 || rtx_equal_p (output, input)
6492 || !(REG_P (input) || SUBREG_P (input)
6493 || MEM_P (input) || CONSTANT_P (input))
6494 || !general_operand (input, GET_MODE (output)))
6495 continue;
6496
6497 /* We can't do anything if the output is also used as input,
6498 as we're going to overwrite it. */
6499 for (j = 0; j < ninputs; j++)
6500 if (reg_overlap_mentioned_p (output, RTVEC_ELT (inputs, j)))
6501 break;
6502 if (j != ninputs)
6503 continue;
6504
6505 /* Avoid changing the same input several times. For
6506 asm ("" : "=mr" (out1), "=mr" (out2) : "0" (in), "1" (in));
6507 only change it once (to out1), rather than changing it
6508 first to out1 and afterwards to out2. */
6509 if (i > 0)
6510 {
6511 for (j = 0; j < noutputs; j++)
6512 if (output_matched[j] && input == SET_DEST (p_sets[j]))
6513 break;
6514 if (j != noutputs)
6515 continue;
6516 }
6517 output_matched[match] = true;
6518
6519 start_sequence ();
6520 emit_move_insn (output, copy_rtx (input));
6521 insns = get_insns ();
6522 end_sequence ();
6523 emit_insn_before (insns, insn);
6524
6525 constraint = ASM_OPERANDS_OUTPUT_CONSTRAINT (SET_SRC (p_sets[match]));
6526 bool early_clobber_p = strchr (constraint, '&') != NULL;
6527
6528 /* Now replace all mentions of the input with output. We can't
6529 just replace the occurrence in inputs[i], as the register might
6530 also be used in some other input (or even in an address of an
6531 output), which would mean possibly increasing the number of
6532 inputs by one (namely 'output' in addition), which might pose
6533 too complicated a problem for reload to solve. E.g. this situation:
6534
6535 asm ("" : "=r" (output), "=m" (input) : "0" (input))
6536
6537 Here 'input' is used in two occurrences as input (once for the
6538 input operand, once for the address in the second output operand).
6539 If we would replace only the occurrence of the input operand (to
6540 make the matching) we would be left with this:
6541
6542 output = input
6543 asm ("" : "=r" (output), "=m" (input) : "0" (output))
6544
6545 Now we suddenly have two different input values (containing the same
6546 value, but different pseudos) where we formerly had only one.
6547 With more complicated asms this might lead to reload failures
6548 which wouldn't have happened without this pass. So, iterate over
6549 all operands and replace all occurrences of the register used.
6550
6551 However, if one or more of the 'input' uses have a non-matching
6552 constraint and the matched output operand is an early clobber
6553 operand, then do not replace the input operand, since by definition
6554 it conflicts with the output operand and cannot share the same
6555 register. See PR89313 for details. */
6556
6557 for (j = 0; j < noutputs; j++)
6558 if (!rtx_equal_p (SET_DEST (p_sets[j]), input)
6559 && reg_overlap_mentioned_p (input, SET_DEST (p_sets[j])))
6560 SET_DEST (p_sets[j]) = replace_rtx (SET_DEST (p_sets[j]),
6561 input, output);
6562 for (j = 0; j < ninputs; j++)
6563 if (reg_overlap_mentioned_p (input, RTVEC_ELT (inputs, j)))
6564 {
6565 if (!early_clobber_p
6566 || match == matching_constraint_num
6567 (ASM_OPERANDS_INPUT_CONSTRAINT (op, j)))
6568 RTVEC_ELT (inputs, j) = replace_rtx (RTVEC_ELT (inputs, j),
6569 input, output);
6570 }
6571
6572 changed = true;
6573 }
6574
6575 if (changed)
6576 df_insn_rescan (insn);
6577 }
6578
6579 /* Add the decl D to the local_decls list of FUN. */
6580
6581 void
6582 add_local_decl (struct function *fun, tree d)
6583 {
6584 gcc_assert (VAR_P (d));
6585 vec_safe_push (fun->local_decls, d);
6586 }
6587
6588 namespace {
6589
6590 const pass_data pass_data_match_asm_constraints =
6591 {
6592 RTL_PASS, /* type */
6593 "asmcons", /* name */
6594 OPTGROUP_NONE, /* optinfo_flags */
6595 TV_NONE, /* tv_id */
6596 0, /* properties_required */
6597 0, /* properties_provided */
6598 0, /* properties_destroyed */
6599 0, /* todo_flags_start */
6600 0, /* todo_flags_finish */
6601 };
6602
6603 class pass_match_asm_constraints : public rtl_opt_pass
6604 {
6605 public:
6606 pass_match_asm_constraints (gcc::context *ctxt)
6607 : rtl_opt_pass (pass_data_match_asm_constraints, ctxt)
6608 {}
6609
6610 /* opt_pass methods: */
6611 virtual unsigned int execute (function *);
6612
6613 }; // class pass_match_asm_constraints
6614
6615 unsigned
6616 pass_match_asm_constraints::execute (function *fun)
6617 {
6618 basic_block bb;
6619 rtx_insn *insn;
6620 rtx pat, *p_sets;
6621 int noutputs;
6622
6623 if (!crtl->has_asm_statement)
6624 return 0;
6625
6626 df_set_flags (DF_DEFER_INSN_RESCAN);
6627 FOR_EACH_BB_FN (bb, fun)
6628 {
6629 FOR_BB_INSNS (bb, insn)
6630 {
6631 if (!INSN_P (insn))
6632 continue;
6633
6634 pat = PATTERN (insn);
6635 if (GET_CODE (pat) == PARALLEL)
6636 p_sets = &XVECEXP (pat, 0, 0), noutputs = XVECLEN (pat, 0);
6637 else if (GET_CODE (pat) == SET)
6638 p_sets = &PATTERN (insn), noutputs = 1;
6639 else
6640 continue;
6641
6642 if (GET_CODE (*p_sets) == SET
6643 && GET_CODE (SET_SRC (*p_sets)) == ASM_OPERANDS)
6644 match_asm_constraints_1 (insn, p_sets, noutputs);
6645 }
6646 }
6647
6648 return TODO_df_finish;
6649 }
6650
6651 } // anon namespace
6652
6653 rtl_opt_pass *
6654 make_pass_match_asm_constraints (gcc::context *ctxt)
6655 {
6656 return new pass_match_asm_constraints (ctxt);
6657 }
6658
6659
6660 #include "gt-function.h"