1 /* Output routines for Motorola MCore processor
2 Copyright (C) 1993, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2007, 2008,
3 2009, 2010, 2011 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published
9 by the Free Software Foundation; either version 3, or (at your
10 option) any later version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT
13 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
14 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
15 License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "tm_p.h"
28 #include "mcore.h"
29 #include "regs.h"
30 #include "hard-reg-set.h"
31 #include "insn-config.h"
32 #include "conditions.h"
33 #include "output.h"
34 #include "insn-attr.h"
35 #include "flags.h"
36 #include "obstack.h"
37 #include "expr.h"
38 #include "reload.h"
39 #include "recog.h"
40 #include "function.h"
41 #include "ggc.h"
42 #include "diagnostic-core.h"
43 #include "target.h"
44 #include "target-def.h"
45 #include "df.h"
46
47 /* For dumping information about frame sizes. */
48 char * mcore_current_function_name = 0;
49 long mcore_current_compilation_timestamp = 0;
50
51 /* Global variables for machine-dependent things. */
52
53 /* Provides the class number of the smallest register class containing
54    each hard register number.  */
55 const enum reg_class regno_reg_class[FIRST_PSEUDO_REGISTER] =
56 {
57 GENERAL_REGS, ONLYR1_REGS, LRW_REGS, LRW_REGS,
58 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
59 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
60 LRW_REGS, LRW_REGS, LRW_REGS, GENERAL_REGS,
61 GENERAL_REGS, C_REGS, NO_REGS, NO_REGS,
62 };
63
64 struct mcore_frame
65 {
66 int arg_size; /* Stdarg spills (bytes). */
67 int reg_size; /* Non-volatile reg saves (bytes). */
68 int reg_mask; /* Non-volatile reg saves. */
69 int local_size; /* Locals. */
70 int outbound_size; /* Arg overflow on calls out. */
71 int pad_outbound;
72 int pad_local;
73 int pad_reg;
74   /* Describe the steps we'll use to grow the stack.  */
75 #define MAX_STACK_GROWS 4 /* Gives us some spare space. */
76 int growth[MAX_STACK_GROWS];
77 int arg_offset;
78 int reg_offset;
79 int reg_growth;
80 int local_growth;
81 };
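/* A rough sketch (for orientation only) of the frame layout that the
   prologue code below builds from these fields, with higher addresses
   at the top:

        incoming arg spills / stdarg save area   (arg_size)
        saved non-volatile registers             (reg_size + pad_reg)
        local variables                          (local_size + pad_local)
        outgoing argument overflow               (outbound_size + pad_outbound)  <- sp

   The growth[] array records the individual stack adjustments used to
   allocate these pieces; reg_growth and local_growth say after which
   adjustment the register saves and the locals, respectively, are in
   place.  */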
82
83 typedef enum
84 {
85 COND_NO,
86 COND_MOV_INSN,
87 COND_CLR_INSN,
88 COND_INC_INSN,
89 COND_DEC_INSN,
90 COND_BRANCH_INSN
91 }
92 cond_type;
93
94 static void output_stack_adjust (int, int);
95 static int calc_live_regs (int *);
96 static int try_constant_tricks (long, HOST_WIDE_INT *, HOST_WIDE_INT *);
97 static const char * output_inline_const (enum machine_mode, rtx *);
98 static void layout_mcore_frame (struct mcore_frame *);
99 static void mcore_setup_incoming_varargs (cumulative_args_t, enum machine_mode, tree, int *, int);
100 static cond_type is_cond_candidate (rtx);
101 static rtx emit_new_cond_insn (rtx, int);
102 static rtx conditionalize_block (rtx);
103 static void conditionalize_optimization (void);
104 static void mcore_reorg (void);
105 static rtx handle_structs_in_regs (enum machine_mode, const_tree, int);
106 static void mcore_mark_dllexport (tree);
107 static void mcore_mark_dllimport (tree);
108 static int mcore_dllexport_p (tree);
109 static int mcore_dllimport_p (tree);
110 static tree mcore_handle_naked_attribute (tree *, tree, tree, int, bool *);
111 #ifdef OBJECT_FORMAT_ELF
112 static void mcore_asm_named_section (const char *,
113 unsigned int, tree);
114 #endif
115 static void mcore_print_operand (FILE *, rtx, int);
116 static void mcore_print_operand_address (FILE *, rtx);
117 static bool mcore_print_operand_punct_valid_p (unsigned char code);
118 static void mcore_unique_section (tree, int);
119 static void mcore_encode_section_info (tree, rtx, int);
120 static const char *mcore_strip_name_encoding (const char *);
121 static int mcore_const_costs (rtx, RTX_CODE);
122 static int mcore_and_cost (rtx);
123 static int mcore_ior_cost (rtx);
124 static bool mcore_rtx_costs (rtx, int, int, int *, bool);
125 static void mcore_external_libcall (rtx);
126 static bool mcore_return_in_memory (const_tree, const_tree);
127 static int mcore_arg_partial_bytes (cumulative_args_t,
128 enum machine_mode,
129 tree, bool);
130 static rtx mcore_function_arg (cumulative_args_t,
131 enum machine_mode,
132 const_tree, bool);
133 static void mcore_function_arg_advance (cumulative_args_t,
134 enum machine_mode,
135 const_tree, bool);
136 static unsigned int mcore_function_arg_boundary (enum machine_mode,
137 const_tree);
138 static void mcore_asm_trampoline_template (FILE *);
139 static void mcore_trampoline_init (rtx, tree, rtx);
140 static void mcore_option_override (void);
141 static bool mcore_legitimate_constant_p (enum machine_mode, rtx);
142 \f
143 /* MCore specific attributes. */
144
145 static const struct attribute_spec mcore_attribute_table[] =
146 {
147 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler,
148 affects_type_identity } */
149 { "dllexport", 0, 0, true, false, false, NULL, false },
150 { "dllimport", 0, 0, true, false, false, NULL, false },
151 { "naked", 0, 0, true, false, false, mcore_handle_naked_attribute,
152 false },
153 { NULL, 0, 0, false, false, false, NULL, false }
154 };
155 \f
156 /* Initialize the GCC target structure. */
157 #undef TARGET_ASM_EXTERNAL_LIBCALL
158 #define TARGET_ASM_EXTERNAL_LIBCALL mcore_external_libcall
159
160 #if TARGET_DLLIMPORT_DECL_ATTRIBUTES
161 #undef TARGET_MERGE_DECL_ATTRIBUTES
162 #define TARGET_MERGE_DECL_ATTRIBUTES merge_dllimport_decl_attributes
163 #endif
164
165 #ifdef OBJECT_FORMAT_ELF
166 #undef TARGET_ASM_UNALIGNED_HI_OP
167 #define TARGET_ASM_UNALIGNED_HI_OP "\t.short\t"
168 #undef TARGET_ASM_UNALIGNED_SI_OP
169 #define TARGET_ASM_UNALIGNED_SI_OP "\t.long\t"
170 #endif
171
172 #undef TARGET_PRINT_OPERAND
173 #define TARGET_PRINT_OPERAND mcore_print_operand
174 #undef TARGET_PRINT_OPERAND_ADDRESS
175 #define TARGET_PRINT_OPERAND_ADDRESS mcore_print_operand_address
176 #undef TARGET_PRINT_OPERAND_PUNCT_VALID_P
177 #define TARGET_PRINT_OPERAND_PUNCT_VALID_P mcore_print_operand_punct_valid_p
178
179 #undef TARGET_ATTRIBUTE_TABLE
180 #define TARGET_ATTRIBUTE_TABLE mcore_attribute_table
181 #undef TARGET_ASM_UNIQUE_SECTION
182 #define TARGET_ASM_UNIQUE_SECTION mcore_unique_section
183 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
184 #define TARGET_ASM_FUNCTION_RODATA_SECTION default_no_function_rodata_section
185 #undef TARGET_ENCODE_SECTION_INFO
186 #define TARGET_ENCODE_SECTION_INFO mcore_encode_section_info
187 #undef TARGET_STRIP_NAME_ENCODING
188 #define TARGET_STRIP_NAME_ENCODING mcore_strip_name_encoding
189 #undef TARGET_RTX_COSTS
190 #define TARGET_RTX_COSTS mcore_rtx_costs
191 #undef TARGET_ADDRESS_COST
192 #define TARGET_ADDRESS_COST hook_int_rtx_bool_0
193 #undef TARGET_MACHINE_DEPENDENT_REORG
194 #define TARGET_MACHINE_DEPENDENT_REORG mcore_reorg
195
196 #undef TARGET_PROMOTE_FUNCTION_MODE
197 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
198 #undef TARGET_PROMOTE_PROTOTYPES
199 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
200
201 #undef TARGET_RETURN_IN_MEMORY
202 #define TARGET_RETURN_IN_MEMORY mcore_return_in_memory
203 #undef TARGET_MUST_PASS_IN_STACK
204 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
205 #undef TARGET_PASS_BY_REFERENCE
206 #define TARGET_PASS_BY_REFERENCE hook_pass_by_reference_must_pass_in_stack
207 #undef TARGET_ARG_PARTIAL_BYTES
208 #define TARGET_ARG_PARTIAL_BYTES mcore_arg_partial_bytes
209 #undef TARGET_FUNCTION_ARG
210 #define TARGET_FUNCTION_ARG mcore_function_arg
211 #undef TARGET_FUNCTION_ARG_ADVANCE
212 #define TARGET_FUNCTION_ARG_ADVANCE mcore_function_arg_advance
213 #undef TARGET_FUNCTION_ARG_BOUNDARY
214 #define TARGET_FUNCTION_ARG_BOUNDARY mcore_function_arg_boundary
215
216 #undef TARGET_SETUP_INCOMING_VARARGS
217 #define TARGET_SETUP_INCOMING_VARARGS mcore_setup_incoming_varargs
218
219 #undef TARGET_ASM_TRAMPOLINE_TEMPLATE
220 #define TARGET_ASM_TRAMPOLINE_TEMPLATE mcore_asm_trampoline_template
221 #undef TARGET_TRAMPOLINE_INIT
222 #define TARGET_TRAMPOLINE_INIT mcore_trampoline_init
223
224 #undef TARGET_OPTION_OVERRIDE
225 #define TARGET_OPTION_OVERRIDE mcore_option_override
226
227 #undef TARGET_LEGITIMATE_CONSTANT_P
228 #define TARGET_LEGITIMATE_CONSTANT_P mcore_legitimate_constant_p
229
230 struct gcc_target targetm = TARGET_INITIALIZER;
231 \f
232 /* Adjust the stack by SIZE bytes in DIRECTION: -1 grows the stack, 1 shrinks it.  */
233 static void
234 output_stack_adjust (int direction, int size)
235 {
236 /* If extending stack a lot, we do it incrementally. */
237 if (direction < 0 && size > mcore_stack_increment && mcore_stack_increment > 0)
238 {
239 rtx tmp = gen_rtx_REG (SImode, 1);
240 rtx memref;
241
242 emit_insn (gen_movsi (tmp, GEN_INT (mcore_stack_increment)));
243 do
244 {
245 emit_insn (gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, tmp));
246 memref = gen_rtx_MEM (SImode, stack_pointer_rtx);
247 MEM_VOLATILE_P (memref) = 1;
248 emit_insn (gen_movsi (memref, stack_pointer_rtx));
249 size -= mcore_stack_increment;
250 }
251 while (size > mcore_stack_increment);
252
253 /* SIZE is now the residual for the last adjustment,
254 which doesn't require a probe. */
255 }
256
257 if (size)
258 {
259 rtx insn;
260 rtx val = GEN_INT (size);
261
262 if (size > 32)
263 {
264 rtx nval = gen_rtx_REG (SImode, 1);
265 emit_insn (gen_movsi (nval, val));
266 val = nval;
267 }
268
269 if (direction > 0)
270 insn = gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
271 else
272 insn = gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
273
274 emit_insn (insn);
275 }
276 }
277
278 /* Work out the registers which need to be saved,
279 both as a mask and a count. */
280
281 static int
282 calc_live_regs (int * count)
283 {
284 int reg;
285 int live_regs_mask = 0;
286
287 * count = 0;
288
289 for (reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
290 {
291 if (df_regs_ever_live_p (reg) && !call_used_regs[reg])
292 {
293 (*count)++;
294 live_regs_mask |= (1 << reg);
295 }
296 }
297
298 return live_regs_mask;
299 }
300
301 /* Print the operand address in x to the stream. */
302
303 static void
304 mcore_print_operand_address (FILE * stream, rtx x)
305 {
306 switch (GET_CODE (x))
307 {
308 case REG:
309 fprintf (stream, "(%s)", reg_names[REGNO (x)]);
310 break;
311
312 case PLUS:
313 {
314 rtx base = XEXP (x, 0);
315 rtx index = XEXP (x, 1);
316
317 if (GET_CODE (base) != REG)
318 {
319 /* Ensure that BASE is a register (one of them must be). */
320 rtx temp = base;
321 base = index;
322 index = temp;
323 }
324
325 switch (GET_CODE (index))
326 {
327 case CONST_INT:
328 fprintf (stream, "(%s," HOST_WIDE_INT_PRINT_DEC ")",
329 reg_names[REGNO(base)], INTVAL (index));
330 break;
331
332 default:
333 gcc_unreachable ();
334 }
335 }
336
337 break;
338
339 default:
340 output_addr_const (stream, x);
341 break;
342 }
343 }
344
345 static bool
346 mcore_print_operand_punct_valid_p (unsigned char code)
347 {
348 return (code == '.' || code == '#' || code == '*' || code == '^'
349 || code == '!');
350 }
351
352 /* Print operand x (an rtx) in assembler syntax to file stream
353 according to modifier code.
354
355 'R' print the next register or memory location along, i.e. the lsw in
356 a double word value
357 'O' print a constant without the #
358 'M' print a constant as its negative
359 'P' print log2 of a power of two
360 'Q' print log2 of an inverse of a power of two
361 'U' print register for ldm/stm instruction
362    'X' print byte number for xtrbN instruction
       'N' print the number of low-order bits set in a mask (32 for -1)
       'x' print a constant in hexadecimal.  */
363
364 static void
365 mcore_print_operand (FILE * stream, rtx x, int code)
366 {
367 switch (code)
368 {
369 case 'N':
370 if (INTVAL(x) == -1)
371 fprintf (asm_out_file, "32");
372 else
373 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) + 1));
374 break;
375 case 'P':
376 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) & 0xffffffff));
377 break;
378 case 'Q':
379 fprintf (asm_out_file, "%d", exact_log2 (~INTVAL (x)));
380 break;
381 case 'O':
382 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, INTVAL (x));
383 break;
384 case 'M':
385 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, - INTVAL (x));
386 break;
387 case 'R':
388 /* Next location along in memory or register. */
389 switch (GET_CODE (x))
390 {
391 case REG:
392 fputs (reg_names[REGNO (x) + 1], (stream));
393 break;
394 case MEM:
395 mcore_print_operand_address
396 (stream, XEXP (adjust_address (x, SImode, 4), 0));
397 break;
398 default:
399 gcc_unreachable ();
400 }
401 break;
402 case 'U':
403 fprintf (asm_out_file, "%s-%s", reg_names[REGNO (x)],
404 reg_names[REGNO (x) + 3]);
405 break;
406 case 'x':
407 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_HEX, INTVAL (x));
408 break;
409 case 'X':
410 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, 3 - INTVAL (x) / 8);
411 break;
412
413 default:
414 switch (GET_CODE (x))
415 {
416 case REG:
417 fputs (reg_names[REGNO (x)], (stream));
418 break;
419 case MEM:
420 output_address (XEXP (x, 0));
421 break;
422 default:
423 output_addr_const (stream, x);
424 break;
425 }
426 break;
427 }
428 }
429
430 /* What does a constant cost?  */
431
432 static int
433 mcore_const_costs (rtx exp, enum rtx_code code)
434 {
435 HOST_WIDE_INT val = INTVAL (exp);
436
437 /* Easy constants. */
438 if ( CONST_OK_FOR_I (val)
439 || CONST_OK_FOR_M (val)
440 || CONST_OK_FOR_N (val)
441 || (code == PLUS && CONST_OK_FOR_L (val)))
442 return 1;
443 else if (code == AND
444 && ( CONST_OK_FOR_M (~val)
445 || CONST_OK_FOR_N (~val)))
446 return 2;
447 else if (code == PLUS
448 && ( CONST_OK_FOR_I (-val)
449 || CONST_OK_FOR_M (-val)
450 || CONST_OK_FOR_N (-val)))
451 return 2;
452
453 return 5;
454 }
455
456 /* What does an AND instruction cost?  We do this because immediates may
457    have been relaxed.  We want to ensure that CSE will CSE relaxed immediates
458    out; otherwise we'll get bad code (multiple reloads of the same constant).  */
459
460 static int
461 mcore_and_cost (rtx x)
462 {
463 HOST_WIDE_INT val;
464
465 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
466 return 2;
467
468 val = INTVAL (XEXP (x, 1));
469
470 /* Do it directly. */
471 if (CONST_OK_FOR_K (val) || CONST_OK_FOR_M (~val))
472 return 2;
473 /* Takes one instruction to load. */
474 else if (const_ok_for_mcore (val))
475 return 3;
476 /* Takes two instructions to load. */
477 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
478 return 4;
479
480 /* Takes a lrw to load. */
481 return 5;
482 }
483
484 /* What does an OR instruction cost?  See mcore_and_cost above.  */
485
486 static int
487 mcore_ior_cost (rtx x)
488 {
489 HOST_WIDE_INT val;
490
491 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
492 return 2;
493
494 val = INTVAL (XEXP (x, 1));
495
496   /* Do it directly with bseti.  */
497 if (CONST_OK_FOR_M (val))
498 return 2;
499 /* Takes one instruction to load. */
500 else if (const_ok_for_mcore (val))
501 return 3;
502 /* Takes two instructions to load. */
503 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
504 return 4;
505
506 /* Takes a lrw to load. */
507 return 5;
508 }
509
510 static bool
511 mcore_rtx_costs (rtx x, int code, int outer_code, int * total,
512 bool speed ATTRIBUTE_UNUSED)
513 {
514 switch (code)
515 {
516 case CONST_INT:
517 *total = mcore_const_costs (x, (enum rtx_code) outer_code);
518 return true;
519 case CONST:
520 case LABEL_REF:
521 case SYMBOL_REF:
522 *total = 5;
523 return true;
524 case CONST_DOUBLE:
525 *total = 10;
526 return true;
527
528 case AND:
529 *total = COSTS_N_INSNS (mcore_and_cost (x));
530 return true;
531
532 case IOR:
533 *total = COSTS_N_INSNS (mcore_ior_cost (x));
534 return true;
535
536 case DIV:
537 case UDIV:
538 case MOD:
539 case UMOD:
540 case FLOAT:
541 case FIX:
542 *total = COSTS_N_INSNS (100);
543 return true;
544
545 default:
546 return false;
547 }
548 }
549
550 /* Prepare the operands for a comparison.  Return true if the branch/setcc
551    should use the inverted condition.  */
552
553 bool
554 mcore_gen_compare (enum rtx_code code, rtx op0, rtx op1)
555 {
556 rtx cc_reg = gen_rtx_REG (CCmode, CC_REG);
557 bool invert;
558
559 if (GET_CODE (op1) == CONST_INT)
560 {
561 HOST_WIDE_INT val = INTVAL (op1);
562
563 switch (code)
564 {
565 case GTU:
566 /* Unsigned > 0 is the same as != 0; everything else is converted
567 below to LEU (reversed cmphs). */
568 if (val == 0)
569 code = NE;
570 break;
571
572 /* Check whether (LE A imm) can become (LT A imm + 1),
573 or (GT A imm) can become (GE A imm + 1). */
574 case GT:
575 case LE:
576 if (CONST_OK_FOR_J (val + 1))
577 {
578 op1 = GEN_INT (val + 1);
579 code = code == LE ? LT : GE;
580 }
581 break;
582
583 default:
584 break;
585 }
586 }
587
588 if (CONSTANT_P (op1) && GET_CODE (op1) != CONST_INT)
589 op1 = force_reg (SImode, op1);
590
591 /* cmpnei: 0-31 (K immediate)
592 cmplti: 1-32 (J immediate, 0 using btsti x,31). */
593 invert = false;
594 switch (code)
595 {
596 case EQ: /* Use inverted condition, cmpne. */
597 code = NE;
598 invert = true;
599 /* Drop through. */
600
601 case NE: /* Use normal condition, cmpne. */
602 if (GET_CODE (op1) == CONST_INT && ! CONST_OK_FOR_K (INTVAL (op1)))
603 op1 = force_reg (SImode, op1);
604 break;
605
606 case LE: /* Use inverted condition, reversed cmplt. */
607 code = GT;
608 invert = true;
609 /* Drop through. */
610
611 case GT: /* Use normal condition, reversed cmplt. */
612 if (GET_CODE (op1) == CONST_INT)
613 op1 = force_reg (SImode, op1);
614 break;
615
616 case GE: /* Use inverted condition, cmplt. */
617 code = LT;
618 invert = true;
619 /* Drop through. */
620
621 case LT: /* Use normal condition, cmplt. */
622 if (GET_CODE (op1) == CONST_INT &&
623 /* covered by btsti x,31. */
624 INTVAL (op1) != 0 &&
625 ! CONST_OK_FOR_J (INTVAL (op1)))
626 op1 = force_reg (SImode, op1);
627 break;
628
629 case GTU: /* Use inverted condition, cmple. */
630 /* We coped with unsigned > 0 above. */
631 gcc_assert (GET_CODE (op1) != CONST_INT || INTVAL (op1) != 0);
632 code = LEU;
633 invert = true;
634 /* Drop through. */
635
636 case LEU: /* Use normal condition, reversed cmphs. */
637 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
638 op1 = force_reg (SImode, op1);
639 break;
640
641 case LTU: /* Use inverted condition, cmphs. */
642 code = GEU;
643 invert = true;
644 /* Drop through. */
645
646 case GEU: /* Use normal condition, cmphs. */
647 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
648 op1 = force_reg (SImode, op1);
649 break;
650
651 default:
652 break;
653 }
654
655 emit_insn (gen_rtx_SET (VOIDmode,
656 cc_reg,
657 gen_rtx_fmt_ee (code, CCmode, op0, op1)));
658 return invert;
659 }
660
661 int
662 mcore_symbolic_address_p (rtx x)
663 {
664 switch (GET_CODE (x))
665 {
666 case SYMBOL_REF:
667 case LABEL_REF:
668 return 1;
669 case CONST:
670 x = XEXP (x, 0);
671 return ( (GET_CODE (XEXP (x, 0)) == SYMBOL_REF
672 || GET_CODE (XEXP (x, 0)) == LABEL_REF)
673 && GET_CODE (XEXP (x, 1)) == CONST_INT);
674 default:
675 return 0;
676 }
677 }
678
679 /* Functions to output assembly code for a function call. */
680
681 char *
682 mcore_output_call (rtx operands[], int index)
683 {
684 static char buffer[20];
685 rtx addr = operands [index];
686
687 if (REG_P (addr))
688 {
689 if (TARGET_CG_DATA)
690 {
691 gcc_assert (mcore_current_function_name);
692
693 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
694 "unknown", 1);
695 }
696
697 sprintf (buffer, "jsr\t%%%d", index);
698 }
699 else
700 {
701 if (TARGET_CG_DATA)
702 {
703 gcc_assert (mcore_current_function_name);
704 gcc_assert (GET_CODE (addr) == SYMBOL_REF);
705
706 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
707 XSTR (addr, 0), 0);
708 }
709
710 sprintf (buffer, "jbsr\t%%%d", index);
711 }
712
713 return buffer;
714 }
715
716 /* Can we load a constant with a single instruction?  */
717
718 int
719 const_ok_for_mcore (HOST_WIDE_INT value)
720 {
721 if (value >= 0 && value <= 127)
722 return 1;
723
724 /* Try exact power of two. */
725 if (CONST_OK_FOR_M (value))
726 return 1;
727
728 /* Try exact power of two - 1. */
729 if (CONST_OK_FOR_N (value) && value != -1)
730 return 1;
731
732 return 0;
733 }
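/* For example (illustrative values only): 100 fits the movi range,
   0x100 is an exact power of two (loadable with bgeni), and 0xff is a
   power of two minus one (loadable with bmaski), so all three are
   single-instruction constants; 132 is none of these and is not.  */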
734
735 /* Can we load a constant inline with up to 2 instructions?  */
736
737 int
738 mcore_const_ok_for_inline (HOST_WIDE_INT value)
739 {
740 HOST_WIDE_INT x, y;
741
742 return try_constant_tricks (value, & x, & y) > 0;
743 }
744
745 /* Are we loading the constant using a not?  */
746
747 int
748 mcore_const_trick_uses_not (HOST_WIDE_INT value)
749 {
750 HOST_WIDE_INT x, y;
751
752 return try_constant_tricks (value, & x, & y) == 2;
753 }
754
755 /* Try tricks to load a constant inline and return the trick number on
756    success (0 means it is not inlinable).
757
758 0: not inlinable
759 1: single instruction (do the usual thing)
760 2: single insn followed by a 'not'
761    3: single insn followed by an addi
762    4: single insn followed by a subi
763 5: single insn followed by rsubi
764 6: single insn followed by bseti
765 7: single insn followed by bclri
766 8: single insn followed by rotli
767 9: single insn followed by lsli
768 10: single insn followed by ixh
769 11: single insn followed by ixw. */
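/* Two illustrative cases (values chosen for this comment only):
   loading -128 uses trick 2, since ~(-128) == 127 is loadable:
        movi    rd,127
        not     rd
   while loading 132 uses trick 3, since 132 - 5 == 127 is loadable:
        movi    rd,127
        addi    rd,5
   Anything this routine cannot handle (return 0) is left to the caller,
   which falls back to an lrw from the literal pool.  */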
770
771 static int
772 try_constant_tricks (HOST_WIDE_INT value, HOST_WIDE_INT * x, HOST_WIDE_INT * y)
773 {
774 HOST_WIDE_INT i;
775 unsigned HOST_WIDE_INT bit, shf, rot;
776
777 if (const_ok_for_mcore (value))
778 return 1; /* Do the usual thing. */
779
780 if (! TARGET_HARDLIT)
781 return 0;
782
783 if (const_ok_for_mcore (~value))
784 {
785 *x = ~value;
786 return 2;
787 }
788
789 for (i = 1; i <= 32; i++)
790 {
791 if (const_ok_for_mcore (value - i))
792 {
793 *x = value - i;
794 *y = i;
795
796 return 3;
797 }
798
799 if (const_ok_for_mcore (value + i))
800 {
801 *x = value + i;
802 *y = i;
803
804 return 4;
805 }
806 }
807
808 bit = 0x80000000ULL;
809
810 for (i = 0; i <= 31; i++)
811 {
812 if (const_ok_for_mcore (i - value))
813 {
814 *x = i - value;
815 *y = i;
816
817 return 5;
818 }
819
820 if (const_ok_for_mcore (value & ~bit))
821 {
822 *y = bit;
823 *x = value & ~bit;
824 return 6;
825 }
826
827 if (const_ok_for_mcore (value | bit))
828 {
829 *y = ~bit;
830 *x = value | bit;
831
832 return 7;
833 }
834
835 bit >>= 1;
836 }
837
838 shf = value;
839 rot = value;
840
841 for (i = 1; i < 31; i++)
842 {
843 int c;
844
845 /* MCore has rotate left. */
846 c = rot << 31;
847 rot >>= 1;
848 rot &= 0x7FFFFFFF;
849 rot |= c; /* Simulate rotate. */
850
851 if (const_ok_for_mcore (rot))
852 {
853 *y = i;
854 *x = rot;
855
856 return 8;
857 }
858
859 if (shf & 1)
860 shf = 0; /* Can't use logical shift, low order bit is one. */
861
862 shf >>= 1;
863
864 if (shf != 0 && const_ok_for_mcore (shf))
865 {
866 *y = i;
867 *x = shf;
868
869 return 9;
870 }
871 }
872
873 if ((value % 3) == 0 && const_ok_for_mcore (value / 3))
874 {
875 *x = value / 3;
876
877 return 10;
878 }
879
880 if ((value % 5) == 0 && const_ok_for_mcore (value / 5))
881 {
882 *x = value / 5;
883
884 return 11;
885 }
886
887 return 0;
888 }
889
890 /* Check whether reg is dead at first. This is done by searching ahead
891 for either the next use (i.e., reg is live), a death note, or a set of
892 reg. Don't just use dead_or_set_p() since reload does not always mark
893 deaths (especially if PRESERVE_DEATH_NOTES_REGNO_P is not defined). We
894 can ignore subregs by extracting the actual register. BRC */
895
896 int
897 mcore_is_dead (rtx first, rtx reg)
898 {
899 rtx insn;
900
901 /* For mcore, subregs can't live independently of their parent regs. */
902 if (GET_CODE (reg) == SUBREG)
903 reg = SUBREG_REG (reg);
904
905 /* Dies immediately. */
906 if (dead_or_set_p (first, reg))
907 return 1;
908
909 /* Look for conclusive evidence of live/death, otherwise we have
910 to assume that it is live. */
911 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
912 {
913 if (GET_CODE (insn) == JUMP_INSN)
914 return 0; /* We lose track, assume it is alive. */
915
916 else if (GET_CODE(insn) == CALL_INSN)
917 {
918          /* Calls might use it for the target or for register parms.  */
919 if (reg_referenced_p (reg, PATTERN (insn))
920 || find_reg_fusage (insn, USE, reg))
921 return 0;
922 else if (dead_or_set_p (insn, reg))
923 return 1;
924 }
925 else if (GET_CODE (insn) == INSN)
926 {
927 if (reg_referenced_p (reg, PATTERN (insn)))
928 return 0;
929 else if (dead_or_set_p (insn, reg))
930 return 1;
931 }
932 }
933
934 /* No conclusive evidence either way, we cannot take the chance
935 that control flow hid the use from us -- "I'm not dead yet". */
936 return 0;
937 }
938
939 /* Count the number of ones in mask. */
940
941 int
942 mcore_num_ones (HOST_WIDE_INT mask)
943 {
944 /* A trick to count set bits recently posted on comp.compilers. */
945 mask = (mask >> 1 & 0x55555555) + (mask & 0x55555555);
946 mask = ((mask >> 2) & 0x33333333) + (mask & 0x33333333);
947 mask = ((mask >> 4) + mask) & 0x0f0f0f0f;
948 mask = ((mask >> 8) + mask);
949
950 return (mask + (mask >> 16)) & 0xff;
951 }
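/* For example, mcore_num_ones (0xff00) is 8, and mcore_num_ones (-1),
   i.e. all 32 bits set, is 32; mcore_num_zeros below is simply 32 minus
   that count.  */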
952
953 /* Count the number of zeros in mask. */
954
955 int
956 mcore_num_zeros (HOST_WIDE_INT mask)
957 {
958 return 32 - mcore_num_ones (mask);
959 }
960
961 /* Determine byte being masked. */
962
963 int
964 mcore_byte_offset (unsigned int mask)
965 {
966 if (mask == 0x00ffffffL)
967 return 0;
968 else if (mask == 0xff00ffffL)
969 return 1;
970 else if (mask == 0xffff00ffL)
971 return 2;
972 else if (mask == 0xffffff00L)
973 return 3;
974
975 return -1;
976 }
977
978 /* Determine halfword being masked. */
979
980 int
981 mcore_halfword_offset (unsigned int mask)
982 {
983 if (mask == 0x0000ffffL)
984 return 0;
985 else if (mask == 0xffff0000L)
986 return 1;
987
988 return -1;
989 }
990
991 /* Output a series of bseti's corresponding to mask. */
992
993 const char *
994 mcore_output_bseti (rtx dst, int mask)
995 {
996 rtx out_operands[2];
997 int bit;
998
999 out_operands[0] = dst;
1000
1001 for (bit = 0; bit < 32; bit++)
1002 {
1003 if ((mask & 0x1) == 0x1)
1004 {
1005 out_operands[1] = GEN_INT (bit);
1006
1007 output_asm_insn ("bseti\t%0,%1", out_operands);
1008 }
1009 mask >>= 1;
1010 }
1011
1012 return "";
1013 }
1014
1015 /* Output a series of bclri's corresponding to mask. */
1016
1017 const char *
1018 mcore_output_bclri (rtx dst, int mask)
1019 {
1020 rtx out_operands[2];
1021 int bit;
1022
1023 out_operands[0] = dst;
1024
1025 for (bit = 0; bit < 32; bit++)
1026 {
1027 if ((mask & 0x1) == 0x0)
1028 {
1029 out_operands[1] = GEN_INT (bit);
1030
1031 output_asm_insn ("bclri\t%0,%1", out_operands);
1032 }
1033
1034 mask >>= 1;
1035 }
1036
1037 return "";
1038 }
1039
1040 /* Output a conditional move of two constants that are within +/- 1 of each
1041    other.  See the "movtK" patterns in mcore.md.  I'm not sure this is
1042 really worth the effort. */
1043
1044 const char *
1045 mcore_output_cmov (rtx operands[], int cmp_t, const char * test)
1046 {
1047 HOST_WIDE_INT load_value;
1048 HOST_WIDE_INT adjust_value;
1049 rtx out_operands[4];
1050
1051 out_operands[0] = operands[0];
1052
1053 /* Check to see which constant is loadable. */
1054 if (const_ok_for_mcore (INTVAL (operands[1])))
1055 {
1056 out_operands[1] = operands[1];
1057 out_operands[2] = operands[2];
1058 }
1059 else if (const_ok_for_mcore (INTVAL (operands[2])))
1060 {
1061 out_operands[1] = operands[2];
1062 out_operands[2] = operands[1];
1063
1064 /* Complement test since constants are swapped. */
1065 cmp_t = (cmp_t == 0);
1066 }
1067 load_value = INTVAL (out_operands[1]);
1068 adjust_value = INTVAL (out_operands[2]);
1069
1070 /* First output the test if folded into the pattern. */
1071
1072 if (test)
1073 output_asm_insn (test, operands);
1074
1075 /* Load the constant - for now, only support constants that can be
1076      generated with a single instruction.  Maybe add general inlinable
1077 constants later (this will increase the # of patterns since the
1078 instruction sequence has a different length attribute). */
1079 if (load_value >= 0 && load_value <= 127)
1080 output_asm_insn ("movi\t%0,%1", out_operands);
1081 else if (CONST_OK_FOR_M (load_value))
1082 output_asm_insn ("bgeni\t%0,%P1", out_operands);
1083 else if (CONST_OK_FOR_N (load_value))
1084 output_asm_insn ("bmaski\t%0,%N1", out_operands);
1085
1086 /* Output the constant adjustment. */
1087 if (load_value > adjust_value)
1088 {
1089 if (cmp_t)
1090 output_asm_insn ("decf\t%0", out_operands);
1091 else
1092 output_asm_insn ("dect\t%0", out_operands);
1093 }
1094 else
1095 {
1096 if (cmp_t)
1097 output_asm_insn ("incf\t%0", out_operands);
1098 else
1099 output_asm_insn ("inct\t%0", out_operands);
1100 }
1101
1102 return "";
1103 }
1104
1105 /* Outputs the peephole for moving a constant that gets not'ed followed
1106 by an and (i.e. combine the not and the and into andn). BRC */
1107
1108 const char *
1109 mcore_output_andn (rtx insn ATTRIBUTE_UNUSED, rtx operands[])
1110 {
1111 HOST_WIDE_INT x, y;
1112 rtx out_operands[3];
1113 const char * load_op;
1114 char buf[256];
1115 int trick_no;
1116
1117 trick_no = try_constant_tricks (INTVAL (operands[1]), &x, &y);
1118 gcc_assert (trick_no == 2);
1119
1120 out_operands[0] = operands[0];
1121 out_operands[1] = GEN_INT (x);
1122 out_operands[2] = operands[2];
1123
1124 if (x >= 0 && x <= 127)
1125 load_op = "movi\t%0,%1";
1126
1127 /* Try exact power of two. */
1128 else if (CONST_OK_FOR_M (x))
1129 load_op = "bgeni\t%0,%P1";
1130
1131 /* Try exact power of two - 1. */
1132 else if (CONST_OK_FOR_N (x))
1133 load_op = "bmaski\t%0,%N1";
1134
1135 else
1136 {
1137 load_op = "BADMOVI-andn\t%0, %1";
1138 gcc_unreachable ();
1139 }
1140
1141 sprintf (buf, "%s\n\tandn\t%%2,%%0", load_op);
1142 output_asm_insn (buf, out_operands);
1143
1144 return "";
1145 }
1146
1147 /* Output an inline constant. */
1148
1149 static const char *
1150 output_inline_const (enum machine_mode mode, rtx operands[])
1151 {
1152 HOST_WIDE_INT x = 0, y = 0;
1153 int trick_no;
1154 rtx out_operands[3];
1155 char buf[256];
1156 char load_op[256];
1157 const char *dst_fmt;
1158 HOST_WIDE_INT value;
1159
1160 value = INTVAL (operands[1]);
1161
1162 trick_no = try_constant_tricks (value, &x, &y);
1163 /* lrw's are handled separately: Large inlinable constants never get
1164 turned into lrw's. Our caller uses try_constant_tricks to back
1165 off to an lrw rather than calling this routine. */
1166 gcc_assert (trick_no != 0);
1167
1168 if (trick_no == 1)
1169 x = value;
1170
1171 /* operands: 0 = dst, 1 = load immed., 2 = immed. adjustment. */
1172 out_operands[0] = operands[0];
1173 out_operands[1] = GEN_INT (x);
1174
1175 if (trick_no > 2)
1176 out_operands[2] = GEN_INT (y);
1177
1178 /* Select dst format based on mode. */
1179 if (mode == DImode && (! TARGET_LITTLE_END))
1180 dst_fmt = "%R0";
1181 else
1182 dst_fmt = "%0";
1183
1184 if (x >= 0 && x <= 127)
1185 sprintf (load_op, "movi\t%s,%%1", dst_fmt);
1186
1187 /* Try exact power of two. */
1188 else if (CONST_OK_FOR_M (x))
1189 sprintf (load_op, "bgeni\t%s,%%P1", dst_fmt);
1190
1191 /* Try exact power of two - 1. */
1192 else if (CONST_OK_FOR_N (x))
1193 sprintf (load_op, "bmaski\t%s,%%N1", dst_fmt);
1194
1195 else
1196 {
1197 sprintf (load_op, "BADMOVI-inline_const %s, %%1", dst_fmt);
1198 gcc_unreachable ();
1199 }
1200
1201 switch (trick_no)
1202 {
1203 case 1:
1204 strcpy (buf, load_op);
1205 break;
1206 case 2: /* not */
1207 sprintf (buf, "%s\n\tnot\t%s\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1208 break;
1209 case 3: /* add */
1210 sprintf (buf, "%s\n\taddi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1211 break;
1212 case 4: /* sub */
1213 sprintf (buf, "%s\n\tsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1214 break;
1215 case 5: /* rsub */
1216 /* Never happens unless -mrsubi, see try_constant_tricks(). */
1217 sprintf (buf, "%s\n\trsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1218 break;
1219 case 6: /* bseti */
1220 sprintf (buf, "%s\n\tbseti\t%s,%%P2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1221 break;
1222 case 7: /* bclr */
1223 sprintf (buf, "%s\n\tbclri\t%s,%%Q2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1224 break;
1225 case 8: /* rotl */
1226 sprintf (buf, "%s\n\trotli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1227 break;
1228 case 9: /* lsl */
1229 sprintf (buf, "%s\n\tlsli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1230 break;
1231 case 10: /* ixh */
1232 sprintf (buf, "%s\n\tixh\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1233 break;
1234 case 11: /* ixw */
1235 sprintf (buf, "%s\n\tixw\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1236 break;
1237 default:
1238 return "";
1239 }
1240
1241 output_asm_insn (buf, out_operands);
1242
1243 return "";
1244 }
1245
1246 /* Output a move of a value that is one word or smaller.  */
1247
1248 const char *
1249 mcore_output_move (rtx insn ATTRIBUTE_UNUSED, rtx operands[],
1250 enum machine_mode mode ATTRIBUTE_UNUSED)
1251 {
1252 rtx dst = operands[0];
1253 rtx src = operands[1];
1254
1255 if (GET_CODE (dst) == REG)
1256 {
1257 if (GET_CODE (src) == REG)
1258 {
1259 if (REGNO (src) == CC_REG) /* r-c */
1260 return "mvc\t%0";
1261 else
1262 return "mov\t%0,%1"; /* r-r*/
1263 }
1264 else if (GET_CODE (src) == MEM)
1265 {
1266 if (GET_CODE (XEXP (src, 0)) == LABEL_REF)
1267 return "lrw\t%0,[%1]"; /* a-R */
1268 else
1269 switch (GET_MODE (src)) /* r-m */
1270 {
1271 case SImode:
1272 return "ldw\t%0,%1";
1273 case HImode:
1274 return "ld.h\t%0,%1";
1275 case QImode:
1276 return "ld.b\t%0,%1";
1277 default:
1278 gcc_unreachable ();
1279 }
1280 }
1281 else if (GET_CODE (src) == CONST_INT)
1282 {
1283 HOST_WIDE_INT x, y;
1284
1285 if (CONST_OK_FOR_I (INTVAL (src))) /* r-I */
1286 return "movi\t%0,%1";
1287 else if (CONST_OK_FOR_M (INTVAL (src))) /* r-M */
1288 return "bgeni\t%0,%P1\t// %1 %x1";
1289 else if (CONST_OK_FOR_N (INTVAL (src))) /* r-N */
1290 return "bmaski\t%0,%N1\t// %1 %x1";
1291 else if (try_constant_tricks (INTVAL (src), &x, &y)) /* R-P */
1292 return output_inline_const (SImode, operands); /* 1-2 insns */
1293 else
1294 return "lrw\t%0,%x1\t// %1"; /* Get it from literal pool. */
1295 }
1296 else
1297 return "lrw\t%0, %1"; /* Into the literal pool. */
1298 }
1299 else if (GET_CODE (dst) == MEM) /* m-r */
1300 switch (GET_MODE (dst))
1301 {
1302 case SImode:
1303 return "stw\t%1,%0";
1304 case HImode:
1305 return "st.h\t%1,%0";
1306 case QImode:
1307 return "st.b\t%1,%0";
1308 default:
1309 gcc_unreachable ();
1310 }
1311
1312 gcc_unreachable ();
1313 }
1314
1315 /* Return a sequence of instructions to perform DI or DF move.
1316 Since the MCORE cannot move a DI or DF in one instruction, we have
1317 to take care when we see overlapping source and dest registers. */
1318
1319 const char *
1320 mcore_output_movedouble (rtx operands[], enum machine_mode mode ATTRIBUTE_UNUSED)
1321 {
1322 rtx dst = operands[0];
1323 rtx src = operands[1];
1324
1325 if (GET_CODE (dst) == REG)
1326 {
1327 if (GET_CODE (src) == REG)
1328 {
1329 int dstreg = REGNO (dst);
1330 int srcreg = REGNO (src);
1331
1332          /* Ensure the second source is not overwritten.  */
1333 if (srcreg + 1 == dstreg)
1334 return "mov %R0,%R1\n\tmov %0,%1";
1335 else
1336 return "mov %0,%1\n\tmov %R0,%R1";
1337 }
1338 else if (GET_CODE (src) == MEM)
1339 {
1340          rtx memexp = XEXP (src, 0);
1341 int dstreg = REGNO (dst);
1342 int basereg = -1;
1343
1344 if (GET_CODE (memexp) == LABEL_REF)
1345 return "lrw\t%0,[%1]\n\tlrw\t%R0,[%R1]";
1346 else if (GET_CODE (memexp) == REG)
1347 basereg = REGNO (memexp);
1348 else if (GET_CODE (memexp) == PLUS)
1349 {
1350 if (GET_CODE (XEXP (memexp, 0)) == REG)
1351 basereg = REGNO (XEXP (memexp, 0));
1352 else if (GET_CODE (XEXP (memexp, 1)) == REG)
1353 basereg = REGNO (XEXP (memexp, 1));
1354 else
1355 gcc_unreachable ();
1356 }
1357 else
1358 gcc_unreachable ();
1359
1360 /* ??? length attribute is wrong here. */
1361 if (dstreg == basereg)
1362 {
1363 /* Just load them in reverse order. */
1364 return "ldw\t%R0,%R1\n\tldw\t%0,%1";
1365
1366 /* XXX: alternative: move basereg to basereg+1
1367 and then fall through. */
1368 }
1369 else
1370 return "ldw\t%0,%1\n\tldw\t%R0,%R1";
1371 }
1372 else if (GET_CODE (src) == CONST_INT)
1373 {
1374 if (TARGET_LITTLE_END)
1375 {
1376 if (CONST_OK_FOR_I (INTVAL (src)))
1377 output_asm_insn ("movi %0,%1", operands);
1378 else if (CONST_OK_FOR_M (INTVAL (src)))
1379 output_asm_insn ("bgeni %0,%P1", operands);
1380 else if (CONST_OK_FOR_N (INTVAL (src)))
1381 output_asm_insn ("bmaski %0,%N1", operands);
1382 else
1383 gcc_unreachable ();
1384
1385 if (INTVAL (src) < 0)
1386 return "bmaski %R0,32";
1387 else
1388 return "movi %R0,0";
1389 }
1390 else
1391 {
1392 if (CONST_OK_FOR_I (INTVAL (src)))
1393 output_asm_insn ("movi %R0,%1", operands);
1394 else if (CONST_OK_FOR_M (INTVAL (src)))
1395 output_asm_insn ("bgeni %R0,%P1", operands);
1396 else if (CONST_OK_FOR_N (INTVAL (src)))
1397 output_asm_insn ("bmaski %R0,%N1", operands);
1398 else
1399 gcc_unreachable ();
1400
1401 if (INTVAL (src) < 0)
1402 return "bmaski %0,32";
1403 else
1404 return "movi %0,0";
1405 }
1406 }
1407 else
1408 gcc_unreachable ();
1409 }
1410 else if (GET_CODE (dst) == MEM && GET_CODE (src) == REG)
1411 return "stw\t%1,%0\n\tstw\t%R1,%R0";
1412 else
1413 gcc_unreachable ();
1414 }
1415
1416 /* Predicates used by the templates. */
1417
1418 int
1419 mcore_arith_S_operand (rtx op)
1420 {
1421 if (GET_CODE (op) == CONST_INT && CONST_OK_FOR_M (~INTVAL (op)))
1422 return 1;
1423
1424 return 0;
1425 }
1426
1427 /* Expand insert bit field. BRC */
1428
1429 int
1430 mcore_expand_insv (rtx operands[])
1431 {
1432 int width = INTVAL (operands[1]);
1433 int posn = INTVAL (operands[2]);
1434 int mask;
1435 rtx mreg, sreg, ereg;
1436
1437 /* To get width 1 insv, the test in store_bit_field() (expmed.c, line 191)
1438 for width==1 must be removed. Look around line 368. This is something
1439 we really want the md part to do. */
1440 if (width == 1 && GET_CODE (operands[3]) == CONST_INT)
1441 {
1442 /* Do directly with bseti or bclri. */
1443 /* RBE: 2/97 consider only low bit of constant. */
1444 if ((INTVAL (operands[3]) & 1) == 0)
1445 {
1446 mask = ~(1 << posn);
1447 emit_insn (gen_rtx_SET (SImode, operands[0],
1448 gen_rtx_AND (SImode, operands[0], GEN_INT (mask))));
1449 }
1450 else
1451 {
1452 mask = 1 << posn;
1453 emit_insn (gen_rtx_SET (SImode, operands[0],
1454 gen_rtx_IOR (SImode, operands[0], GEN_INT (mask))));
1455 }
1456
1457 return 1;
1458 }
1459
1460 /* Look at some bit-field placements that we aren't interested
1461 in handling ourselves, unless specifically directed to do so. */
1462 if (! TARGET_W_FIELD)
1463 return 0; /* Generally, give up about now. */
1464
1465 if (width == 8 && posn % 8 == 0)
1466 /* Byte sized and aligned; let caller break it up. */
1467 return 0;
1468
1469 if (width == 16 && posn % 16 == 0)
1470 /* Short sized and aligned; let caller break it up. */
1471 return 0;
1472
1473 /* The general case - we can do this a little bit better than what the
1474 machine independent part tries. This will get rid of all the subregs
1475 that mess up constant folding in combine when working with relaxed
1476 immediates. */
1477
1478 /* If setting the entire field, do it directly. */
1479 if (GET_CODE (operands[3]) == CONST_INT
1480 && INTVAL (operands[3]) == ((1 << width) - 1))
1481 {
1482 mreg = force_reg (SImode, GEN_INT (INTVAL (operands[3]) << posn));
1483 emit_insn (gen_rtx_SET (SImode, operands[0],
1484 gen_rtx_IOR (SImode, operands[0], mreg)));
1485 return 1;
1486 }
1487
1488 /* Generate the clear mask. */
1489 mreg = force_reg (SImode, GEN_INT (~(((1 << width) - 1) << posn)));
1490
1491 /* Clear the field, to overlay it later with the source. */
1492 emit_insn (gen_rtx_SET (SImode, operands[0],
1493 gen_rtx_AND (SImode, operands[0], mreg)));
1494
1495 /* If the source is constant 0, we've nothing to add back. */
1496 if (GET_CODE (operands[3]) == CONST_INT && INTVAL (operands[3]) == 0)
1497 return 1;
1498
1499 /* XXX: Should we worry about more games with constant values?
1500 We've covered the high profile: set/clear single-bit and many-bit
1501 fields. How often do we see "arbitrary bit pattern" constants? */
1502 sreg = copy_to_mode_reg (SImode, operands[3]);
1503
1504 /* Extract src as same width as dst (needed for signed values). We
1505 always have to do this since we widen everything to SImode.
1506 We don't have to mask if we're shifting this up against the
1507      MSB of the register (i.e., the shift will push out any hi-order
1508      bits).  */
1509   if (width + posn != (int) GET_MODE_BITSIZE (SImode))
1510 {
1511 ereg = force_reg (SImode, GEN_INT ((1 << width) - 1));
1512 emit_insn (gen_rtx_SET (SImode, sreg,
1513 gen_rtx_AND (SImode, sreg, ereg)));
1514 }
1515
1516 /* Insert source value in dest. */
1517 if (posn != 0)
1518 emit_insn (gen_rtx_SET (SImode, sreg,
1519 gen_rtx_ASHIFT (SImode, sreg, GEN_INT (posn))));
1520
1521 emit_insn (gen_rtx_SET (SImode, operands[0],
1522 gen_rtx_IOR (SImode, operands[0], sreg)));
1523
1524 return 1;
1525 }
1526 \f
1527 /* ??? Block move stuff stolen from m88k. This code has not been
1528 verified for correctness. */
1529
1530 /* Emit code to perform a block move. Choose the best method.
1531
1532 OPERANDS[0] is the destination.
1533 OPERANDS[1] is the source.
1534 OPERANDS[2] is the size.
1535 OPERANDS[3] is the alignment safe to use. */
1536
1537 /* Emit code to perform a block move with an interleaved sequence of
1538    loads and stores (..., ldw 0, ldw 1, stw 0, ldw 2, stw 1, ...).  SIZE and
1539    ALIGN are known constants.  DST_MEM and SRC_MEM are the destination and
1540    source memory references.  */
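/* As an illustration (the register names here are only placeholders for
   the temporaries the code allocates): for SIZE == 6 and ALIGN == 2 the
   loop below emits the interleaved sequence

        ld.h    t0,(src,0)
        ld.h    t1,(src,2)
        st.h    t0,(dst,0)
        ld.h    t0,(src,4)
        st.h    t1,(dst,2)
        st.h    t0,(dst,4)

   using two temporaries so that loads and stores alternate.  */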
1541
1542 static const enum machine_mode mode_from_align[] =
1543 {
1544 VOIDmode, QImode, HImode, VOIDmode, SImode,
1545 };
1546
1547 static void
1548 block_move_sequence (rtx dst_mem, rtx src_mem, int size, int align)
1549 {
1550 rtx temp[2];
1551 enum machine_mode mode[2];
1552 int amount[2];
1553 bool active[2];
1554 int phase = 0;
1555 int next;
1556 int offset_ld = 0;
1557 int offset_st = 0;
1558 rtx x;
1559
1560 x = XEXP (dst_mem, 0);
1561 if (!REG_P (x))
1562 {
1563 x = force_reg (Pmode, x);
1564 dst_mem = replace_equiv_address (dst_mem, x);
1565 }
1566
1567 x = XEXP (src_mem, 0);
1568 if (!REG_P (x))
1569 {
1570 x = force_reg (Pmode, x);
1571 src_mem = replace_equiv_address (src_mem, x);
1572 }
1573
1574 active[0] = active[1] = false;
1575
1576 do
1577 {
1578 next = phase;
1579 phase ^= 1;
1580
1581 if (size > 0)
1582 {
1583 int next_amount;
1584
1585 next_amount = (size >= 4 ? 4 : (size >= 2 ? 2 : 1));
1586 next_amount = MIN (next_amount, align);
1587
1588 amount[next] = next_amount;
1589 mode[next] = mode_from_align[next_amount];
1590 temp[next] = gen_reg_rtx (mode[next]);
1591
1592 x = adjust_address (src_mem, mode[next], offset_ld);
1593 emit_insn (gen_rtx_SET (VOIDmode, temp[next], x));
1594
1595 offset_ld += next_amount;
1596 size -= next_amount;
1597 active[next] = true;
1598 }
1599
1600 if (active[phase])
1601 {
1602 active[phase] = false;
1603
1604 x = adjust_address (dst_mem, mode[phase], offset_st);
1605 emit_insn (gen_rtx_SET (VOIDmode, x, temp[phase]));
1606
1607 offset_st += amount[phase];
1608 }
1609 }
1610 while (active[next]);
1611 }
1612
1613 bool
1614 mcore_expand_block_move (rtx *operands)
1615 {
1616 HOST_WIDE_INT align, bytes, max;
1617
1618 if (GET_CODE (operands[2]) != CONST_INT)
1619 return false;
1620
1621 bytes = INTVAL (operands[2]);
1622 align = INTVAL (operands[3]);
1623
1624 if (bytes <= 0)
1625 return false;
1626 if (align > 4)
1627 align = 4;
1628
1629 switch (align)
1630 {
1631 case 4:
1632 if (bytes & 1)
1633 max = 4*4;
1634 else if (bytes & 3)
1635 max = 8*4;
1636 else
1637 max = 16*4;
1638 break;
1639 case 2:
1640 max = 4*2;
1641 break;
1642 case 1:
1643 max = 4*1;
1644 break;
1645 default:
1646 gcc_unreachable ();
1647 }
1648
1649 if (bytes <= max)
1650 {
1651 block_move_sequence (operands[0], operands[1], bytes, align);
1652 return true;
1653 }
1654
1655 return false;
1656 }
1657 \f
1658
1659 /* Code to generate prologue and epilogue sequences. */
1660 static int number_of_regs_before_varargs;
1661
1662 /* Set by TARGET_SETUP_INCOMING_VARARGS to indicate to prolog that this is
1663 for a varargs function. */
1664 static int current_function_anonymous_args;
1665
1666 #define STACK_BYTES (STACK_BOUNDARY/BITS_PER_UNIT)
1667 #define STORE_REACH (64) /* Maximum displace of word store + 4. */
1668 #define ADDI_REACH (32) /* Maximum addi operand. */
1669
1670 static void
1671 layout_mcore_frame (struct mcore_frame * infp)
1672 {
1673 int n;
1674 unsigned int i;
1675 int nbytes;
1676 int regarg;
1677 int localregarg;
1678 int outbounds;
1679 unsigned int growths;
1680 int step;
1681
1682 /* Might have to spill bytes to re-assemble a big argument that
1683 was passed partially in registers and partially on the stack. */
1684 nbytes = crtl->args.pretend_args_size;
1685
1686 /* Determine how much space for spilled anonymous args (e.g., stdarg). */
1687 if (current_function_anonymous_args)
1688 nbytes += (NPARM_REGS - number_of_regs_before_varargs) * UNITS_PER_WORD;
1689
1690 infp->arg_size = nbytes;
1691
1692   /* How much space we need to save the non-volatile registers we stomp.  */
1693 infp->reg_mask = calc_live_regs (& n);
1694 infp->reg_size = n * 4;
1695
1696 /* And the rest of it... locals and space for overflowed outbounds. */
1697 infp->local_size = get_frame_size ();
1698 infp->outbound_size = crtl->outgoing_args_size;
1699
1700 /* Make sure we have a whole number of words for the locals. */
1701 if (infp->local_size % STACK_BYTES)
1702 infp->local_size = (infp->local_size + STACK_BYTES - 1) & ~ (STACK_BYTES -1);
1703
1704 /* Only thing we know we have to pad is the outbound space, since
1705 we've aligned our locals assuming that base of locals is aligned. */
1706 infp->pad_local = 0;
1707 infp->pad_reg = 0;
1708 infp->pad_outbound = 0;
1709 if (infp->outbound_size % STACK_BYTES)
1710 infp->pad_outbound = STACK_BYTES - (infp->outbound_size % STACK_BYTES);
1711
1712 /* Now we see how we want to stage the prologue so that it does
1713 the most appropriate stack growth and register saves to either:
1714 (1) run fast,
1715 (2) reduce instruction space, or
1716 (3) reduce stack space. */
1717 for (i = 0; i < ARRAY_SIZE (infp->growth); i++)
1718 infp->growth[i] = 0;
1719
1720 regarg = infp->reg_size + infp->arg_size;
1721 localregarg = infp->local_size + regarg;
1722 outbounds = infp->outbound_size + infp->pad_outbound;
1723 growths = 0;
1724
1725 /* XXX: Consider one where we consider localregarg + outbound too! */
1726
1727   /* If the frame is <= 32 bytes and using stm would save <= 2 registers,
1728      use stw's with offsets and buy the frame in one shot.  */
1729 if (localregarg <= ADDI_REACH
1730 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1731 {
1732 /* Make sure we'll be aligned. */
1733 if (localregarg % STACK_BYTES)
1734 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1735
1736 step = localregarg + infp->pad_reg;
1737 infp->reg_offset = infp->local_size;
1738
1739 if (outbounds + step <= ADDI_REACH && !frame_pointer_needed)
1740 {
1741 step += outbounds;
1742 infp->reg_offset += outbounds;
1743 outbounds = 0;
1744 }
1745
1746 infp->arg_offset = step - 4;
1747 infp->growth[growths++] = step;
1748 infp->reg_growth = growths;
1749 infp->local_growth = growths;
1750
1751 /* If we haven't already folded it in. */
1752 if (outbounds)
1753 infp->growth[growths++] = outbounds;
1754
1755 goto finish;
1756 }
1757
1758 /* Frame can't be done with a single subi, but can be done with 2
1759 insns. If the 'stm' is getting <= 2 registers, we use stw's and
1760 shift some of the stack purchase into the first subi, so both are
1761 single instructions. */
1762 if (localregarg <= STORE_REACH
1763 && (infp->local_size > ADDI_REACH)
1764 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1765 {
1766 int all;
1767
1768 /* Make sure we'll be aligned; use either pad_reg or pad_local. */
1769 if (localregarg % STACK_BYTES)
1770 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1771
1772 all = localregarg + infp->pad_reg + infp->pad_local;
1773 step = ADDI_REACH; /* As much up front as we can. */
1774 if (step > all)
1775 step = all;
1776
1777 /* XXX: Consider whether step will still be aligned; we believe so. */
1778 infp->arg_offset = step - 4;
1779 infp->growth[growths++] = step;
1780 infp->reg_growth = growths;
1781 infp->reg_offset = step - infp->pad_reg - infp->reg_size;
1782 all -= step;
1783
1784 /* Can we fold in any space required for outbounds? */
1785 if (outbounds + all <= ADDI_REACH && !frame_pointer_needed)
1786 {
1787 all += outbounds;
1788 outbounds = 0;
1789 }
1790
1791 /* Get the rest of the locals in place. */
1792 step = all;
1793 infp->growth[growths++] = step;
1794 infp->local_growth = growths;
1795 all -= step;
1796
1797 gcc_assert (all == 0);
1798
1799 /* Finish off if we need to do so. */
1800 if (outbounds)
1801 infp->growth[growths++] = outbounds;
1802
1803 goto finish;
1804 }
1805
1806 /* Registers + args is nicely aligned, so we'll buy that in one shot.
1807 Then we buy the rest of the frame in 1 or 2 steps depending on
1808 whether we need a frame pointer. */
1809 if ((regarg % STACK_BYTES) == 0)
1810 {
1811 infp->growth[growths++] = regarg;
1812 infp->reg_growth = growths;
1813 infp->arg_offset = regarg - 4;
1814 infp->reg_offset = 0;
1815
1816 if (infp->local_size % STACK_BYTES)
1817 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1818
1819 step = infp->local_size + infp->pad_local;
1820
1821 if (!frame_pointer_needed)
1822 {
1823 step += outbounds;
1824 outbounds = 0;
1825 }
1826
1827 infp->growth[growths++] = step;
1828 infp->local_growth = growths;
1829
1830 /* If there's any left to be done. */
1831 if (outbounds)
1832 infp->growth[growths++] = outbounds;
1833
1834 goto finish;
1835 }
1836
1837 /* XXX: optimizations that we'll want to play with....
1838 -- regarg is not aligned, but it's a small number of registers;
1839 use some of localsize so that regarg is aligned and then
1840 save the registers. */
1841
1842 /* Simple encoding; plods down the stack buying the pieces as it goes.
1843 -- does not optimize space consumption.
1844 -- does not attempt to optimize instruction counts.
1845 -- but it is safe for all alignments. */
1846 if (regarg % STACK_BYTES != 0)
1847 infp->pad_reg = STACK_BYTES - (regarg % STACK_BYTES);
1848
1849 infp->growth[growths++] = infp->arg_size + infp->reg_size + infp->pad_reg;
1850 infp->reg_growth = growths;
1851 infp->arg_offset = infp->growth[0] - 4;
1852 infp->reg_offset = 0;
1853
1854 if (frame_pointer_needed)
1855 {
1856 if (infp->local_size % STACK_BYTES != 0)
1857 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1858
1859 infp->growth[growths++] = infp->local_size + infp->pad_local;
1860 infp->local_growth = growths;
1861
1862 infp->growth[growths++] = outbounds;
1863 }
1864 else
1865 {
1866 if ((infp->local_size + outbounds) % STACK_BYTES != 0)
1867 infp->pad_local = STACK_BYTES - ((infp->local_size + outbounds) % STACK_BYTES);
1868
1869 infp->growth[growths++] = infp->local_size + infp->pad_local + outbounds;
1870 infp->local_growth = growths;
1871 }
1872
1873   /* Anything else that we've forgotten?  Plus a few consistency checks.  */
1874 finish:
1875 gcc_assert (infp->reg_offset >= 0);
1876 gcc_assert (growths <= MAX_STACK_GROWS);
1877
1878 for (i = 0; i < growths; i++)
1879 gcc_assert (!(infp->growth[i] % STACK_BYTES));
1880 }
1881
1882 /* Define the offset between two registers, one to be eliminated, and
1883 the other its replacement, at the start of a routine. */
1884
1885 int
1886 mcore_initial_elimination_offset (int from, int to)
1887 {
1888 int above_frame;
1889 int below_frame;
1890 struct mcore_frame fi;
1891
1892 layout_mcore_frame (& fi);
1893
1894 /* fp to ap */
1895 above_frame = fi.local_size + fi.pad_local + fi.reg_size + fi.pad_reg;
1896 /* sp to fp */
1897 below_frame = fi.outbound_size + fi.pad_outbound;
1898
1899 if (from == ARG_POINTER_REGNUM && to == FRAME_POINTER_REGNUM)
1900 return above_frame;
1901
1902 if (from == ARG_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1903 return above_frame + below_frame;
1904
1905 if (from == FRAME_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1906 return below_frame;
1907
1908 gcc_unreachable ();
1909 }
1910
1911 /* Keep track of some information about varargs for the prolog. */
1912
1913 static void
1914 mcore_setup_incoming_varargs (cumulative_args_t args_so_far_v,
1915 enum machine_mode mode, tree type,
1916 int * ptr_pretend_size ATTRIBUTE_UNUSED,
1917 int second_time ATTRIBUTE_UNUSED)
1918 {
1919 CUMULATIVE_ARGS *args_so_far = get_cumulative_args (args_so_far_v);
1920
1921 current_function_anonymous_args = 1;
1922
1923 /* We need to know how many argument registers are used before
1924 the varargs start, so that we can push the remaining argument
1925 registers during the prologue. */
1926 number_of_regs_before_varargs = *args_so_far + mcore_num_arg_regs (mode, type);
1927
1928 /* There is a bug somewhere in the arg handling code.
1929 Until I can find it this workaround always pushes the
1930 last named argument onto the stack. */
1931 number_of_regs_before_varargs = *args_so_far;
1932
1933 /* The last named argument may be split between argument registers
1934 and the stack. Allow for this here. */
1935 if (number_of_regs_before_varargs > NPARM_REGS)
1936 number_of_regs_before_varargs = NPARM_REGS;
1937 }
1938
1939 void
1940 mcore_expand_prolog (void)
1941 {
1942 struct mcore_frame fi;
1943 int space_allocated = 0;
1944 int growth = 0;
1945
1946 /* Find out what we're doing. */
1947 layout_mcore_frame (&fi);
1948
1949 space_allocated = fi.arg_size + fi.reg_size + fi.local_size +
1950 fi.outbound_size + fi.pad_outbound + fi.pad_local + fi.pad_reg;
1951
1952 if (TARGET_CG_DATA)
1953 {
1954 /* Emit a symbol for this routine's frame size. */
1955 rtx x;
1956
1957 x = DECL_RTL (current_function_decl);
1958
1959 gcc_assert (GET_CODE (x) == MEM);
1960
1961 x = XEXP (x, 0);
1962
1963 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1964
1965 free (mcore_current_function_name);
1966
1967 mcore_current_function_name = xstrdup (XSTR (x, 0));
1968
1969 ASM_OUTPUT_CG_NODE (asm_out_file, mcore_current_function_name, space_allocated);
1970
1971 if (cfun->calls_alloca)
1972 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name, "alloca", 1);
1973
1974 /* 970425: RBE:
1975 We're looking at how the 8byte alignment affects stack layout
1976 and where we had to pad things. This emits information we can
1977 extract which tells us about frame sizes and the like. */
1978 fprintf (asm_out_file,
1979 "\t.equ\t__$frame$info$_%s_$_%d_%d_x%x_%d_%d_%d,0\n",
1980 mcore_current_function_name,
1981 fi.arg_size, fi.reg_size, fi.reg_mask,
1982 fi.local_size, fi.outbound_size,
1983 frame_pointer_needed);
1984 }
1985
1986 if (mcore_naked_function_p ())
1987 return;
1988
1989 /* Handle stdarg+regsaves in one shot: can't be more than 64 bytes. */
1990 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
1991
1992 /* If we have a parameter passed partially in regs and partially in memory,
1993 the registers will have been stored to memory already in function.c. So
1994 we only need to do something here for varargs functions. */
1995 if (fi.arg_size != 0 && crtl->args.pretend_args_size == 0)
1996 {
1997 int offset;
1998 int rn = FIRST_PARM_REG + NPARM_REGS - 1;
1999 int remaining = fi.arg_size;
2000
2001 for (offset = fi.arg_offset; remaining >= 4; offset -= 4, rn--, remaining -= 4)
2002 {
2003 emit_insn (gen_movsi
2004 (gen_rtx_MEM (SImode,
2005 plus_constant (stack_pointer_rtx, offset)),
2006 gen_rtx_REG (SImode, rn)));
2007 }
2008 }
2009
2010 /* Do we need another stack adjustment before we do the register saves? */
2011 if (growth < fi.reg_growth)
2012 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2013
2014 if (fi.reg_size != 0)
2015 {
2016 int i;
2017 int offs = fi.reg_offset;
2018
2019 for (i = 15; i >= 0; i--)
2020 {
2021 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2022 {
2023 int first_reg = 15;
2024
2025 while (fi.reg_mask & (1 << first_reg))
2026 first_reg--;
2027 first_reg++;
2028
2029 emit_insn (gen_store_multiple (gen_rtx_MEM (SImode, stack_pointer_rtx),
2030 gen_rtx_REG (SImode, first_reg),
2031 GEN_INT (16 - first_reg)));
2032
2033 i -= (15 - first_reg);
2034 offs += (16 - first_reg) * 4;
2035 }
2036 else if (fi.reg_mask & (1 << i))
2037 {
2038 emit_insn (gen_movsi
2039 (gen_rtx_MEM (SImode,
2040 plus_constant (stack_pointer_rtx, offs)),
2041 gen_rtx_REG (SImode, i)));
2042 offs += 4;
2043 }
2044 }
2045 }
2046
2047 /* Figure the locals + outbounds. */
2048 if (frame_pointer_needed)
2049 {
2050 /* If we have not already adjusted the stack up to the point where 'fp' will be set. */
2051 if (growth < fi.local_growth)
2052 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2053
2054 emit_insn (gen_movsi (frame_pointer_rtx, stack_pointer_rtx));
2055
2056 /* ... and then go any remaining distance for outbounds, etc. */
2057 if (fi.growth[growth])
2058 output_stack_adjust (-1, fi.growth[growth++]);
2059 }
2060 else
2061 {
2062 if (growth < fi.local_growth)
2063 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2064 if (fi.growth[growth])
2065 output_stack_adjust (-1, fi.growth[growth++]);
2066 }
2067 }
2068
2069 void
2070 mcore_expand_epilog (void)
2071 {
2072 struct mcore_frame fi;
2073 int i;
2074 int offs;
2075 int growth = MAX_STACK_GROWS - 1;
2076
2077
2078 /* Find out what we're doing. */
2079 layout_mcore_frame (&fi);
2080
2081 if (mcore_naked_function_p ())
2082 return;
2083
2084 /* If we had a frame pointer, restore the sp from that. */
2085 if (frame_pointer_needed)
2086 {
2087 emit_insn (gen_movsi (stack_pointer_rtx, frame_pointer_rtx));
2088 growth = fi.local_growth - 1;
2089 }
2090 else
2091 {
2092 /* XXX: The while loop should accumulate the total and do a single stack adjustment. */
2093 while (growth >= fi.local_growth)
2094 {
2095 if (fi.growth[growth] != 0)
2096 output_stack_adjust (1, fi.growth[growth]);
2097 growth--;
2098 }
2099 }
2100
2101 /* Make sure we've shrunk stack back to the point where the registers
2102 were laid down. This is typically 0/1 iterations. Then pull the
2103 register save information back off the stack. */
2104 while (growth >= fi.reg_growth)
2105 output_stack_adjust ( 1, fi.growth[growth--]);
2106
2107 offs = fi.reg_offset;
2108
2109 for (i = 15; i >= 0; i--)
2110 {
2111 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2112 {
2113 int first_reg;
2114
2115 /* Find the starting register. */
2116 first_reg = 15;
2117
2118 while (fi.reg_mask & (1 << first_reg))
2119 first_reg--;
2120
2121 first_reg++;
2122
2123 emit_insn (gen_load_multiple (gen_rtx_REG (SImode, first_reg),
2124 gen_rtx_MEM (SImode, stack_pointer_rtx),
2125 GEN_INT (16 - first_reg)));
2126
2127 i -= (15 - first_reg);
2128 offs += (16 - first_reg) * 4;
2129 }
2130 else if (fi.reg_mask & (1 << i))
2131 {
2132 emit_insn (gen_movsi
2133 (gen_rtx_REG (SImode, i),
2134 gen_rtx_MEM (SImode,
2135 plus_constant (stack_pointer_rtx, offs))));
2136 offs += 4;
2137 }
2138 }
2139
2140 /* Give back anything else. */
2141 /* XXX: Should accumulate total and then give it back. */
2142 while (growth >= 0)
2143 output_stack_adjust ( 1, fi.growth[growth--]);
2144 }
2145 \f
2146 /* This code is borrowed from the SH port. */
2147
2148 /* The MCORE cannot load a large constant into a register; constants have to
2149 come from a pc relative load. The constant referenced by a pc relative load
2150 instruction must be less than 1k in front of the instruction. This
2151 means that we often have to dump a constant inside a function, and
2152 generate code to branch around it.
2153
2154 It is important to minimize this, since the branches will slow things
2155 down and make things bigger.
2156
2157 Worst case code looks like:
2158
2159 lrw L1,r0
2160 br L2
2161 align
2162 L1: .long value
2163 L2:
2164 ..
2165
2166 lrw L3,r0
2167 br L4
2168 align
2169 L3: .long value
2170 L4:
2171 ..
2172
2173 We fix this by performing a scan before scheduling, which notices which
2174 instructions need to have their operands fetched from the constant table
2175 and builds the table.
2176
2177 The algorithm is:
2178
2179 Scan, find an instruction which needs a pcrel move. Look forward, find the
2180 last barrier which is within MAX_COUNT bytes of the requirement.
2181 If there isn't one, make one. Process all the instructions between
2182 the find and the barrier.
2183
2184 In the above example, we can tell that L3 is within 1k of L1, so
2185 the first move can be shrunk from the 2 insn+constant sequence into
2186 just 1 insn, and the constant moved to L3 to make:
2187
2188 lrw L1,r0
2189 ..
2190 lrw L3,r0
2191 bra L4
2192 align
2193 L3:.long value
2194 L4:.long value
2195
2196 Then the second move becomes the target for the shortening process. */
2197
2198 typedef struct
2199 {
2200 rtx value; /* Value in table. */
2201 rtx label; /* Label of value. */
2202 } pool_node;
2203
2204 /* The maximum number of constants that can fit into one pool, since
2205 the pc relative range is 0...1020 bytes and constants are at least 4
2206 bytes long. We subtract 4 from the range to allow for the case where
2207 we need to add a branch/align before the constant pool. */
2208
2209 #define MAX_COUNT 1016
2210 #define MAX_POOL_SIZE (MAX_COUNT/4)
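/* A quick worked check of the figures above (editorial illustration):
   the pc relative range is 0...1020 bytes and 4 bytes are reserved for a
   possible branch/align ahead of the pool, so MAX_COUNT = 1020 - 4 = 1016;
   with entries of at least 4 bytes each that allows MAX_POOL_SIZE =
   1016 / 4 = 254 constants per pool.  */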
2211 static pool_node pool_vector[MAX_POOL_SIZE];
2212 static int pool_size;
2213
2214 /* Dump out any constants accumulated in the final pass. These
2215 will only be labels. */
2216
2217 const char *
2218 mcore_output_jump_label_table (void)
2219 {
2220 int i;
2221
2222 if (pool_size)
2223 {
2224 fprintf (asm_out_file, "\t.align 2\n");
2225
2226 for (i = 0; i < pool_size; i++)
2227 {
2228 pool_node * p = pool_vector + i;
2229
2230 (*targetm.asm_out.internal_label) (asm_out_file, "L", CODE_LABEL_NUMBER (p->label));
2231
2232 output_asm_insn (".long %0", &p->value);
2233 }
2234
2235 pool_size = 0;
2236 }
2237
2238 return "";
2239 }
2240
2241 /* Check whether insn is a candidate for a conditional. */
2242
2243 static cond_type
2244 is_cond_candidate (rtx insn)
2245 {
2246 /* The only things we conditionalize are those that can be directly
2247 changed into a conditional. Only bother with SImode items. If
2248 we wanted to be a little more aggressive, we could also do other
2249 modes such as DImode with reg-reg move or load 0. */
2250 if (GET_CODE (insn) == INSN)
2251 {
2252 rtx pat = PATTERN (insn);
2253 rtx src, dst;
2254
2255 if (GET_CODE (pat) != SET)
2256 return COND_NO;
2257
2258 dst = XEXP (pat, 0);
2259
2260 if ((GET_CODE (dst) != REG &&
2261 GET_CODE (dst) != SUBREG) ||
2262 GET_MODE (dst) != SImode)
2263 return COND_NO;
2264
2265 src = XEXP (pat, 1);
2266
2267 if ((GET_CODE (src) == REG ||
2268 (GET_CODE (src) == SUBREG &&
2269 GET_CODE (SUBREG_REG (src)) == REG)) &&
2270 GET_MODE (src) == SImode)
2271 return COND_MOV_INSN;
2272 else if (GET_CODE (src) == CONST_INT &&
2273 INTVAL (src) == 0)
2274 return COND_CLR_INSN;
2275 else if (GET_CODE (src) == PLUS &&
2276 (GET_CODE (XEXP (src, 0)) == REG ||
2277 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2278 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2279 GET_MODE (XEXP (src, 0)) == SImode &&
2280 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2281 INTVAL (XEXP (src, 1)) == 1)
2282 return COND_INC_INSN;
2283 else if (((GET_CODE (src) == MINUS &&
2284 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2285 INTVAL( XEXP (src, 1)) == 1) ||
2286 (GET_CODE (src) == PLUS &&
2287 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2288 INTVAL (XEXP (src, 1)) == -1)) &&
2289 (GET_CODE (XEXP (src, 0)) == REG ||
2290 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2291 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2292 GET_MODE (XEXP (src, 0)) == SImode)
2293 return COND_DEC_INSN;
2294
2295 /* Some insns that we don't bother with:
2296 (set (rx:DI) (ry:DI))
2297 (set (rx:DI) (const_int 0))
2298 */
2299
2300 }
2301 else if (GET_CODE (insn) == JUMP_INSN &&
2302 GET_CODE (PATTERN (insn)) == SET &&
2303 GET_CODE (XEXP (PATTERN (insn), 1)) == LABEL_REF)
2304 return COND_BRANCH_INSN;
2305
2306 return COND_NO;
2307 }
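/* Editorial illustration of the classification above; the register
   numbers are arbitrary examples, not fixed by the port:

     (set (reg:SI 7) (reg:SI 8))                           -> COND_MOV_INSN
     (set (reg:SI 7) (const_int 0))                        -> COND_CLR_INSN
     (set (reg:SI 7) (plus:SI (reg:SI 7) (const_int 1)))   -> COND_INC_INSN
     (set (reg:SI 7) (plus:SI (reg:SI 7) (const_int -1)))  -> COND_DEC_INSN
     (set (pc) (label_ref ...))                            -> COND_BRANCH_INSN  */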
2308
2309 /* Emit a conditional version of insn and replace the old insn with the
2310 new one. Return the new insn if emitted. */
2311
2312 static rtx
2313 emit_new_cond_insn (rtx insn, int cond)
2314 {
2315 rtx c_insn = 0;
2316 rtx pat, dst, src;
2317 cond_type num;
2318
2319 if ((num = is_cond_candidate (insn)) == COND_NO)
2320 return NULL;
2321
2322 pat = PATTERN (insn);
2323
2324 if (GET_CODE (insn) == INSN)
2325 {
2326 dst = SET_DEST (pat);
2327 src = SET_SRC (pat);
2328 }
2329 else
2330 {
2331 dst = JUMP_LABEL (insn);
2332 src = NULL_RTX;
2333 }
2334
2335 switch (num)
2336 {
2337 case COND_MOV_INSN:
2338 case COND_CLR_INSN:
2339 if (cond)
2340 c_insn = gen_movt0 (dst, src, dst);
2341 else
2342 c_insn = gen_movt0 (dst, dst, src);
2343 break;
2344
2345 case COND_INC_INSN:
2346 if (cond)
2347 c_insn = gen_incscc (dst, dst);
2348 else
2349 c_insn = gen_incscc_false (dst, dst);
2350 break;
2351
2352 case COND_DEC_INSN:
2353 if (cond)
2354 c_insn = gen_decscc (dst, dst);
2355 else
2356 c_insn = gen_decscc_false (dst, dst);
2357 break;
2358
2359 case COND_BRANCH_INSN:
2360 if (cond)
2361 c_insn = gen_branch_true (dst);
2362 else
2363 c_insn = gen_branch_false (dst);
2364 break;
2365
2366 default:
2367 return NULL;
2368 }
2369
2370 /* Only copy the notes if they exist. */
2371 if (rtx_length [GET_CODE (c_insn)] >= 7 && rtx_length [GET_CODE (insn)] >= 7)
2372 {
2373 /* We really don't need to bother with the notes and links at this
2374 point, but go ahead and save the notes. This will help is_dead()
2375 when applying peepholes (links don't matter since they are not
2376 used any more beyond this point for the mcore). */
2377 REG_NOTES (c_insn) = REG_NOTES (insn);
2378 }
2379
2380 if (num == COND_BRANCH_INSN)
2381 {
2382 /* For jumps, we need to be a little bit careful and emit the new jump
2383 before the old one and to update the use count for the target label.
2384 This way, the barrier following the old (uncond) jump will get
2385 deleted, but the label won't. */
2386 c_insn = emit_jump_insn_before (c_insn, insn);
2387
2388 ++ LABEL_NUSES (dst);
2389
2390 JUMP_LABEL (c_insn) = dst;
2391 }
2392 else
2393 c_insn = emit_insn_after (c_insn, insn);
2394
2395 delete_insn (insn);
2396
2397 return c_insn;
2398 }
2399
2400 /* Attempt to change a basic block into a series of conditional insns. This
2401 works by taking the branch at the end of the 1st block and scanning for the
2402 end of the 2nd block. If all instructions in the 2nd block have cond.
2403 versions and the label at the start of block 3 is the same as the target
2404 from the branch at block 1, then conditionalize all insns in block 2 using
2405 the inverse condition of the branch at block 1. (Note I'm bending the
2406 definition of basic block here.)
2407
2408 e.g., change:
2409
2410 bt L2 <-- end of block 1 (delete)
2411 mov r7,r8
2412 addu r7,1
2413 br L3 <-- end of block 2
2414
2415 L2: ... <-- start of block 3 (NUSES==1)
2416 L3: ...
2417
2418 to:
2419
2420 movf r7,r8
2421 incf r7
2422 bf L3
2423
2424 L3: ...
2425
2426 we can delete the L2 label if NUSES==1 and re-apply the optimization
2427 starting at the last instruction of block 2. This may allow an entire
2428 if-then-else statement to be conditionalized. BRC */
2429 static rtx
2430 conditionalize_block (rtx first)
2431 {
2432 rtx insn;
2433 rtx br_pat;
2434 rtx end_blk_1_br = 0;
2435 rtx end_blk_2_insn = 0;
2436 rtx start_blk_3_lab = 0;
2437 int cond;
2438 int br_lab_num;
2439 int blk_size = 0;
2440
2441
2442 /* Check that the first insn is a candidate conditional jump. This is
2443 the one that we'll eliminate. If not, advance to the next insn to
2444 try. */
2445 if (GET_CODE (first) != JUMP_INSN ||
2446 GET_CODE (PATTERN (first)) != SET ||
2447 GET_CODE (XEXP (PATTERN (first), 1)) != IF_THEN_ELSE)
2448 return NEXT_INSN (first);
2449
2450 /* Extract some information we need. */
2451 end_blk_1_br = first;
2452 br_pat = PATTERN (end_blk_1_br);
2453
2454 /* Complement the condition since we use the reverse cond. for the insns. */
2455 cond = (GET_CODE (XEXP (XEXP (br_pat, 1), 0)) == EQ);
2456
2457 /* Determine what kind of branch we have. */
2458 if (GET_CODE (XEXP (XEXP (br_pat, 1), 1)) == LABEL_REF)
2459 {
2460 /* A normal branch, so extract label out of first arm. */
2461 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 1), 0));
2462 }
2463 else
2464 {
2465 /* An inverse branch, so extract the label out of the 2nd arm
2466 and complement the condition. */
2467 cond = (cond == 0);
2468 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 2), 0));
2469 }
2470
2471 /* Scan forward for the start of block 3: it must start with a
2472 label and that label must be the same as the branch target
2473 label from block 1. We don't care about whether block 2 actually
2474 ends with a branch or a label (an uncond. branch is
2475 conditionalizable). */
2476 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
2477 {
2478 enum rtx_code code;
2479
2480 code = GET_CODE (insn);
2481
2482 /* Look for the label at the start of block 3. */
2483 if (code == CODE_LABEL && CODE_LABEL_NUMBER (insn) == br_lab_num)
2484 break;
2485
2486 /* Skip barriers, notes, and conditionalizable insns. If the
2487 insn is not conditionalizable or makes this optimization fail,
2488 just return the next insn so we can start over from that point. */
2489 if (code != BARRIER && code != NOTE && !is_cond_candidate (insn))
2490 return NEXT_INSN (insn);
2491
2492 /* Remember the last real insn before the label (i.e. end of block 2). */
2493 if (code == JUMP_INSN || code == INSN)
2494 {
2495 blk_size ++;
2496 end_blk_2_insn = insn;
2497 }
2498 }
2499
2500 if (!insn)
2501 return insn;
2502
2503 /* It is possible for this optimization to slow performance if the blocks
2504 are long. This really depends upon whether the branch is likely taken
2505 or not. If the branch is taken, we slow performance in many cases. But,
2506 if the branch is not taken, we always help performance (for a single
2507 block, but for a double block (i.e. when the optimization is re-applied)
2508 this is not true since the 'right thing' depends on the overall length of
2509 the collapsed block). As a compromise, don't apply this optimization on
2510 blocks larger than size 2 (unlikely for the mcore) when speed is important.
2511 The best threshold depends on the latencies of the instructions (i.e.,
2512 the branch penalty). */
2513 if (optimize > 1 && blk_size > 2)
2514 return insn;
2515
2516 /* At this point, we've found the start of block 3 and we know that
2517 it is the destination of the branch from block 1. Also, all
2518 instructions in the block 2 are conditionalizable. So, apply the
2519 conditionalization and delete the branch. */
2520 start_blk_3_lab = insn;
2521
2522 for (insn = NEXT_INSN (end_blk_1_br); insn != start_blk_3_lab;
2523 insn = NEXT_INSN (insn))
2524 {
2525 rtx newinsn;
2526
2527 if (INSN_DELETED_P (insn))
2528 continue;
2529
2530 /* Try to form a conditional variant of the instruction and emit it. */
2531 if ((newinsn = emit_new_cond_insn (insn, cond)))
2532 {
2533 if (end_blk_2_insn == insn)
2534 end_blk_2_insn = newinsn;
2535
2536 insn = newinsn;
2537 }
2538 }
2539
2540 /* Note whether we will delete the label starting blk 3 when the jump
2541 gets deleted. If so, we want to re-apply this optimization at the
2542 last real instruction right before the label. */
2543 if (LABEL_NUSES (start_blk_3_lab) == 1)
2544 {
2545 start_blk_3_lab = 0;
2546 }
2547
2548 /* ??? We probably should redistribute the death notes for this insn, esp.
2549 the death of cc, but it doesn't really matter this late in the game.
2550 The peepholes all use is_dead() which will find the correct death
2551 regardless of whether there is a note. */
2552 delete_insn (end_blk_1_br);
2553
2554 if (! start_blk_3_lab)
2555 return end_blk_2_insn;
2556
2557 /* Return the insn right after the label at the start of block 3. */
2558 return NEXT_INSN (start_blk_3_lab);
2559 }
2560
2561 /* Apply the conditionalization of blocks optimization. This is the
2562 outer loop that traverses through the insns scanning for a branch
2563 that signifies an opportunity to apply the optimization. Note that
2564 this optimization is applied late. If we could apply it earlier,
2565 say before cse 2, it may expose more optimization opportunities.
2566 But the payback probably isn't really worth the effort (we'd have
2567 to update all reg/flow/notes/links/etc to make it work - and stick it
2568 in before cse 2). */
2569
2570 static void
2571 conditionalize_optimization (void)
2572 {
2573 rtx insn;
2574
2575 for (insn = get_insns (); insn; insn = conditionalize_block (insn))
2576 continue;
2577 }
2578
2579 static int saved_warn_return_type = -1;
2580 static int saved_warn_return_type_count = 0;
2581
2582 /* This is to handle loads from the constant pool. */
2583
2584 static void
2585 mcore_reorg (void)
2586 {
2587 /* Reset this variable. */
2588 current_function_anonymous_args = 0;
2589
2590 /* Restore the warn_return_type if it has been altered. */
2591 if (saved_warn_return_type != -1)
2592 {
2593 /* Only restore the value if we have reached another function.
2594 The test of warn_return_type occurs in finish_function () in
2595 c-decl.c a long time after the code for the function is generated,
2596 so we need a counter to tell us when we have finished parsing that
2597 function and can restore the flag. */
2598 if (--saved_warn_return_type_count == 0)
2599 {
2600 warn_return_type = saved_warn_return_type;
2601 saved_warn_return_type = -1;
2602 }
2603 }
2604
2605 if (optimize == 0)
2606 return;
2607
2608 /* Conditionalize blocks where we can. */
2609 conditionalize_optimization ();
2610
2611 /* Literal pool generation is now pushed off until the assembler. */
2612 }
2613
2614 \f
2615 /* Return true if X is something that can be moved directly into r15. */
2616
2617 bool
2618 mcore_r15_operand_p (rtx x)
2619 {
2620 switch (GET_CODE (x))
2621 {
2622 case CONST_INT:
2623 return mcore_const_ok_for_inline (INTVAL (x));
2624
2625 case REG:
2626 case SUBREG:
2627 case MEM:
2628 return 1;
2629
2630 default:
2631 return 0;
2632 }
2633 }
2634
2635 /* Implement SECONDARY_RELOAD_CLASS. If RCLASS contains r15, and we can't
2636 directly move X into it, use r1-r14 as a temporary. */
2637
2638 enum reg_class
2639 mcore_secondary_reload_class (enum reg_class rclass,
2640 enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
2641 {
2642 if (TEST_HARD_REG_BIT (reg_class_contents[rclass], 15)
2643 && !mcore_r15_operand_p (x))
2644 return LRW_REGS;
2645 return NO_REGS;
2646 }
2647
2648 /* Return the reg_class to use when reloading the rtx X into the class
2649 RCLASS. If X is too complex to move directly into r15, prefer to
2650 use LRW_REGS instead. */
2651
2652 enum reg_class
2653 mcore_reload_class (rtx x, enum reg_class rclass)
2654 {
2655 if (reg_class_subset_p (LRW_REGS, rclass) && !mcore_r15_operand_p (x))
2656 return LRW_REGS;
2657
2658 return rclass;
2659 }
2660
2661 /* Tell me if a pair of reg/subreg rtx's actually refer to the same
2662 register. Note that the current version doesn't worry about whether
2663 they are the same mode or not (e.g., a QImode in r2 matches an HImode
2664 in r2, which matches an SImode in r2). Might think in the future about whether
2665 we want to be able to say something about modes. */
2666
2667 int
2668 mcore_is_same_reg (rtx x, rtx y)
2669 {
2670 /* Strip any and all of the subreg wrappers. */
2671 while (GET_CODE (x) == SUBREG)
2672 x = SUBREG_REG (x);
2673
2674 while (GET_CODE (y) == SUBREG)
2675 y = SUBREG_REG (y);
2676
2677 if (GET_CODE(x) == REG && GET_CODE(y) == REG && REGNO(x) == REGNO(y))
2678 return 1;
2679
2680 return 0;
2681 }
2682
2683 static void
2684 mcore_option_override (void)
2685 {
2686 /* Only the m340 supports little endian code. */
2687 if (TARGET_LITTLE_END && ! TARGET_M340)
2688 target_flags |= MASK_M340;
2689 }
2690
2691 \f
2692 /* Compute the number of word sized registers needed to
2693 hold a function argument of mode MODE and type TYPE. */
2694
2695 int
2696 mcore_num_arg_regs (enum machine_mode mode, const_tree type)
2697 {
2698 int size;
2699
2700 if (targetm.calls.must_pass_in_stack (mode, type))
2701 return 0;
2702
2703 if (type && mode == BLKmode)
2704 size = int_size_in_bytes (type);
2705 else
2706 size = GET_MODE_SIZE (mode);
2707
2708 return ROUND_ADVANCE (size);
2709 }
2710
2711 static rtx
2712 handle_structs_in_regs (enum machine_mode mode, const_tree type, int reg)
2713 {
2714 int size;
2715
2716 /* The MCore ABI defines that a structure whose size is not a whole multiple
2717 of the word size is passed packed into registers (or spilled onto the stack if
2718 not enough registers are available) with the last few bytes of the
2719 structure being packed, left-justified, into the last register/stack slot.
2720 GCC handles this correctly if the last word is in a stack slot, but we
2721 have to generate a special, PARALLEL RTX if the last word is in an
2722 argument register. */
2723 if (type
2724 && TYPE_MODE (type) == BLKmode
2725 && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST
2726 && (size = int_size_in_bytes (type)) > UNITS_PER_WORD
2727 && (size % UNITS_PER_WORD != 0)
2728 && (reg + mcore_num_arg_regs (mode, type) <= (FIRST_PARM_REG + NPARM_REGS)))
2729 {
2730 rtx arg_regs [NPARM_REGS];
2731 int nregs;
2732 rtx result;
2733 rtvec rtvec;
2734
2735 for (nregs = 0; size > 0; size -= UNITS_PER_WORD)
2736 {
2737 arg_regs [nregs] =
2738 gen_rtx_EXPR_LIST (SImode, gen_rtx_REG (SImode, reg ++),
2739 GEN_INT (nregs * UNITS_PER_WORD));
2740 nregs ++;
2741 }
2742
2743 /* We assume here that NPARM_REGS == 6. The assert checks this. */
2744 gcc_assert (ARRAY_SIZE (arg_regs) == 6);
2745 rtvec = gen_rtvec (nregs, arg_regs[0], arg_regs[1], arg_regs[2],
2746 arg_regs[3], arg_regs[4], arg_regs[5]);
2747
2748 result = gen_rtx_PARALLEL (mode, rtvec);
2749 return result;
2750 }
2751
2752 return gen_rtx_REG (mode, reg);
2753 }
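/* Editorial illustration of the PARALLEL built above, assuming
   UNITS_PER_WORD == 4 and a hypothetical 10-byte BLKmode structure whose
   first word lands in hardware register 2: three words are needed, so the
   result names registers 2, 3 and 4 at byte offsets 0, 4 and 8, with the
   last two bytes packed, left-justified, into register 4:

     (parallel:BLK [(expr_list (reg:SI 2) (const_int 0))
                    (expr_list (reg:SI 3) (const_int 4))
                    (expr_list (reg:SI 4) (const_int 8))])  */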
2754
2755 rtx
2756 mcore_function_value (const_tree valtype, const_tree func)
2757 {
2758 enum machine_mode mode;
2759 int unsigned_p;
2760
2761 mode = TYPE_MODE (valtype);
2762
2763 /* Since we promote return types, we must promote the mode here too. */
2764 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1);
2765
2766 return handle_structs_in_regs (mode, valtype, FIRST_RET_REG);
2767 }
2768
2769 /* Define where to put the arguments to a function.
2770 Value is zero to push the argument on the stack,
2771 or a hard register in which to store the argument.
2772
2773 MODE is the argument's machine mode.
2774 TYPE is the data type of the argument (as a tree).
2775 This is null for libcalls where that information may
2776 not be available.
2777 CUM is a variable of type CUMULATIVE_ARGS which gives info about
2778 the preceding args and about the function being called.
2779 NAMED is nonzero if this argument is a named parameter
2780 (otherwise it is an extra parameter matching an ellipsis).
2781
2782 On MCore the first args are normally in registers
2783 and the rest are pushed. Any arg that starts within the first
2784 NPARM_REGS words is at least partially passed in a register unless
2785 its data type forbids. */
2786
2787 static rtx
2788 mcore_function_arg (cumulative_args_t cum, enum machine_mode mode,
2789 const_tree type, bool named)
2790 {
2791 int arg_reg;
2792
2793 if (! named || mode == VOIDmode)
2794 return 0;
2795
2796 if (targetm.calls.must_pass_in_stack (mode, type))
2797 return 0;
2798
2799 arg_reg = ROUND_REG (*get_cumulative_args (cum), mode);
2800
2801 if (arg_reg < NPARM_REGS)
2802 return handle_structs_in_regs (mode, type, FIRST_PARM_REG + arg_reg);
2803
2804 return 0;
2805 }
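/* Editorial example of the convention above: with no argument registers
   consumed yet, the first named SImode argument comes back as
   (reg:SI FIRST_PARM_REG), i.e. argument register 0; once NPARM_REGS
   argument words are in use the function returns 0 and the argument is
   pushed onto the stack instead.  */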
2806
2807 static void
2808 mcore_function_arg_advance (cumulative_args_t cum_v, enum machine_mode mode,
2809 const_tree type, bool named ATTRIBUTE_UNUSED)
2810 {
2811 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
2812
2813 *cum = (ROUND_REG (*cum, mode)
2814 + (int)named * mcore_num_arg_regs (mode, type));
2815 }
2816
2817 static unsigned int
2818 mcore_function_arg_boundary (enum machine_mode mode,
2819 const_tree type ATTRIBUTE_UNUSED)
2820 {
2821 /* Doubles must be aligned to an 8 byte boundary. */
2822 return (mode != BLKmode && GET_MODE_SIZE (mode) == 8
2823 ? BIGGEST_ALIGNMENT
2824 : PARM_BOUNDARY);
2825 }
2826
2827 /* Returns the number of bytes of argument registers required to hold *part*
2828 of a parameter of machine mode MODE and type TYPE (which may be NULL if
2829 the type is not known). If the argument fits entirely in the argument
2830 registers, or entirely on the stack, then 0 is returned. CUM is the
2831 number of argument registers already used by earlier parameters to
2832 the function. */
2833
2834 static int
2835 mcore_arg_partial_bytes (cumulative_args_t cum, enum machine_mode mode,
2836 tree type, bool named)
2837 {
2838 int reg = ROUND_REG (*get_cumulative_args (cum), mode);
2839
2840 if (named == 0)
2841 return 0;
2842
2843 if (targetm.calls.must_pass_in_stack (mode, type))
2844 return 0;
2845
2846 /* REG is not the *hardware* register number of the register that holds
2847 the argument, it is the *argument* register number. So for example,
2848 the first argument to a function goes in argument register 0, which
2849 translates (for the MCore) into hardware register 2. The second
2850 argument goes into argument register 1, which translates into hardware
2851 register 3, and so on. NPARM_REGS is the number of argument registers
2852 supported by the target, not the maximum hardware register number of
2853 the target. */
2854 if (reg >= NPARM_REGS)
2855 return 0;
2856
2857 /* If the argument fits entirely in registers, return 0. */
2858 if (reg + mcore_num_arg_regs (mode, type) <= NPARM_REGS)
2859 return 0;
2860
2861 /* The argument overflows the number of available argument registers.
2862 Compute how many argument registers have not yet been assigned to
2863 hold an argument. */
2864 reg = NPARM_REGS - reg;
2865
2866 /* Return partially in registers and partially on the stack. */
2867 return reg * UNITS_PER_WORD;
2868 }
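/* Editorial worked example, assuming NPARM_REGS == 6 and 4-byte words:
   an argument needing three words whose first word falls in argument
   register 4 has only registers 4 and 5 left, so 2 * UNITS_PER_WORD = 8
   bytes are passed in registers and the remaining word goes onto the
   stack; an argument starting in register 0 that needs three words fits
   entirely in registers, so 0 is returned.  A minimal standalone sketch
   of the same arithmetic (illustrative only, hence compiled out):  */
#if 0
static int
partial_bytes_sketch (int first_arg_reg, int arg_words)
{
  if (first_arg_reg >= 6)
    return 0;                        /* Entirely on the stack.  */
  if (first_arg_reg + arg_words <= 6)
    return 0;                        /* Entirely in registers.  */
  return (6 - first_arg_reg) * 4;    /* Bytes that land in registers.  */
}
#endif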
2869 \f
2870 /* Return nonzero if SYMBOL is marked as being dllexport'd. */
2871
2872 int
2873 mcore_dllexport_name_p (const char * symbol)
2874 {
2875 return symbol[0] == '@' && symbol[1] == 'e' && symbol[2] == '.';
2876 }
2877
2878 /* Return nonzero if SYMBOL is marked as being dllimport'd. */
2879
2880 int
2881 mcore_dllimport_name_p (const char * symbol)
2882 {
2883 return symbol[0] == '@' && symbol[1] == 'i' && symbol[2] == '.';
2884 }
2885
2886 /* Mark a DECL as being dllexport'd. */
2887
2888 static void
2889 mcore_mark_dllexport (tree decl)
2890 {
2891 const char * oldname;
2892 char * newname;
2893 rtx rtlname;
2894 tree idp;
2895
2896 rtlname = XEXP (DECL_RTL (decl), 0);
2897
2898 if (GET_CODE (rtlname) == MEM)
2899 rtlname = XEXP (rtlname, 0);
2900 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2901 oldname = XSTR (rtlname, 0);
2902
2903 if (mcore_dllexport_name_p (oldname))
2904 return; /* Already done. */
2905
2906 newname = XALLOCAVEC (char, strlen (oldname) + 4);
2907 sprintf (newname, "@e.%s", oldname);
2908
2909 /* We pass newname through get_identifier to ensure it has a unique
2910 address. RTL processing can sometimes peek inside the symbol ref
2911 and compare the string's addresses to see if two symbols are
2912 identical. */
2913 /* ??? At least I think that's why we do this. */
2914 idp = get_identifier (newname);
2915
2916 XEXP (DECL_RTL (decl), 0) =
2917 gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
2918 }
2919
2920 /* Mark a DECL as being dllimport'd. */
2921
2922 static void
2923 mcore_mark_dllimport (tree decl)
2924 {
2925 const char * oldname;
2926 char * newname;
2927 tree idp;
2928 rtx rtlname;
2929 rtx newrtl;
2930
2931 rtlname = XEXP (DECL_RTL (decl), 0);
2932
2933 if (GET_CODE (rtlname) == MEM)
2934 rtlname = XEXP (rtlname, 0);
2935 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2936 oldname = XSTR (rtlname, 0);
2937
2938 gcc_assert (!mcore_dllexport_name_p (oldname));
2939 if (mcore_dllimport_name_p (oldname))
2940 return; /* Already done. */
2941
2942 /* ??? One can well ask why we're making these checks here,
2943 and that would be a good question. */
2944
2945 /* Imported variables can't be initialized. */
2946 if (TREE_CODE (decl) == VAR_DECL
2947 && !DECL_VIRTUAL_P (decl)
2948 && DECL_INITIAL (decl))
2949 {
2950 error ("initialized variable %q+D is marked dllimport", decl);
2951 return;
2952 }
2953
2954 /* `extern' needn't be specified with dllimport.
2955 Specify `extern' now and hope for the best. Sigh. */
2956 if (TREE_CODE (decl) == VAR_DECL
2957 /* ??? Is this test for vtables needed? */
2958 && !DECL_VIRTUAL_P (decl))
2959 {
2960 DECL_EXTERNAL (decl) = 1;
2961 TREE_PUBLIC (decl) = 1;
2962 }
2963
2964 newname = XALLOCAVEC (char, strlen (oldname) + 11);
2965 sprintf (newname, "@i.__imp_%s", oldname);
2966
2967 /* We pass newname through get_identifier to ensure it has a unique
2968 address. RTL processing can sometimes peek inside the symbol ref
2969 and compare the string's addresses to see if two symbols are
2970 identical. */
2971 /* ??? At least I think that's why we do this. */
2972 idp = get_identifier (newname);
2973
2974 newrtl = gen_rtx_MEM (Pmode,
2975 gen_rtx_SYMBOL_REF (Pmode,
2976 IDENTIFIER_POINTER (idp)));
2977 XEXP (DECL_RTL (decl), 0) = newrtl;
2978 }
2979
2980 static int
2981 mcore_dllexport_p (tree decl)
2982 {
2983 if ( TREE_CODE (decl) != VAR_DECL
2984 && TREE_CODE (decl) != FUNCTION_DECL)
2985 return 0;
2986
2987 return lookup_attribute ("dllexport", DECL_ATTRIBUTES (decl)) != 0;
2988 }
2989
2990 static int
2991 mcore_dllimport_p (tree decl)
2992 {
2993 if ( TREE_CODE (decl) != VAR_DECL
2994 && TREE_CODE (decl) != FUNCTION_DECL)
2995 return 0;
2996
2997 return lookup_attribute ("dllimport", DECL_ATTRIBUTES (decl)) != 0;
2998 }
2999
3000 /* We must mark dll symbols specially. Definitions of dllexport'd objects
3001 install some info in the .drectve (PE) or .exports (ELF) sections. */
3002
3003 static void
3004 mcore_encode_section_info (tree decl, rtx rtl ATTRIBUTE_UNUSED, int first ATTRIBUTE_UNUSED)
3005 {
3006 /* Mark the decl so we can tell from the rtl whether the object is
3007 dllexport'd or dllimport'd. */
3008 if (mcore_dllexport_p (decl))
3009 mcore_mark_dllexport (decl);
3010 else if (mcore_dllimport_p (decl))
3011 mcore_mark_dllimport (decl);
3012
3013 /* It might be that DECL has already been marked as dllimport, but
3014 a subsequent definition nullified that. The attribute is gone
3015 but DECL_RTL still has @i.__imp_foo. We need to remove that. */
3016 else if ((TREE_CODE (decl) == FUNCTION_DECL
3017 || TREE_CODE (decl) == VAR_DECL)
3018 && DECL_RTL (decl) != NULL_RTX
3019 && GET_CODE (DECL_RTL (decl)) == MEM
3020 && GET_CODE (XEXP (DECL_RTL (decl), 0)) == MEM
3021 && GET_CODE (XEXP (XEXP (DECL_RTL (decl), 0), 0)) == SYMBOL_REF
3022 && mcore_dllimport_name_p (XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0)))
3023 {
3024 const char * oldname = XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0);
3025 tree idp = get_identifier (oldname + 9);
3026 rtx newrtl = gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
3027
3028 XEXP (DECL_RTL (decl), 0) = newrtl;
3029
3030 /* We previously set TREE_PUBLIC and DECL_EXTERNAL.
3031 ??? We leave these alone for now. */
3032 }
3033 }
3034
3035 /* Undo the effects of the above. */
3036
3037 static const char *
3038 mcore_strip_name_encoding (const char * str)
3039 {
3040 return str + (str[0] == '@' ? 3 : 0);
3041 }
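/* Editorial examples of the encoding scheme: mcore_mark_dllexport turns
   "foo" into "@e.foo" and mcore_mark_dllimport turns it into
   "@i.__imp_foo"; mcore_strip_name_encoding drops the three character
   "@e." / "@i." prefix again, yielding "foo" and "__imp_foo"
   respectively.  */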
3042
3043 /* MCore specific attribute support.
3044 dllexport - for exporting a function/variable that will live in a dll
3045 dllimport - for importing a function/variable from a dll
3046 naked - do not create a function prologue/epilogue. */
3047
3048 /* Handle a "naked" attribute; arguments as in
3049 struct attribute_spec.handler. */
3050
3051 static tree
3052 mcore_handle_naked_attribute (tree * node, tree name, tree args ATTRIBUTE_UNUSED,
3053 int flags ATTRIBUTE_UNUSED, bool * no_add_attrs)
3054 {
3055 if (TREE_CODE (*node) == FUNCTION_DECL)
3056 {
3057 /* PR14310 - don't complain about lack of return statement
3058 in naked functions. The solution here is a gross hack
3059 but this is the only way to solve the problem without
3060 adding a new feature to GCC. I did try submitting a patch
3061 that would add such a new feature, but it was (rightfully)
3062 rejected on the grounds that it was creeping featurism,
3063 hence this code. */
3064 if (warn_return_type)
3065 {
3066 saved_warn_return_type = warn_return_type;
3067 warn_return_type = 0;
3068 saved_warn_return_type_count = 2;
3069 }
3070 else if (saved_warn_return_type_count)
3071 saved_warn_return_type_count = 2;
3072 }
3073 else
3074 {
3075 warning (OPT_Wattributes, "%qE attribute only applies to functions",
3076 name);
3077 *no_add_attrs = true;
3078 }
3079
3080 return NULL_TREE;
3081 }
3082
3083 /* ??? It looks like this is PE specific? Oh well, this is what the
3084 old code did as well. */
3085
3086 static void
3087 mcore_unique_section (tree decl, int reloc ATTRIBUTE_UNUSED)
3088 {
3089 int len;
3090 const char * name;
3091 char * string;
3092 const char * prefix;
3093
3094 name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl));
3095
3096 /* Strip off any encoding in name. */
3097 name = (* targetm.strip_name_encoding) (name);
3098
3099 /* The object is put in, for example, section .text$foo.
3100 The linker will then ultimately place it in .text
3101 (everything from the $ on is stripped). */
3102 if (TREE_CODE (decl) == FUNCTION_DECL)
3103 prefix = ".text$";
3104 /* For compatibility with EPOC, we ignore the fact that the
3105 section might have relocs against it. */
3106 else if (decl_readonly_section (decl, 0))
3107 prefix = ".rdata$";
3108 else
3109 prefix = ".data$";
3110
3111 len = strlen (name) + strlen (prefix);
3112 string = XALLOCAVEC (char, len + 1);
3113
3114 sprintf (string, "%s%s", prefix, name);
3115
3116 DECL_SECTION_NAME (decl) = build_string (len, string);
3117 }
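/* Editorial example: a function `foo' lands in section ".text$foo", a
   read-only variable `bar' in ".rdata$bar" and a writable one in
   ".data$bar"; the linker later folds these back into .text, .rdata and
   .data by stripping everything from the `$' onwards.  */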
3118
3119 int
3120 mcore_naked_function_p (void)
3121 {
3122 return lookup_attribute ("naked", DECL_ATTRIBUTES (current_function_decl)) != NULL_TREE;
3123 }
3124
3125 #ifdef OBJECT_FORMAT_ELF
3126 static void
3127 mcore_asm_named_section (const char *name,
3128 unsigned int flags ATTRIBUTE_UNUSED,
3129 tree decl ATTRIBUTE_UNUSED)
3130 {
3131 fprintf (asm_out_file, "\t.section %s\n", name);
3132 }
3133 #endif /* OBJECT_FORMAT_ELF */
3134
3135 /* Worker function for TARGET_ASM_EXTERNAL_LIBCALL. */
3136
3137 static void
3138 mcore_external_libcall (rtx fun)
3139 {
3140 fprintf (asm_out_file, "\t.import\t");
3141 assemble_name (asm_out_file, XSTR (fun, 0));
3142 fprintf (asm_out_file, "\n");
3143 }
3144
3145 /* Worker function for TARGET_RETURN_IN_MEMORY. */
3146
3147 static bool
3148 mcore_return_in_memory (const_tree type, const_tree fntype ATTRIBUTE_UNUSED)
3149 {
3150 const HOST_WIDE_INT size = int_size_in_bytes (type);
3151 return (size == -1 || size > 2 * UNITS_PER_WORD);
3152 }
3153
3154 /* Worker function for TARGET_ASM_TRAMPOLINE_TEMPLATE.
3155 Output assembler code for a block containing the constant parts
3156 of a trampoline, leaving space for the variable parts.
3157
3158 On the MCore, the trampoline looks like:
3159 lrw r1, function
3160 lrw r13, area
3161 jmp r13
3162 or r0, r0
3163 .literals */
3164
3165 static void
3166 mcore_asm_trampoline_template (FILE *f)
3167 {
3168 fprintf (f, "\t.short 0x7102\n");
3169 fprintf (f, "\t.short 0x7d02\n");
3170 fprintf (f, "\t.short 0x00cd\n");
3171 fprintf (f, "\t.short 0x1e00\n");
3172 fprintf (f, "\t.long 0\n");
3173 fprintf (f, "\t.long 0\n");
3174 }
3175
3176 /* Worker function for TARGET_TRAMPOLINE_INIT. */
3177
3178 static void
3179 mcore_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value)
3180 {
3181 rtx fnaddr = XEXP (DECL_RTL (fndecl), 0);
3182 rtx mem;
3183
3184 emit_block_move (m_tramp, assemble_trampoline_template (),
3185 GEN_INT (2*UNITS_PER_WORD), BLOCK_OP_NORMAL);
3186
3187 mem = adjust_address (m_tramp, SImode, 8);
3188 emit_move_insn (mem, chain_value);
3189 mem = adjust_address (m_tramp, SImode, 12);
3190 emit_move_insn (mem, fnaddr);
3191 }
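/* Editorial sketch of the finished trampoline, assuming 4-byte words:
   bytes 0-7 hold the four 16-bit instructions copied from the template
   (2 * UNITS_PER_WORD bytes), the SImode word at offset 8 receives the
   static chain value and the word at offset 12 the address of FNDECL,
   filling the template's two ".long 0" literal slots.  */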
3192
3193 /* Implement TARGET_LEGITIMATE_CONSTANT_P
3194
3195 On the MCore, allow anything but a double. */
3196
3197 static bool
3198 mcore_legitimate_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
3199 {
3200 return GET_CODE (x) != CONST_DOUBLE;
3201 }