1 /* Output routines for Motorola MCore processor
2 Copyright (C) 1993, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2007, 2008,
3 2009 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published
9 by the Free Software Foundation; either version 3, or (at your
10 option) any later version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT
13 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
14 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
15 License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "tm_p.h"
28 #include "assert.h"
29 #include "mcore.h"
30 #include "regs.h"
31 #include "hard-reg-set.h"
32 #include "insn-config.h"
33 #include "conditions.h"
34 #include "output.h"
35 #include "insn-attr.h"
36 #include "flags.h"
37 #include "obstack.h"
38 #include "expr.h"
39 #include "reload.h"
40 #include "recog.h"
41 #include "function.h"
42 #include "ggc.h"
43 #include "toplev.h"
44 #include "target.h"
45 #include "target-def.h"
46 #include "df.h"
47
48 /* Maximum size we are allowed to grow the stack in a single operation.
49 If we want more, we must do it in increments of at most this size.
50 If this value is 0, we don't check at all. */
51 int mcore_stack_increment = STACK_UNITS_MAXSTEP;
52
53 /* For dumping information about frame sizes. */
54 char * mcore_current_function_name = 0;
55 long mcore_current_compilation_timestamp = 0;
56
57 /* Global variables for machine-dependent things. */
58
59 /* Provides the class number of the smallest class containing
60 reg number. */
61 const enum reg_class regno_reg_class[FIRST_PSEUDO_REGISTER] =
62 {
63 GENERAL_REGS, ONLYR1_REGS, LRW_REGS, LRW_REGS,
64 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
65 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
66 LRW_REGS, LRW_REGS, LRW_REGS, GENERAL_REGS,
67 GENERAL_REGS, C_REGS, NO_REGS, NO_REGS,
68 };
69
70 /* Provide reg_class from a letter such as appears in the machine
71 description. */
72 const enum reg_class reg_class_from_letter[] =
73 {
74 /* a */ LRW_REGS, /* b */ ONLYR1_REGS, /* c */ C_REGS, /* d */ NO_REGS,
75 /* e */ NO_REGS, /* f */ NO_REGS, /* g */ NO_REGS, /* h */ NO_REGS,
76 /* i */ NO_REGS, /* j */ NO_REGS, /* k */ NO_REGS, /* l */ NO_REGS,
77 /* m */ NO_REGS, /* n */ NO_REGS, /* o */ NO_REGS, /* p */ NO_REGS,
78 /* q */ NO_REGS, /* r */ GENERAL_REGS, /* s */ NO_REGS, /* t */ NO_REGS,
79 /* u */ NO_REGS, /* v */ NO_REGS, /* w */ NO_REGS, /* x */ ALL_REGS,
80 /* y */ NO_REGS, /* z */ NO_REGS
81 };
82
83 struct mcore_frame
84 {
85 int arg_size; /* Stdarg spills (bytes). */
86 int reg_size; /* Non-volatile reg saves (bytes). */
87 int reg_mask; /* Non-volatile reg saves. */
88 int local_size; /* Locals. */
89 int outbound_size; /* Arg overflow on calls out. */
90 int pad_outbound;
91 int pad_local;
92 int pad_reg;
93 /* Describe the steps we'll use to grow it. */
94 #define MAX_STACK_GROWS 4 /* Gives us some spare space. */
95 int growth[MAX_STACK_GROWS];
96 int arg_offset;
97 int reg_offset;
98 int reg_growth;
99 int local_growth;
100 };
101
102 typedef enum
103 {
104 COND_NO,
105 COND_MOV_INSN,
106 COND_CLR_INSN,
107 COND_INC_INSN,
108 COND_DEC_INSN,
109 COND_BRANCH_INSN
110 }
111 cond_type;
112
113 static void output_stack_adjust (int, int);
114 static int calc_live_regs (int *);
115 static int try_constant_tricks (long, HOST_WIDE_INT *, HOST_WIDE_INT *);
116 static const char * output_inline_const (enum machine_mode, rtx *);
117 static void layout_mcore_frame (struct mcore_frame *);
118 static void mcore_setup_incoming_varargs (CUMULATIVE_ARGS *, enum machine_mode, tree, int *, int);
119 static cond_type is_cond_candidate (rtx);
120 static rtx emit_new_cond_insn (rtx, int);
121 static rtx conditionalize_block (rtx);
122 static void conditionalize_optimization (void);
123 static void mcore_reorg (void);
124 static rtx handle_structs_in_regs (enum machine_mode, const_tree, int);
125 static void mcore_mark_dllexport (tree);
126 static void mcore_mark_dllimport (tree);
127 static int mcore_dllexport_p (tree);
128 static int mcore_dllimport_p (tree);
129 static tree mcore_handle_naked_attribute (tree *, tree, tree, int, bool *);
130 #ifdef OBJECT_FORMAT_ELF
131 static void mcore_asm_named_section (const char *,
132 unsigned int, tree);
133 #endif
134 static void mcore_print_operand (FILE *, rtx, int);
135 static void mcore_print_operand_address (FILE *, rtx);
136 static bool mcore_print_operand_punct_valid_p (unsigned char code);
137 static void mcore_unique_section (tree, int);
138 static void mcore_encode_section_info (tree, rtx, int);
139 static const char *mcore_strip_name_encoding (const char *);
140 static int mcore_const_costs (rtx, RTX_CODE);
141 static int mcore_and_cost (rtx);
142 static int mcore_ior_cost (rtx);
143 static bool mcore_rtx_costs (rtx, int, int, int *, bool);
144 static void mcore_external_libcall (rtx);
145 static bool mcore_return_in_memory (const_tree, const_tree);
146 static int mcore_arg_partial_bytes (CUMULATIVE_ARGS *,
147 enum machine_mode,
148 tree, bool);
149 static void mcore_asm_trampoline_template (FILE *);
150 static void mcore_trampoline_init (rtx, tree, rtx);
151 \f
152 /* MCore specific attributes. */
153
154 static const struct attribute_spec mcore_attribute_table[] =
155 {
156 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler } */
157 { "dllexport", 0, 0, true, false, false, NULL },
158 { "dllimport", 0, 0, true, false, false, NULL },
159 { "naked", 0, 0, true, false, false, mcore_handle_naked_attribute },
160 { NULL, 0, 0, false, false, false, NULL }
161 };
162 \f
163 /* Initialize the GCC target structure. */
164 #undef TARGET_ASM_EXTERNAL_LIBCALL
165 #define TARGET_ASM_EXTERNAL_LIBCALL mcore_external_libcall
166
167 #if TARGET_DLLIMPORT_DECL_ATTRIBUTES
168 #undef TARGET_MERGE_DECL_ATTRIBUTES
169 #define TARGET_MERGE_DECL_ATTRIBUTES merge_dllimport_decl_attributes
170 #endif
171
172 #ifdef OBJECT_FORMAT_ELF
173 #undef TARGET_ASM_UNALIGNED_HI_OP
174 #define TARGET_ASM_UNALIGNED_HI_OP "\t.short\t"
175 #undef TARGET_ASM_UNALIGNED_SI_OP
176 #define TARGET_ASM_UNALIGNED_SI_OP "\t.long\t"
177 #endif
178
179 #undef TARGET_PRINT_OPERAND
180 #define TARGET_PRINT_OPERAND mcore_print_operand
181 #undef TARGET_PRINT_OPERAND_ADDRESS
182 #define TARGET_PRINT_OPERAND_ADDRESS mcore_print_operand_address
183 #undef TARGET_PRINT_OPERAND_PUNCT_VALID_P
184 #define TARGET_PRINT_OPERAND_PUNCT_VALID_P mcore_print_operand_punct_valid_p
185
186 #undef TARGET_ATTRIBUTE_TABLE
187 #define TARGET_ATTRIBUTE_TABLE mcore_attribute_table
188 #undef TARGET_ASM_UNIQUE_SECTION
189 #define TARGET_ASM_UNIQUE_SECTION mcore_unique_section
190 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
191 #define TARGET_ASM_FUNCTION_RODATA_SECTION default_no_function_rodata_section
192 #undef TARGET_DEFAULT_TARGET_FLAGS
193 #define TARGET_DEFAULT_TARGET_FLAGS TARGET_DEFAULT
194 #undef TARGET_ENCODE_SECTION_INFO
195 #define TARGET_ENCODE_SECTION_INFO mcore_encode_section_info
196 #undef TARGET_STRIP_NAME_ENCODING
197 #define TARGET_STRIP_NAME_ENCODING mcore_strip_name_encoding
198 #undef TARGET_RTX_COSTS
199 #define TARGET_RTX_COSTS mcore_rtx_costs
200 #undef TARGET_ADDRESS_COST
201 #define TARGET_ADDRESS_COST hook_int_rtx_bool_0
202 #undef TARGET_MACHINE_DEPENDENT_REORG
203 #define TARGET_MACHINE_DEPENDENT_REORG mcore_reorg
204
205 #undef TARGET_PROMOTE_FUNCTION_MODE
206 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
207 #undef TARGET_PROMOTE_PROTOTYPES
208 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
209
210 #undef TARGET_RETURN_IN_MEMORY
211 #define TARGET_RETURN_IN_MEMORY mcore_return_in_memory
212 #undef TARGET_MUST_PASS_IN_STACK
213 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
214 #undef TARGET_PASS_BY_REFERENCE
215 #define TARGET_PASS_BY_REFERENCE hook_pass_by_reference_must_pass_in_stack
216 #undef TARGET_ARG_PARTIAL_BYTES
217 #define TARGET_ARG_PARTIAL_BYTES mcore_arg_partial_bytes
218
219 #undef TARGET_SETUP_INCOMING_VARARGS
220 #define TARGET_SETUP_INCOMING_VARARGS mcore_setup_incoming_varargs
221
222 #undef TARGET_ASM_TRAMPOLINE_TEMPLATE
223 #define TARGET_ASM_TRAMPOLINE_TEMPLATE mcore_asm_trampoline_template
224 #undef TARGET_TRAMPOLINE_INIT
225 #define TARGET_TRAMPOLINE_INIT mcore_trampoline_init
226
227 struct gcc_target targetm = TARGET_INITIALIZER;
228 \f
229 /* Adjust the stack by SIZE bytes; DIRECTION < 0 grows it, DIRECTION > 0 shrinks it. */
230 static void
231 output_stack_adjust (int direction, int size)
232 {
233 /* If extending stack a lot, we do it incrementally. */
234 if (direction < 0 && size > mcore_stack_increment && mcore_stack_increment > 0)
235 {
236 rtx tmp = gen_rtx_REG (SImode, 1);
237 rtx memref;
238
239 emit_insn (gen_movsi (tmp, GEN_INT (mcore_stack_increment)));
240 do
241 {
242 emit_insn (gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, tmp));
243 memref = gen_rtx_MEM (SImode, stack_pointer_rtx);
244 MEM_VOLATILE_P (memref) = 1;
245 emit_insn (gen_movsi (memref, stack_pointer_rtx));
246 size -= mcore_stack_increment;
247 }
248 while (size > mcore_stack_increment);
249
250 /* SIZE is now the residual for the last adjustment,
251 which doesn't require a probe. */
252 }
253
254 if (size)
255 {
256 rtx insn;
257 rtx val = GEN_INT (size);
258
259 if (size > 32)
260 {
261 rtx nval = gen_rtx_REG (SImode, 1);
262 emit_insn (gen_movsi (nval, val));
263 val = nval;
264 }
265
266 if (direction > 0)
267 insn = gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
268 else
269 insn = gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
270
271 emit_insn (insn);
272 }
273 }
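/* For illustration, assuming STACK_UNITS_MAXSTEP is 4096:
   output_stack_adjust (-1, 10000) emits two probed 4096-byte steps
   (subtract r1 from sp, then a volatile store of sp at (sp)) followed by a
   final 1808-byte subtraction, which is itself loaded into r1 first because
   it exceeds the 32-byte addi/subi reach.  */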
274
275 /* Work out the registers which need to be saved,
276 both as a mask and a count. */
277
278 static int
279 calc_live_regs (int * count)
280 {
281 int reg;
282 int live_regs_mask = 0;
283
284 * count = 0;
285
286 for (reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
287 {
288 if (df_regs_ever_live_p (reg) && !call_used_regs[reg])
289 {
290 (*count)++;
291 live_regs_mask |= (1 << reg);
292 }
293 }
294
295 return live_regs_mask;
296 }
297
298 /* Print the operand address in x to the stream. */
299
300 static void
301 mcore_print_operand_address (FILE * stream, rtx x)
302 {
303 switch (GET_CODE (x))
304 {
305 case REG:
306 fprintf (stream, "(%s)", reg_names[REGNO (x)]);
307 break;
308
309 case PLUS:
310 {
311 rtx base = XEXP (x, 0);
312 rtx index = XEXP (x, 1);
313
314 if (GET_CODE (base) != REG)
315 {
316 /* Ensure that BASE is a register (one of them must be). */
317 rtx temp = base;
318 base = index;
319 index = temp;
320 }
321
322 switch (GET_CODE (index))
323 {
324 case CONST_INT:
325 fprintf (stream, "(%s," HOST_WIDE_INT_PRINT_DEC ")",
326 reg_names[REGNO(base)], INTVAL (index));
327 break;
328
329 default:
330 gcc_unreachable ();
331 }
332 }
333
334 break;
335
336 default:
337 output_addr_const (stream, x);
338 break;
339 }
340 }
341
342 static bool
343 mcore_print_operand_punct_valid_p (unsigned char code)
344 {
345 return (code == '.' || code == '#' || code == '*' || code == '^'
346 || code == '!');
347 }
348
349 /* Print operand x (an rtx) in assembler syntax to file stream
350 according to modifier code.
351
352 'R' print the next register or memory location along, i.e. the lsw in
353 a double word value
354 'O' print a constant without the #
355 'M' print a constant as its negative
356 'P' print log2 of a power of two
357 'Q' print log2 of an inverse of a power of two
358 'U' print register for ldm/stm instruction
359 'X' print byte number for xtrbN instruction. */
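/* The code below also handles 'N' (print 32 for -1, otherwise log2 of the
   value plus one, i.e. the bmaski width) and 'x' (print the constant in
   hex).  For illustration, with operand (const_int 8): %P prints 3, %M
   prints -8 and %O prints 8; with (const_int -1), %N prints 32.  */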
360
361 static void
362 mcore_print_operand (FILE * stream, rtx x, int code)
363 {
364 switch (code)
365 {
366 case 'N':
367 if (INTVAL(x) == -1)
368 fprintf (asm_out_file, "32");
369 else
370 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) + 1));
371 break;
372 case 'P':
373 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) & 0xffffffff));
374 break;
375 case 'Q':
376 fprintf (asm_out_file, "%d", exact_log2 (~INTVAL (x)));
377 break;
378 case 'O':
379 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, INTVAL (x));
380 break;
381 case 'M':
382 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, - INTVAL (x));
383 break;
384 case 'R':
385 /* Next location along in memory or register. */
386 switch (GET_CODE (x))
387 {
388 case REG:
389 fputs (reg_names[REGNO (x) + 1], (stream));
390 break;
391 case MEM:
392 mcore_print_operand_address
393 (stream, XEXP (adjust_address (x, SImode, 4), 0));
394 break;
395 default:
396 gcc_unreachable ();
397 }
398 break;
399 case 'U':
400 fprintf (asm_out_file, "%s-%s", reg_names[REGNO (x)],
401 reg_names[REGNO (x) + 3]);
402 break;
403 case 'x':
404 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_HEX, INTVAL (x));
405 break;
406 case 'X':
407 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, 3 - INTVAL (x) / 8);
408 break;
409
410 default:
411 switch (GET_CODE (x))
412 {
413 case REG:
414 fputs (reg_names[REGNO (x)], (stream));
415 break;
416 case MEM:
417 output_address (XEXP (x, 0));
418 break;
419 default:
420 output_addr_const (stream, x);
421 break;
422 }
423 break;
424 }
425 }
426
427 /* What does a constant cost? */
428
429 static int
430 mcore_const_costs (rtx exp, enum rtx_code code)
431 {
432 HOST_WIDE_INT val = INTVAL (exp);
433
434 /* Easy constants. */
435 if ( CONST_OK_FOR_I (val)
436 || CONST_OK_FOR_M (val)
437 || CONST_OK_FOR_N (val)
438 || (code == PLUS && CONST_OK_FOR_L (val)))
439 return 1;
440 else if (code == AND
441 && ( CONST_OK_FOR_M (~val)
442 || CONST_OK_FOR_N (~val)))
443 return 2;
444 else if (code == PLUS
445 && ( CONST_OK_FOR_I (-val)
446 || CONST_OK_FOR_M (-val)
447 || CONST_OK_FOR_N (-val)))
448 return 2;
449
450 return 5;
451 }
452
453 /* What does an AND instruction cost?  We account for this because immediates
454 may have been relaxed.  We want to ensure that CSE will CSE relaxed immediates
455 out; otherwise we will get bad code (multiple reloads of the same const). */
456
457 static int
458 mcore_and_cost (rtx x)
459 {
460 HOST_WIDE_INT val;
461
462 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
463 return 2;
464
465 val = INTVAL (XEXP (x, 1));
466
467 /* Do it directly. */
468 if (CONST_OK_FOR_K (val) || CONST_OK_FOR_M (~val))
469 return 2;
470 /* Takes one instruction to load. */
471 else if (const_ok_for_mcore (val))
472 return 3;
473 /* Takes two instructions to load. */
474 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
475 return 4;
476
477 /* Takes a lrw to load. */
478 return 5;
479 }
480
481 /* What does an IOR cost?  See mcore_and_cost above. */
482
483 static int
484 mcore_ior_cost (rtx x)
485 {
486 HOST_WIDE_INT val;
487
488 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
489 return 2;
490
491 val = INTVAL (XEXP (x, 1));
492
493 /* Do it directly with bclri. */
494 if (CONST_OK_FOR_M (val))
495 return 2;
496 /* Takes one instruction to load. */
497 else if (const_ok_for_mcore (val))
498 return 3;
499 /* Takes two instructions to load. */
500 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
501 return 4;
502
503 /* Takes a lrw to load. */
504 return 5;
505 }
506
507 static bool
508 mcore_rtx_costs (rtx x, int code, int outer_code, int * total,
509 bool speed ATTRIBUTE_UNUSED)
510 {
511 switch (code)
512 {
513 case CONST_INT:
514 *total = mcore_const_costs (x, (enum rtx_code) outer_code);
515 return true;
516 case CONST:
517 case LABEL_REF:
518 case SYMBOL_REF:
519 *total = 5;
520 return true;
521 case CONST_DOUBLE:
522 *total = 10;
523 return true;
524
525 case AND:
526 *total = COSTS_N_INSNS (mcore_and_cost (x));
527 return true;
528
529 case IOR:
530 *total = COSTS_N_INSNS (mcore_ior_cost (x));
531 return true;
532
533 case DIV:
534 case UDIV:
535 case MOD:
536 case UMOD:
537 case FLOAT:
538 case FIX:
539 *total = COSTS_N_INSNS (100);
540 return true;
541
542 default:
543 return false;
544 }
545 }
546
547 /* Prepare the operands for a comparison. Return whether the branch/setcc
548 should reverse the operands. */
549
550 bool
551 mcore_gen_compare (enum rtx_code code, rtx op0, rtx op1)
552 {
553 rtx cc_reg = gen_rtx_REG (CCmode, CC_REG);
554 bool invert;
555
556 if (GET_CODE (op1) == CONST_INT)
557 {
558 HOST_WIDE_INT val = INTVAL (op1);
559
560 switch (code)
561 {
562 case GTU:
563 /* Unsigned > 0 is the same as != 0; everything else is converted
564 below to LEU (reversed cmphs). */
565 if (val == 0)
566 code = NE;
567 break;
568
569 /* Check whether (LE A imm) can become (LT A imm + 1),
570 or (GT A imm) can become (GE A imm + 1). */
571 case GT:
572 case LE:
573 if (CONST_OK_FOR_J (val + 1))
574 {
575 op1 = GEN_INT (val + 1);
576 code = code == LE ? LT : GE;
577 }
578 break;
579
580 default:
581 break;
582 }
583 }
584
585 if (CONSTANT_P (op1) && GET_CODE (op1) != CONST_INT)
586 op1 = force_reg (SImode, op1);
587
588 /* cmpnei: 0-31 (K immediate)
589 cmplti: 1-32 (J immediate, 0 using btsti x,31). */
590 invert = false;
591 switch (code)
592 {
593 case EQ: /* Use inverted condition, cmpne. */
594 code = NE;
595 invert = true;
596 /* Drop through. */
597
598 case NE: /* Use normal condition, cmpne. */
599 if (GET_CODE (op1) == CONST_INT && ! CONST_OK_FOR_K (INTVAL (op1)))
600 op1 = force_reg (SImode, op1);
601 break;
602
603 case LE: /* Use inverted condition, reversed cmplt. */
604 code = GT;
605 invert = true;
606 /* Drop through. */
607
608 case GT: /* Use normal condition, reversed cmplt. */
609 if (GET_CODE (op1) == CONST_INT)
610 op1 = force_reg (SImode, op1);
611 break;
612
613 case GE: /* Use inverted condition, cmplt. */
614 code = LT;
615 invert = true;
616 /* Drop through. */
617
618 case LT: /* Use normal condition, cmplt. */
619 if (GET_CODE (op1) == CONST_INT &&
620 /* covered by btsti x,31. */
621 INTVAL (op1) != 0 &&
622 ! CONST_OK_FOR_J (INTVAL (op1)))
623 op1 = force_reg (SImode, op1);
624 break;
625
626 case GTU: /* Use inverted condition, cmple. */
627 /* We coped with unsigned > 0 above. */
628 gcc_assert (GET_CODE (op1) != CONST_INT || INTVAL (op1) != 0);
629 code = LEU;
630 invert = true;
631 /* Drop through. */
632
633 case LEU: /* Use normal condition, reversed cmphs. */
634 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
635 op1 = force_reg (SImode, op1);
636 break;
637
638 case LTU: /* Use inverted condition, cmphs. */
639 code = GEU;
640 invert = true;
641 /* Drop through. */
642
643 case GEU: /* Use normal condition, cmphs. */
644 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
645 op1 = force_reg (SImode, op1);
646 break;
647
648 default:
649 break;
650 }
651
652 emit_insn (gen_rtx_SET (VOIDmode,
653 cc_reg,
654 gen_rtx_fmt_ee (code, CCmode, op0, op1)));
655 return invert;
656 }
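/* Worked example of the rewriting above: for "rX <= 10" the first switch
   turns (le rX 10) into (lt rX 11), since 11 fits the J immediate, and the
   second switch keeps LT as a normal (non-inverted) condition, so the test
   can be emitted as a single cmplti with no inversion of the branch.  */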
657
658 int
659 mcore_symbolic_address_p (rtx x)
660 {
661 switch (GET_CODE (x))
662 {
663 case SYMBOL_REF:
664 case LABEL_REF:
665 return 1;
666 case CONST:
667 x = XEXP (x, 0);
668 return ( (GET_CODE (XEXP (x, 0)) == SYMBOL_REF
669 || GET_CODE (XEXP (x, 0)) == LABEL_REF)
670 && GET_CODE (XEXP (x, 1)) == CONST_INT);
671 default:
672 return 0;
673 }
674 }
675
676 /* Functions to output assembly code for a function call. */
677
678 char *
679 mcore_output_call (rtx operands[], int index)
680 {
681 static char buffer[20];
682 rtx addr = operands [index];
683
684 if (REG_P (addr))
685 {
686 if (TARGET_CG_DATA)
687 {
688 gcc_assert (mcore_current_function_name);
689
690 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
691 "unknown", 1);
692 }
693
694 sprintf (buffer, "jsr\t%%%d", index);
695 }
696 else
697 {
698 if (TARGET_CG_DATA)
699 {
700 gcc_assert (mcore_current_function_name);
701 gcc_assert (GET_CODE (addr) == SYMBOL_REF);
702
703 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
704 XSTR (addr, 0), 0);
705 }
706
707 sprintf (buffer, "jbsr\t%%%d", index);
708 }
709
710 return buffer;
711 }
712
713 /* Can we load a constant with a single instruction? */
714
715 int
716 const_ok_for_mcore (HOST_WIDE_INT value)
717 {
718 if (value >= 0 && value <= 127)
719 return 1;
720
721 /* Try exact power of two. */
722 if (CONST_OK_FOR_M (value))
723 return 1;
724
725 /* Try exact power of two - 1. */
726 if (CONST_OK_FOR_N (value) && value != -1)
727 return 1;
728
729 return 0;
730 }
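/* For illustration: 100 (movi range), 0x800 (an exact power of two, bgeni)
   and 0x7fff (a power of two minus one, bmaski) can each be loaded in one
   instruction, whereas 200 fits none of these cases.  */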
731
732 /* Can we load a constant inline with up to 2 instructions? */
733
734 int
735 mcore_const_ok_for_inline (HOST_WIDE_INT value)
736 {
737 HOST_WIDE_INT x, y;
738
739 return try_constant_tricks (value, & x, & y) > 0;
740 }
741
742 /* Are we loading the constant using a 'not'? */
743
744 int
745 mcore_const_trick_uses_not (HOST_WIDE_INT value)
746 {
747 HOST_WIDE_INT x, y;
748
749 return try_constant_tricks (value, & x, & y) == 2;
750 }
751
752 /* Try tricks to load a constant inline and return the trick number if
753 success (0 is non-inlinable).
754
755 0: not inlinable
756 1: single instruction (do the usual thing)
757 2: single insn followed by a 'not'
758 3: single insn followed by a subi
759 4: single insn followed by an addi
760 5: single insn followed by rsubi
761 6: single insn followed by bseti
762 7: single insn followed by bclri
763 8: single insn followed by rotli
764 9: single insn followed by lsli
765 10: single insn followed by ixh
766 11: single insn followed by ixw. */
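/* A worked example (assuming TARGET_HARDLIT): for the value 2000 none of
   tricks 1-7 apply, but rotating 2000 right by four bit positions gives
   125, which movi can load, so the function returns 8 with *x = 125 and
   *y = 4; the emitted sequence is then "movi rd,125" / "rotli rd,4",
   where rd stands for the destination register.  */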
767
768 static int
769 try_constant_tricks (HOST_WIDE_INT value, HOST_WIDE_INT * x, HOST_WIDE_INT * y)
770 {
771 HOST_WIDE_INT i;
772 unsigned HOST_WIDE_INT bit, shf, rot;
773
774 if (const_ok_for_mcore (value))
775 return 1; /* Do the usual thing. */
776
777 if (! TARGET_HARDLIT)
778 return 0;
779
780 if (const_ok_for_mcore (~value))
781 {
782 *x = ~value;
783 return 2;
784 }
785
786 for (i = 1; i <= 32; i++)
787 {
788 if (const_ok_for_mcore (value - i))
789 {
790 *x = value - i;
791 *y = i;
792
793 return 3;
794 }
795
796 if (const_ok_for_mcore (value + i))
797 {
798 *x = value + i;
799 *y = i;
800
801 return 4;
802 }
803 }
804
805 bit = 0x80000000ULL;
806
807 for (i = 0; i <= 31; i++)
808 {
809 if (const_ok_for_mcore (i - value))
810 {
811 *x = i - value;
812 *y = i;
813
814 return 5;
815 }
816
817 if (const_ok_for_mcore (value & ~bit))
818 {
819 *y = bit;
820 *x = value & ~bit;
821 return 6;
822 }
823
824 if (const_ok_for_mcore (value | bit))
825 {
826 *y = ~bit;
827 *x = value | bit;
828
829 return 7;
830 }
831
832 bit >>= 1;
833 }
834
835 shf = value;
836 rot = value;
837
838 for (i = 1; i < 31; i++)
839 {
840 int c;
841
842 /* MCore has rotate left. */
843 c = rot << 31;
844 rot >>= 1;
845 rot &= 0x7FFFFFFF;
846 rot |= c; /* Simulate rotate. */
847
848 if (const_ok_for_mcore (rot))
849 {
850 *y = i;
851 *x = rot;
852
853 return 8;
854 }
855
856 if (shf & 1)
857 shf = 0; /* Can't use logical shift, low order bit is one. */
858
859 shf >>= 1;
860
861 if (shf != 0 && const_ok_for_mcore (shf))
862 {
863 *y = i;
864 *x = shf;
865
866 return 9;
867 }
868 }
869
870 if ((value % 3) == 0 && const_ok_for_mcore (value / 3))
871 {
872 *x = value / 3;
873
874 return 10;
875 }
876
877 if ((value % 5) == 0 && const_ok_for_mcore (value / 5))
878 {
879 *x = value / 5;
880
881 return 11;
882 }
883
884 return 0;
885 }
886
887 /* Check whether REG is dead at insn FIRST. This is done by searching ahead
888 for either the next use (i.e., REG is live), a death note, or a set of
889 REG. Don't just use dead_or_set_p() since reload does not always mark
890 deaths (especially if PRESERVE_DEATH_NOTES_REGNO_P is not defined). We
891 can ignore subregs by extracting the actual register. BRC */
892
893 int
894 mcore_is_dead (rtx first, rtx reg)
895 {
896 rtx insn;
897
898 /* For mcore, subregs can't live independently of their parent regs. */
899 if (GET_CODE (reg) == SUBREG)
900 reg = SUBREG_REG (reg);
901
902 /* Dies immediately. */
903 if (dead_or_set_p (first, reg))
904 return 1;
905
906 /* Look for conclusive evidence of live/death, otherwise we have
907 to assume that it is live. */
908 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
909 {
910 if (GET_CODE (insn) == JUMP_INSN)
911 return 0; /* We lose track, assume it is alive. */
912
913 else if (GET_CODE(insn) == CALL_INSN)
914 {
915 /* Calls might use it for the target or for register parms. */
916 if (reg_referenced_p (reg, PATTERN (insn))
917 || find_reg_fusage (insn, USE, reg))
918 return 0;
919 else if (dead_or_set_p (insn, reg))
920 return 1;
921 }
922 else if (GET_CODE (insn) == INSN)
923 {
924 if (reg_referenced_p (reg, PATTERN (insn)))
925 return 0;
926 else if (dead_or_set_p (insn, reg))
927 return 1;
928 }
929 }
930
931 /* No conclusive evidence either way, we cannot take the chance
932 that control flow hid the use from us -- "I'm not dead yet". */
933 return 0;
934 }
935
936 /* Count the number of ones in mask. */
937
938 int
939 mcore_num_ones (HOST_WIDE_INT mask)
940 {
941 /* A trick to count set bits recently posted on comp.compilers. */
942 mask = (mask >> 1 & 0x55555555) + (mask & 0x55555555);
943 mask = ((mask >> 2) & 0x33333333) + (mask & 0x33333333);
944 mask = ((mask >> 4) + mask) & 0x0f0f0f0f;
945 mask = ((mask >> 8) + mask);
946
947 return (mask + (mask >> 16)) & 0xff;
948 }
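/* Illustrative check of the folding above: for mask = 0xff00ffff the
   pairwise, nibble, byte and halfword sums collapse to 24, so
   mcore_num_ones returns 24 and mcore_num_zeros below returns 8.  */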
949
950 /* Count the number of zeros in mask. */
951
952 int
953 mcore_num_zeros (HOST_WIDE_INT mask)
954 {
955 return 32 - mcore_num_ones (mask);
956 }
957
958 /* Determine byte being masked. */
959
960 int
961 mcore_byte_offset (unsigned int mask)
962 {
963 if (mask == 0x00ffffffL)
964 return 0;
965 else if (mask == 0xff00ffffL)
966 return 1;
967 else if (mask == 0xffff00ffL)
968 return 2;
969 else if (mask == 0xffffff00L)
970 return 3;
971
972 return -1;
973 }
974
975 /* Determine halfword being masked. */
976
977 int
978 mcore_halfword_offset (unsigned int mask)
979 {
980 if (mask == 0x0000ffffL)
981 return 0;
982 else if (mask == 0xffff0000L)
983 return 1;
984
985 return -1;
986 }
987
988 /* Output a series of bseti's corresponding to mask. */
989
990 const char *
991 mcore_output_bseti (rtx dst, int mask)
992 {
993 rtx out_operands[2];
994 int bit;
995
996 out_operands[0] = dst;
997
998 for (bit = 0; bit < 32; bit++)
999 {
1000 if ((mask & 0x1) == 0x1)
1001 {
1002 out_operands[1] = GEN_INT (bit);
1003
1004 output_asm_insn ("bseti\t%0,%1", out_operands);
1005 }
1006 mask >>= 1;
1007 }
1008
1009 return "";
1010 }
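/* For example, a mask of 0x22 has bits 1 and 5 set, so the loop above
   emits "bseti dst,1" followed by "bseti dst,5", where dst is the
   destination register.  */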
1011
1012 /* Output a series of bclri's corresponding to mask. */
1013
1014 const char *
1015 mcore_output_bclri (rtx dst, int mask)
1016 {
1017 rtx out_operands[2];
1018 int bit;
1019
1020 out_operands[0] = dst;
1021
1022 for (bit = 0; bit < 32; bit++)
1023 {
1024 if ((mask & 0x1) == 0x0)
1025 {
1026 out_operands[1] = GEN_INT (bit);
1027
1028 output_asm_insn ("bclri\t%0,%1", out_operands);
1029 }
1030
1031 mask >>= 1;
1032 }
1033
1034 return "";
1035 }
1036
1037 /* Output a conditional move of two constants that are within +/- 1 of
1038 each other. See the "movtK" patterns in mcore.md. I'm not sure this is
1039 really worth the effort. */
1040
1041 const char *
1042 mcore_output_cmov (rtx operands[], int cmp_t, const char * test)
1043 {
1044 HOST_WIDE_INT load_value;
1045 HOST_WIDE_INT adjust_value;
1046 rtx out_operands[4];
1047
1048 out_operands[0] = operands[0];
1049
1050 /* Check to see which constant is loadable. */
1051 if (const_ok_for_mcore (INTVAL (operands[1])))
1052 {
1053 out_operands[1] = operands[1];
1054 out_operands[2] = operands[2];
1055 }
1056 else if (const_ok_for_mcore (INTVAL (operands[2])))
1057 {
1058 out_operands[1] = operands[2];
1059 out_operands[2] = operands[1];
1060
1061 /* Complement test since constants are swapped. */
1062 cmp_t = (cmp_t == 0);
1063 }
1064 load_value = INTVAL (out_operands[1]);
1065 adjust_value = INTVAL (out_operands[2]);
1066
1067 /* First output the test if folded into the pattern. */
1068
1069 if (test)
1070 output_asm_insn (test, operands);
1071
1072 /* Load the constant - for now, only support constants that can be
1073 generated with a single instruction.  Maybe add general inlinable
1074 constants later (this will increase the # of patterns since the
1075 instruction sequence has a different length attribute). */
1076 if (load_value >= 0 && load_value <= 127)
1077 output_asm_insn ("movi\t%0,%1", out_operands);
1078 else if (CONST_OK_FOR_M (load_value))
1079 output_asm_insn ("bgeni\t%0,%P1", out_operands);
1080 else if (CONST_OK_FOR_N (load_value))
1081 output_asm_insn ("bmaski\t%0,%N1", out_operands);
1082
1083 /* Output the constant adjustment. */
1084 if (load_value > adjust_value)
1085 {
1086 if (cmp_t)
1087 output_asm_insn ("decf\t%0", out_operands);
1088 else
1089 output_asm_insn ("dect\t%0", out_operands);
1090 }
1091 else
1092 {
1093 if (cmp_t)
1094 output_asm_insn ("incf\t%0", out_operands);
1095 else
1096 output_asm_insn ("inct\t%0", out_operands);
1097 }
1098
1099 return "";
1100 }
1101
1102 /* Outputs the peephole for moving a constant that gets not'ed followed
1103 by an and (i.e. combine the not and the and into andn). BRC */
1104
1105 const char *
1106 mcore_output_andn (rtx insn ATTRIBUTE_UNUSED, rtx operands[])
1107 {
1108 HOST_WIDE_INT x, y;
1109 rtx out_operands[3];
1110 const char * load_op;
1111 char buf[256];
1112 int trick_no;
1113
1114 trick_no = try_constant_tricks (INTVAL (operands[1]), &x, &y);
1115 gcc_assert (trick_no == 2);
1116
1117 out_operands[0] = operands[0];
1118 out_operands[1] = GEN_INT (x);
1119 out_operands[2] = operands[2];
1120
1121 if (x >= 0 && x <= 127)
1122 load_op = "movi\t%0,%1";
1123
1124 /* Try exact power of two. */
1125 else if (CONST_OK_FOR_M (x))
1126 load_op = "bgeni\t%0,%P1";
1127
1128 /* Try exact power of two - 1. */
1129 else if (CONST_OK_FOR_N (x))
1130 load_op = "bmaski\t%0,%N1";
1131
1132 else
1133 {
1134 load_op = "BADMOVI-andn\t%0, %1";
1135 gcc_unreachable ();
1136 }
1137
1138 sprintf (buf, "%s\n\tandn\t%%2,%%0", load_op);
1139 output_asm_insn (buf, out_operands);
1140
1141 return "";
1142 }
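/* Illustrative example: if operands[1] is 0xfffffffb (i.e. ~4), trick 2
   applies with x = 4, so the peephole emits "movi %0,4" followed by
   "andn %2,%0", clearing bit 2 of operand 2 without a literal-pool load.  */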
1143
1144 /* Output an inline constant. */
1145
1146 static const char *
1147 output_inline_const (enum machine_mode mode, rtx operands[])
1148 {
1149 HOST_WIDE_INT x = 0, y = 0;
1150 int trick_no;
1151 rtx out_operands[3];
1152 char buf[256];
1153 char load_op[256];
1154 const char *dst_fmt;
1155 HOST_WIDE_INT value;
1156
1157 value = INTVAL (operands[1]);
1158
1159 trick_no = try_constant_tricks (value, &x, &y);
1160 /* lrw's are handled separately: Large inlinable constants never get
1161 turned into lrw's. Our caller uses try_constant_tricks to back
1162 off to an lrw rather than calling this routine. */
1163 gcc_assert (trick_no != 0);
1164
1165 if (trick_no == 1)
1166 x = value;
1167
1168 /* operands: 0 = dst, 1 = load immed., 2 = immed. adjustment. */
1169 out_operands[0] = operands[0];
1170 out_operands[1] = GEN_INT (x);
1171
1172 if (trick_no > 2)
1173 out_operands[2] = GEN_INT (y);
1174
1175 /* Select dst format based on mode. */
1176 if (mode == DImode && (! TARGET_LITTLE_END))
1177 dst_fmt = "%R0";
1178 else
1179 dst_fmt = "%0";
1180
1181 if (x >= 0 && x <= 127)
1182 sprintf (load_op, "movi\t%s,%%1", dst_fmt);
1183
1184 /* Try exact power of two. */
1185 else if (CONST_OK_FOR_M (x))
1186 sprintf (load_op, "bgeni\t%s,%%P1", dst_fmt);
1187
1188 /* Try exact power of two - 1. */
1189 else if (CONST_OK_FOR_N (x))
1190 sprintf (load_op, "bmaski\t%s,%%N1", dst_fmt);
1191
1192 else
1193 {
1194 sprintf (load_op, "BADMOVI-inline_const %s, %%1", dst_fmt);
1195 gcc_unreachable ();
1196 }
1197
1198 switch (trick_no)
1199 {
1200 case 1:
1201 strcpy (buf, load_op);
1202 break;
1203 case 2: /* not */
1204 sprintf (buf, "%s\n\tnot\t%s\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1205 break;
1206 case 3: /* add */
1207 sprintf (buf, "%s\n\taddi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1208 break;
1209 case 4: /* sub */
1210 sprintf (buf, "%s\n\tsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1211 break;
1212 case 5: /* rsub */
1213 /* Never happens unless -mrsubi, see try_constant_tricks(). */
1214 sprintf (buf, "%s\n\trsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1215 break;
1216 case 6: /* bseti */
1217 sprintf (buf, "%s\n\tbseti\t%s,%%P2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1218 break;
1219 case 7: /* bclr */
1220 sprintf (buf, "%s\n\tbclri\t%s,%%Q2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1221 break;
1222 case 8: /* rotl */
1223 sprintf (buf, "%s\n\trotli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1224 break;
1225 case 9: /* lsl */
1226 sprintf (buf, "%s\n\tlsli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1227 break;
1228 case 10: /* ixh */
1229 sprintf (buf, "%s\n\tixh\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1230 break;
1231 case 11: /* ixw */
1232 sprintf (buf, "%s\n\tixw\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1233 break;
1234 default:
1235 return "";
1236 }
1237
1238 output_asm_insn (buf, out_operands);
1239
1240 return "";
1241 }
1242
1243 /* Output a move of a word or less value. */
1244
1245 const char *
1246 mcore_output_move (rtx insn ATTRIBUTE_UNUSED, rtx operands[],
1247 enum machine_mode mode ATTRIBUTE_UNUSED)
1248 {
1249 rtx dst = operands[0];
1250 rtx src = operands[1];
1251
1252 if (GET_CODE (dst) == REG)
1253 {
1254 if (GET_CODE (src) == REG)
1255 {
1256 if (REGNO (src) == CC_REG) /* r-c */
1257 return "mvc\t%0";
1258 else
1259 return "mov\t%0,%1"; /* r-r*/
1260 }
1261 else if (GET_CODE (src) == MEM)
1262 {
1263 if (GET_CODE (XEXP (src, 0)) == LABEL_REF)
1264 return "lrw\t%0,[%1]"; /* a-R */
1265 else
1266 switch (GET_MODE (src)) /* r-m */
1267 {
1268 case SImode:
1269 return "ldw\t%0,%1";
1270 case HImode:
1271 return "ld.h\t%0,%1";
1272 case QImode:
1273 return "ld.b\t%0,%1";
1274 default:
1275 gcc_unreachable ();
1276 }
1277 }
1278 else if (GET_CODE (src) == CONST_INT)
1279 {
1280 HOST_WIDE_INT x, y;
1281
1282 if (CONST_OK_FOR_I (INTVAL (src))) /* r-I */
1283 return "movi\t%0,%1";
1284 else if (CONST_OK_FOR_M (INTVAL (src))) /* r-M */
1285 return "bgeni\t%0,%P1\t// %1 %x1";
1286 else if (CONST_OK_FOR_N (INTVAL (src))) /* r-N */
1287 return "bmaski\t%0,%N1\t// %1 %x1";
1288 else if (try_constant_tricks (INTVAL (src), &x, &y)) /* R-P */
1289 return output_inline_const (SImode, operands); /* 1-2 insns */
1290 else
1291 return "lrw\t%0,%x1\t// %1"; /* Get it from literal pool. */
1292 }
1293 else
1294 return "lrw\t%0, %1"; /* Into the literal pool. */
1295 }
1296 else if (GET_CODE (dst) == MEM) /* m-r */
1297 switch (GET_MODE (dst))
1298 {
1299 case SImode:
1300 return "stw\t%1,%0";
1301 case HImode:
1302 return "st.h\t%1,%0";
1303 case QImode:
1304 return "st.b\t%1,%0";
1305 default:
1306 gcc_unreachable ();
1307 }
1308
1309 gcc_unreachable ();
1310 }
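/* Some illustrative outputs from the routine above: a register-to-register
   SImode copy yields "mov %0,%1", loading the constant 100 yields
   "movi %0,100", while a constant such as 0x12345 matches none of the
   inline tricks and falls back to an lrw from the literal pool.  */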
1311
1312 /* Return a sequence of instructions to perform DI or DF move.
1313 Since the MCORE cannot move a DI or DF in one instruction, we have
1314 to take care when we see overlapping source and dest registers. */
1315
1316 const char *
1317 mcore_output_movedouble (rtx operands[], enum machine_mode mode ATTRIBUTE_UNUSED)
1318 {
1319 rtx dst = operands[0];
1320 rtx src = operands[1];
1321
1322 if (GET_CODE (dst) == REG)
1323 {
1324 if (GET_CODE (src) == REG)
1325 {
1326 int dstreg = REGNO (dst);
1327 int srcreg = REGNO (src);
1328
1329 /* Ensure the second source is not overwritten. */
1330 if (srcreg + 1 == dstreg)
1331 return "mov %R0,%R1\n\tmov %0,%1";
1332 else
1333 return "mov %0,%1\n\tmov %R0,%R1";
1334 }
1335 else if (GET_CODE (src) == MEM)
1336 {
1337 rtx memexp = XEXP (src, 0);
1338 int dstreg = REGNO (dst);
1339 int basereg = -1;
1340
1341 if (GET_CODE (memexp) == LABEL_REF)
1342 return "lrw\t%0,[%1]\n\tlrw\t%R0,[%R1]";
1343 else if (GET_CODE (memexp) == REG)
1344 basereg = REGNO (memexp);
1345 else if (GET_CODE (memexp) == PLUS)
1346 {
1347 if (GET_CODE (XEXP (memexp, 0)) == REG)
1348 basereg = REGNO (XEXP (memexp, 0));
1349 else if (GET_CODE (XEXP (memexp, 1)) == REG)
1350 basereg = REGNO (XEXP (memexp, 1));
1351 else
1352 gcc_unreachable ();
1353 }
1354 else
1355 gcc_unreachable ();
1356
1357 /* ??? length attribute is wrong here. */
1358 if (dstreg == basereg)
1359 {
1360 /* Just load them in reverse order. */
1361 return "ldw\t%R0,%R1\n\tldw\t%0,%1";
1362
1363 /* XXX: alternative: move basereg to basereg+1
1364 and then fall through. */
1365 }
1366 else
1367 return "ldw\t%0,%1\n\tldw\t%R0,%R1";
1368 }
1369 else if (GET_CODE (src) == CONST_INT)
1370 {
1371 if (TARGET_LITTLE_END)
1372 {
1373 if (CONST_OK_FOR_I (INTVAL (src)))
1374 output_asm_insn ("movi %0,%1", operands);
1375 else if (CONST_OK_FOR_M (INTVAL (src)))
1376 output_asm_insn ("bgeni %0,%P1", operands);
1377 else if (CONST_OK_FOR_N (INTVAL (src)))
1378 output_asm_insn ("bmaski %0,%N1", operands);
1379 else
1380 gcc_unreachable ();
1381
1382 if (INTVAL (src) < 0)
1383 return "bmaski %R0,32";
1384 else
1385 return "movi %R0,0";
1386 }
1387 else
1388 {
1389 if (CONST_OK_FOR_I (INTVAL (src)))
1390 output_asm_insn ("movi %R0,%1", operands);
1391 else if (CONST_OK_FOR_M (INTVAL (src)))
1392 output_asm_insn ("bgeni %R0,%P1", operands);
1393 else if (CONST_OK_FOR_N (INTVAL (src)))
1394 output_asm_insn ("bmaski %R0,%N1", operands);
1395 else
1396 gcc_unreachable ();
1397
1398 if (INTVAL (src) < 0)
1399 return "bmaski %0,32";
1400 else
1401 return "movi %0,0";
1402 }
1403 }
1404 else
1405 gcc_unreachable ();
1406 }
1407 else if (GET_CODE (dst) == MEM && GET_CODE (src) == REG)
1408 return "stw\t%1,%0\n\tstw\t%R1,%R0";
1409 else
1410 gcc_unreachable ();
1411 }
1412
1413 /* Predicates used by the templates. */
1414
1415 int
1416 mcore_arith_S_operand (rtx op)
1417 {
1418 if (GET_CODE (op) == CONST_INT && CONST_OK_FOR_M (~INTVAL (op)))
1419 return 1;
1420
1421 return 0;
1422 }
1423
1424 /* Expand insert bit field. BRC */
1425
1426 int
1427 mcore_expand_insv (rtx operands[])
1428 {
1429 int width = INTVAL (operands[1]);
1430 int posn = INTVAL (operands[2]);
1431 int mask;
1432 rtx mreg, sreg, ereg;
1433
1434 /* To get width 1 insv, the test in store_bit_field() (expmed.c, line 191)
1435 for width==1 must be removed. Look around line 368. This is something
1436 we really want the md part to do. */
1437 if (width == 1 && GET_CODE (operands[3]) == CONST_INT)
1438 {
1439 /* Do directly with bseti or bclri. */
1440 /* RBE: 2/97 consider only low bit of constant. */
1441 if ((INTVAL (operands[3]) & 1) == 0)
1442 {
1443 mask = ~(1 << posn);
1444 emit_insn (gen_rtx_SET (SImode, operands[0],
1445 gen_rtx_AND (SImode, operands[0], GEN_INT (mask))));
1446 }
1447 else
1448 {
1449 mask = 1 << posn;
1450 emit_insn (gen_rtx_SET (SImode, operands[0],
1451 gen_rtx_IOR (SImode, operands[0], GEN_INT (mask))));
1452 }
1453
1454 return 1;
1455 }
1456
1457 /* Look at some bit-field placements that we aren't interested
1458 in handling ourselves, unless specifically directed to do so. */
1459 if (! TARGET_W_FIELD)
1460 return 0; /* Generally, give up about now. */
1461
1462 if (width == 8 && posn % 8 == 0)
1463 /* Byte sized and aligned; let caller break it up. */
1464 return 0;
1465
1466 if (width == 16 && posn % 16 == 0)
1467 /* Short sized and aligned; let caller break it up. */
1468 return 0;
1469
1470 /* The general case - we can do this a little bit better than what the
1471 machine independent part tries. This will get rid of all the subregs
1472 that mess up constant folding in combine when working with relaxed
1473 immediates. */
1474
1475 /* If setting the entire field, do it directly. */
1476 if (GET_CODE (operands[3]) == CONST_INT
1477 && INTVAL (operands[3]) == ((1 << width) - 1))
1478 {
1479 mreg = force_reg (SImode, GEN_INT (INTVAL (operands[3]) << posn));
1480 emit_insn (gen_rtx_SET (SImode, operands[0],
1481 gen_rtx_IOR (SImode, operands[0], mreg)));
1482 return 1;
1483 }
1484
1485 /* Generate the clear mask. */
1486 mreg = force_reg (SImode, GEN_INT (~(((1 << width) - 1) << posn)));
1487
1488 /* Clear the field, to overlay it later with the source. */
1489 emit_insn (gen_rtx_SET (SImode, operands[0],
1490 gen_rtx_AND (SImode, operands[0], mreg)));
1491
1492 /* If the source is constant 0, we've nothing to add back. */
1493 if (GET_CODE (operands[3]) == CONST_INT && INTVAL (operands[3]) == 0)
1494 return 1;
1495
1496 /* XXX: Should we worry about more games with constant values?
1497 We've covered the high profile: set/clear single-bit and many-bit
1498 fields. How often do we see "arbitrary bit pattern" constants? */
1499 sreg = copy_to_mode_reg (SImode, operands[3]);
1500
1501 /* Extract src as same width as dst (needed for signed values). We
1502 always have to do this since we widen everything to SImode.
1503 We don't have to mask if we're shifting this up against the
1504 MSB of the register (i.e. the shift will push out any hi-order
1505 bits). */
1506 if (width + posn != (int) GET_MODE_BITSIZE (SImode))
1507 {
1508 ereg = force_reg (SImode, GEN_INT ((1 << width) - 1));
1509 emit_insn (gen_rtx_SET (SImode, sreg,
1510 gen_rtx_AND (SImode, sreg, ereg)));
1511 }
1512
1513 /* Insert source value in dest. */
1514 if (posn != 0)
1515 emit_insn (gen_rtx_SET (SImode, sreg,
1516 gen_rtx_ASHIFT (SImode, sreg, GEN_INT (posn))));
1517
1518 emit_insn (gen_rtx_SET (SImode, operands[0],
1519 gen_rtx_IOR (SImode, operands[0], sreg)));
1520
1521 return 1;
1522 }
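/* Illustrative walk-through of the general case above: inserting a 4-bit
   field at bit position 8 ANDs the destination with ~(0xf << 8), i.e.
   0xfffff0ff, to clear the field, masks the source down to 4 bits, shifts
   it left by 8, and IORs it back into the destination.  */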
1523 \f
1524 /* ??? Block move stuff stolen from m88k. This code has not been
1525 verified for correctness. */
1526
1527 /* Emit code to perform a block move. Choose the best method.
1528
1529 OPERANDS[0] is the destination.
1530 OPERANDS[1] is the source.
1531 OPERANDS[2] is the size.
1532 OPERANDS[3] is the alignment safe to use. */
1533
1534 /* Emit code to perform a block move with an offset sequence of ldw/st
1535 instructions (..., ldw 0, stw 1, ldw 1, stw 0, ...). SIZE and ALIGN are
1536 known constants. DEST and SRC are registers. OFFSET is the known
1537 starting point for the output pattern. */
1538
1539 static const enum machine_mode mode_from_align[] =
1540 {
1541 VOIDmode, QImode, HImode, VOIDmode, SImode,
1542 };
1543
1544 static void
1545 block_move_sequence (rtx dst_mem, rtx src_mem, int size, int align)
1546 {
1547 rtx temp[2];
1548 enum machine_mode mode[2];
1549 int amount[2];
1550 bool active[2];
1551 int phase = 0;
1552 int next;
1553 int offset_ld = 0;
1554 int offset_st = 0;
1555 rtx x;
1556
1557 x = XEXP (dst_mem, 0);
1558 if (!REG_P (x))
1559 {
1560 x = force_reg (Pmode, x);
1561 dst_mem = replace_equiv_address (dst_mem, x);
1562 }
1563
1564 x = XEXP (src_mem, 0);
1565 if (!REG_P (x))
1566 {
1567 x = force_reg (Pmode, x);
1568 src_mem = replace_equiv_address (src_mem, x);
1569 }
1570
1571 active[0] = active[1] = false;
1572
1573 do
1574 {
1575 next = phase;
1576 phase ^= 1;
1577
1578 if (size > 0)
1579 {
1580 int next_amount;
1581
1582 next_amount = (size >= 4 ? 4 : (size >= 2 ? 2 : 1));
1583 next_amount = MIN (next_amount, align);
1584
1585 amount[next] = next_amount;
1586 mode[next] = mode_from_align[next_amount];
1587 temp[next] = gen_reg_rtx (mode[next]);
1588
1589 x = adjust_address (src_mem, mode[next], offset_ld);
1590 emit_insn (gen_rtx_SET (VOIDmode, temp[next], x));
1591
1592 offset_ld += next_amount;
1593 size -= next_amount;
1594 active[next] = true;
1595 }
1596
1597 if (active[phase])
1598 {
1599 active[phase] = false;
1600
1601 x = adjust_address (dst_mem, mode[phase], offset_st);
1602 emit_insn (gen_rtx_SET (VOIDmode, x, temp[phase]));
1603
1604 offset_st += amount[phase];
1605 }
1606 }
1607 while (active[next]);
1608 }
1609
1610 bool
1611 mcore_expand_block_move (rtx *operands)
1612 {
1613 HOST_WIDE_INT align, bytes, max;
1614
1615 if (GET_CODE (operands[2]) != CONST_INT)
1616 return false;
1617
1618 bytes = INTVAL (operands[2]);
1619 align = INTVAL (operands[3]);
1620
1621 if (bytes <= 0)
1622 return false;
1623 if (align > 4)
1624 align = 4;
1625
1626 switch (align)
1627 {
1628 case 4:
1629 if (bytes & 1)
1630 max = 4*4;
1631 else if (bytes & 3)
1632 max = 8*4;
1633 else
1634 max = 16*4;
1635 break;
1636 case 2:
1637 max = 4*2;
1638 break;
1639 case 1:
1640 max = 4*1;
1641 break;
1642 default:
1643 gcc_unreachable ();
1644 }
1645
1646 if (bytes <= max)
1647 {
1648 block_move_sequence (operands[0], operands[1], bytes, align);
1649 return true;
1650 }
1651
1652 return false;
1653 }
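/* Illustrative example: a 12-byte copy with 4-byte alignment passes the
   "bytes <= max" test above (12 <= 16*4), so block_move_sequence expands it
   into three word loads and three word stores, interleaved so that the
   load of the next word overlaps the store of the previous one.  */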
1654 \f
1655
1656 /* Code to generate prologue and epilogue sequences. */
1657 static int number_of_regs_before_varargs;
1658
1659 /* Set by TARGET_SETUP_INCOMING_VARARGS to indicate to prolog that this is
1660 for a varargs function. */
1661 static int current_function_anonymous_args;
1662
1663 #define STACK_BYTES (STACK_BOUNDARY/BITS_PER_UNIT)
1664 #define STORE_REACH (64) /* Maximum displace of word store + 4. */
1665 #define ADDI_REACH (32) /* Maximum addi operand. */
1666
1667 static void
1668 layout_mcore_frame (struct mcore_frame * infp)
1669 {
1670 int n;
1671 unsigned int i;
1672 int nbytes;
1673 int regarg;
1674 int localregarg;
1675 int localreg;
1676 int outbounds;
1677 unsigned int growths;
1678 int step;
1679
1680 /* Might have to spill bytes to re-assemble a big argument that
1681 was passed partially in registers and partially on the stack. */
1682 nbytes = crtl->args.pretend_args_size;
1683
1684 /* Determine how much space for spilled anonymous args (e.g., stdarg). */
1685 if (current_function_anonymous_args)
1686 nbytes += (NPARM_REGS - number_of_regs_before_varargs) * UNITS_PER_WORD;
1687
1688 infp->arg_size = nbytes;
1689
1690 /* How much space to save non-volatile registers we stomp. */
1691 infp->reg_mask = calc_live_regs (& n);
1692 infp->reg_size = n * 4;
1693
1694 /* And the rest of it... locals and space for overflowed outbounds. */
1695 infp->local_size = get_frame_size ();
1696 infp->outbound_size = crtl->outgoing_args_size;
1697
1698 /* Make sure we have a whole number of words for the locals. */
1699 if (infp->local_size % STACK_BYTES)
1700 infp->local_size = (infp->local_size + STACK_BYTES - 1) & ~ (STACK_BYTES -1);
1701
1702 /* Only thing we know we have to pad is the outbound space, since
1703 we've aligned our locals assuming that base of locals is aligned. */
1704 infp->pad_local = 0;
1705 infp->pad_reg = 0;
1706 infp->pad_outbound = 0;
1707 if (infp->outbound_size % STACK_BYTES)
1708 infp->pad_outbound = STACK_BYTES - (infp->outbound_size % STACK_BYTES);
1709
1710 /* Now we see how we want to stage the prologue so that it does
1711 the most appropriate stack growth and register saves to either:
1712 (1) run fast,
1713 (2) reduce instruction space, or
1714 (3) reduce stack space. */
1715 for (i = 0; i < ARRAY_SIZE (infp->growth); i++)
1716 infp->growth[i] = 0;
1717
1718 regarg = infp->reg_size + infp->arg_size;
1719 localregarg = infp->local_size + regarg;
1720 localreg = infp->local_size + infp->reg_size;
1721 outbounds = infp->outbound_size + infp->pad_outbound;
1722 growths = 0;
1723
1724 /* XXX: Consider one where we consider localregarg + outbound too! */
1725
1726 /* If the frame is <= 32 bytes and an stm would save <= 2 registers,
1727 use stw's with offsets and buy the frame in one shot. */
1728 if (localregarg <= ADDI_REACH
1729 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1730 {
1731 /* Make sure we'll be aligned. */
1732 if (localregarg % STACK_BYTES)
1733 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1734
1735 step = localregarg + infp->pad_reg;
1736 infp->reg_offset = infp->local_size;
1737
1738 if (outbounds + step <= ADDI_REACH && !frame_pointer_needed)
1739 {
1740 step += outbounds;
1741 infp->reg_offset += outbounds;
1742 outbounds = 0;
1743 }
1744
1745 infp->arg_offset = step - 4;
1746 infp->growth[growths++] = step;
1747 infp->reg_growth = growths;
1748 infp->local_growth = growths;
1749
1750 /* If we haven't already folded it in. */
1751 if (outbounds)
1752 infp->growth[growths++] = outbounds;
1753
1754 goto finish;
1755 }
1756
1757 /* Frame can't be done with a single subi, but can be done with 2
1758 insns. If the 'stm' is getting <= 2 registers, we use stw's and
1759 shift some of the stack purchase into the first subi, so both are
1760 single instructions. */
1761 if (localregarg <= STORE_REACH
1762 && (infp->local_size > ADDI_REACH)
1763 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1764 {
1765 int all;
1766
1767 /* Make sure we'll be aligned; use either pad_reg or pad_local. */
1768 if (localregarg % STACK_BYTES)
1769 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1770
1771 all = localregarg + infp->pad_reg + infp->pad_local;
1772 step = ADDI_REACH; /* As much up front as we can. */
1773 if (step > all)
1774 step = all;
1775
1776 /* XXX: Consider whether step will still be aligned; we believe so. */
1777 infp->arg_offset = step - 4;
1778 infp->growth[growths++] = step;
1779 infp->reg_growth = growths;
1780 infp->reg_offset = step - infp->pad_reg - infp->reg_size;
1781 all -= step;
1782
1783 /* Can we fold in any space required for outbounds? */
1784 if (outbounds + all <= ADDI_REACH && !frame_pointer_needed)
1785 {
1786 all += outbounds;
1787 outbounds = 0;
1788 }
1789
1790 /* Get the rest of the locals in place. */
1791 step = all;
1792 infp->growth[growths++] = step;
1793 infp->local_growth = growths;
1794 all -= step;
1795
1796 assert (all == 0);
1797
1798 /* Finish off if we need to do so. */
1799 if (outbounds)
1800 infp->growth[growths++] = outbounds;
1801
1802 goto finish;
1803 }
1804
1805 /* Registers + args is nicely aligned, so we'll buy that in one shot.
1806 Then we buy the rest of the frame in 1 or 2 steps depending on
1807 whether we need a frame pointer. */
1808 if ((regarg % STACK_BYTES) == 0)
1809 {
1810 infp->growth[growths++] = regarg;
1811 infp->reg_growth = growths;
1812 infp->arg_offset = regarg - 4;
1813 infp->reg_offset = 0;
1814
1815 if (infp->local_size % STACK_BYTES)
1816 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1817
1818 step = infp->local_size + infp->pad_local;
1819
1820 if (!frame_pointer_needed)
1821 {
1822 step += outbounds;
1823 outbounds = 0;
1824 }
1825
1826 infp->growth[growths++] = step;
1827 infp->local_growth = growths;
1828
1829 /* If there's any left to be done. */
1830 if (outbounds)
1831 infp->growth[growths++] = outbounds;
1832
1833 goto finish;
1834 }
1835
1836 /* XXX: optimizations that we'll want to play with....
1837 -- regarg is not aligned, but it's a small number of registers;
1838 use some of localsize so that regarg is aligned and then
1839 save the registers. */
1840
1841 /* Simple encoding; plods down the stack buying the pieces as it goes.
1842 -- does not optimize space consumption.
1843 -- does not attempt to optimize instruction counts.
1844 -- but it is safe for all alignments. */
1845 if (regarg % STACK_BYTES != 0)
1846 infp->pad_reg = STACK_BYTES - (regarg % STACK_BYTES);
1847
1848 infp->growth[growths++] = infp->arg_size + infp->reg_size + infp->pad_reg;
1849 infp->reg_growth = growths;
1850 infp->arg_offset = infp->growth[0] - 4;
1851 infp->reg_offset = 0;
1852
1853 if (frame_pointer_needed)
1854 {
1855 if (infp->local_size % STACK_BYTES != 0)
1856 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1857
1858 infp->growth[growths++] = infp->local_size + infp->pad_local;
1859 infp->local_growth = growths;
1860
1861 infp->growth[growths++] = outbounds;
1862 }
1863 else
1864 {
1865 if ((infp->local_size + outbounds) % STACK_BYTES != 0)
1866 infp->pad_local = STACK_BYTES - ((infp->local_size + outbounds) % STACK_BYTES);
1867
1868 infp->growth[growths++] = infp->local_size + infp->pad_local + outbounds;
1869 infp->local_growth = growths;
1870 }
1871
1872 /* Anything else that we've forgotten, plus a few consistency checks. */
1873 finish:
1874 assert (infp->reg_offset >= 0);
1875 assert (growths <= MAX_STACK_GROWS);
1876
1877 for (i = 0; i < growths; i++)
1878 gcc_assert (!(infp->growth[i] % STACK_BYTES));
1879 }
1880
1881 /* Define the offset between two registers, one to be eliminated, and
1882 the other its replacement, at the start of a routine. */
1883
1884 int
1885 mcore_initial_elimination_offset (int from, int to)
1886 {
1887 int above_frame;
1888 int below_frame;
1889 struct mcore_frame fi;
1890
1891 layout_mcore_frame (& fi);
1892
1893 /* fp to ap */
1894 above_frame = fi.local_size + fi.pad_local + fi.reg_size + fi.pad_reg;
1895 /* sp to fp */
1896 below_frame = fi.outbound_size + fi.pad_outbound;
1897
1898 if (from == ARG_POINTER_REGNUM && to == FRAME_POINTER_REGNUM)
1899 return above_frame;
1900
1901 if (from == ARG_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1902 return above_frame + below_frame;
1903
1904 if (from == FRAME_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1905 return below_frame;
1906
1907 gcc_unreachable ();
1908 }
1909
1910 /* Keep track of some information about varargs for the prolog. */
1911
1912 static void
1913 mcore_setup_incoming_varargs (CUMULATIVE_ARGS *args_so_far,
1914 enum machine_mode mode, tree type,
1915 int * ptr_pretend_size ATTRIBUTE_UNUSED,
1916 int second_time ATTRIBUTE_UNUSED)
1917 {
1918 current_function_anonymous_args = 1;
1919
1920 /* We need to know how many argument registers are used before
1921 the varargs start, so that we can push the remaining argument
1922 registers during the prologue. */
1923 number_of_regs_before_varargs = *args_so_far + mcore_num_arg_regs (mode, type);
1924
1925 /* There is a bug somewhere in the arg handling code.
1926 Until I can find it this workaround always pushes the
1927 last named argument onto the stack. */
1928 number_of_regs_before_varargs = *args_so_far;
1929
1930 /* The last named argument may be split between argument registers
1931 and the stack. Allow for this here. */
1932 if (number_of_regs_before_varargs > NPARM_REGS)
1933 number_of_regs_before_varargs = NPARM_REGS;
1934 }
1935
1936 void
1937 mcore_expand_prolog (void)
1938 {
1939 struct mcore_frame fi;
1940 int space_allocated = 0;
1941 int growth = 0;
1942
1943 /* Find out what we're doing. */
1944 layout_mcore_frame (&fi);
1945
1946 space_allocated = fi.arg_size + fi.reg_size + fi.local_size +
1947 fi.outbound_size + fi.pad_outbound + fi.pad_local + fi.pad_reg;
1948
1949 if (TARGET_CG_DATA)
1950 {
1951 /* Emit a symbol for this routine's frame size. */
1952 rtx x;
1953
1954 x = DECL_RTL (current_function_decl);
1955
1956 gcc_assert (GET_CODE (x) == MEM);
1957
1958 x = XEXP (x, 0);
1959
1960 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1961
1962 if (mcore_current_function_name)
1963 free (mcore_current_function_name);
1964
1965 mcore_current_function_name = xstrdup (XSTR (x, 0));
1966
1967 ASM_OUTPUT_CG_NODE (asm_out_file, mcore_current_function_name, space_allocated);
1968
1969 if (cfun->calls_alloca)
1970 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name, "alloca", 1);
1971
1972 /* 970425: RBE:
1973 We're looking at how the 8-byte alignment affects stack layout
1974 and where we had to pad things. This emits information we can
1975 extract which tells us about frame sizes and the like. */
1976 fprintf (asm_out_file,
1977 "\t.equ\t__$frame$info$_%s_$_%d_%d_x%x_%d_%d_%d,0\n",
1978 mcore_current_function_name,
1979 fi.arg_size, fi.reg_size, fi.reg_mask,
1980 fi.local_size, fi.outbound_size,
1981 frame_pointer_needed);
1982 }
1983
1984 if (mcore_naked_function_p ())
1985 return;
1986
1987 /* Handle stdarg+regsaves in one shot: can't be more than 64 bytes. */
1988 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
1989
1990 /* If we have a parameter passed partially in regs and partially in memory,
1991 the registers will have been stored to memory already in function.c. So
1992 we only need to do something here for varargs functions. */
1993 if (fi.arg_size != 0 && crtl->args.pretend_args_size == 0)
1994 {
1995 int offset;
1996 int rn = FIRST_PARM_REG + NPARM_REGS - 1;
1997 int remaining = fi.arg_size;
1998
1999 for (offset = fi.arg_offset; remaining >= 4; offset -= 4, rn--, remaining -= 4)
2000 {
2001 emit_insn (gen_movsi
2002 (gen_rtx_MEM (SImode,
2003 plus_constant (stack_pointer_rtx, offset)),
2004 gen_rtx_REG (SImode, rn)));
2005 }
2006 }
2007
2008 /* Do we need another stack adjustment before we do the register saves? */
2009 if (growth < fi.reg_growth)
2010 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2011
2012 if (fi.reg_size != 0)
2013 {
2014 int i;
2015 int offs = fi.reg_offset;
2016
2017 for (i = 15; i >= 0; i--)
2018 {
2019 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2020 {
2021 int first_reg = 15;
2022
2023 while (fi.reg_mask & (1 << first_reg))
2024 first_reg--;
2025 first_reg++;
2026
2027 emit_insn (gen_store_multiple (gen_rtx_MEM (SImode, stack_pointer_rtx),
2028 gen_rtx_REG (SImode, first_reg),
2029 GEN_INT (16 - first_reg)));
2030
2031 i -= (15 - first_reg);
2032 offs += (16 - first_reg) * 4;
2033 }
2034 else if (fi.reg_mask & (1 << i))
2035 {
2036 emit_insn (gen_movsi
2037 (gen_rtx_MEM (SImode,
2038 plus_constant (stack_pointer_rtx, offs)),
2039 gen_rtx_REG (SImode, i)));
2040 offs += 4;
2041 }
2042 }
2043 }
2044
2045 /* Figure the locals + outbounds. */
2046 if (frame_pointer_needed)
2047 {
2048 /* If we have not already grown the stack as far as the frame pointer. */
2049 if (growth < fi.local_growth)
2050 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2051
2052 emit_insn (gen_movsi (frame_pointer_rtx, stack_pointer_rtx));
2053
2054 /* ... and then go any remaining distance for outbounds, etc. */
2055 if (fi.growth[growth])
2056 output_stack_adjust (-1, fi.growth[growth++]);
2057 }
2058 else
2059 {
2060 if (growth < fi.local_growth)
2061 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2062 if (fi.growth[growth])
2063 output_stack_adjust (-1, fi.growth[growth++]);
2064 }
2065 }
2066
2067 void
2068 mcore_expand_epilog (void)
2069 {
2070 struct mcore_frame fi;
2071 int i;
2072 int offs;
2073 int growth = MAX_STACK_GROWS - 1;
2074
2075
2076 /* Find out what we're doing. */
2077 layout_mcore_frame (&fi);
2078
2079 if (mcore_naked_function_p ())
2080 return;
2081
2082 /* If we had a frame pointer, restore the sp from that. */
2083 if (frame_pointer_needed)
2084 {
2085 emit_insn (gen_movsi (stack_pointer_rtx, frame_pointer_rtx));
2086 growth = fi.local_growth - 1;
2087 }
2088 else
2089 {
2090 /* XXX: the while loop should accumulate the adjustments and emit a single stack adjustment. */
2091 while (growth >= fi.local_growth)
2092 {
2093 if (fi.growth[growth] != 0)
2094 output_stack_adjust (1, fi.growth[growth]);
2095 growth--;
2096 }
2097 }
2098
2099 /* Make sure we've shrunk stack back to the point where the registers
2100 were laid down. This is typically 0/1 iterations. Then pull the
2101 register save information back off the stack. */
2102 while (growth >= fi.reg_growth)
2103 output_stack_adjust (1, fi.growth[growth--]);
2104
2105 offs = fi.reg_offset;
2106
2107 for (i = 15; i >= 0; i--)
2108 {
2109 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2110 {
2111 int first_reg;
2112
2113 /* Find the starting register. */
2114 first_reg = 15;
2115
2116 while (fi.reg_mask & (1 << first_reg))
2117 first_reg--;
2118
2119 first_reg++;
2120
2121 emit_insn (gen_load_multiple (gen_rtx_REG (SImode, first_reg),
2122 gen_rtx_MEM (SImode, stack_pointer_rtx),
2123 GEN_INT (16 - first_reg)));
2124
2125 i -= (15 - first_reg);
2126 offs += (16 - first_reg) * 4;
2127 }
2128 else if (fi.reg_mask & (1 << i))
2129 {
2130 emit_insn (gen_movsi
2131 (gen_rtx_REG (SImode, i),
2132 gen_rtx_MEM (SImode,
2133 plus_constant (stack_pointer_rtx, offs))));
2134 offs += 4;
2135 }
2136 }
2137
2138 /* Give back anything else. */
2139 /* XXX: Should accumulate total and then give it back. */
2140 while (growth >= 0)
2141 output_stack_adjust (1, fi.growth[growth--]);
2142 }
2143 \f
2144 /* This code is borrowed from the SH port. */
2145
2146 /* The MCORE cannot load a large constant into a register; constants have to
2147 come from a pc relative load. The literal referenced by a pc relative load
2148 must lie less than 1k bytes ahead of the instruction. This
2149 means that we often have to dump a constant inside a function, and
2150 generate code to branch around it.
2151
2152 It is important to minimize this, since the branches will slow things
2153 down and make things bigger.
2154
2155 Worst case code looks like:
2156
2157 lrw L1,r0
2158 br L2
2159 align
2160 L1: .long value
2161 L2:
2162 ..
2163
2164 lrw L3,r0
2165 br L4
2166 align
2167 L3: .long value
2168 L4:
2169 ..
2170
2171 We fix this by performing a scan before scheduling, which notices which
2172 instructions need to have their operands fetched from the constant table
2173 and builds the table.
2174
2175 The algorithm is:
2176
2177 scan, find an instruction which needs a pcrel move. Look forward, find the
2178 last barrier which is within MAX_COUNT bytes of the requirement.
2179 If there isn't one, make one. Process all the instructions between
2180 the find and the barrier.
2181
2182 In the above example, we can tell that L3 is within 1k of L1, so
2183 the first move can be shrunk from the 2 insn+constant sequence into
2184 just 1 insn, and the constant moved to L3 to make:
2185
2186 lrw L1,r0
2187 ..
2188 lrw L3,r0
2189 br L4
2190 align
2191 L3:.long value
2192 L4:.long value
2193
2194 Then the second move becomes the target for the shortening process. */
2195
2196 typedef struct
2197 {
2198 rtx value; /* Value in table. */
2199 rtx label; /* Label of value. */
2200 } pool_node;
2201
2202 /* The maximum number of constants that can fit into one pool, since
2203 the pc relative range is 0...1020 bytes and constants are at least 4
2204 bytes long. We subtract 4 from the range to allow for the case where
2205 we need to add a branch/align before the constant pool. */
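/* For instance: the 0...1020 byte pc relative range less the 4 bytes
   reserved for the branch/align gives MAX_COUNT of 1016, and since each
   constant occupies at least 4 bytes, at most 1016 / 4 = 254 entries can
   live in a single pool.  */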
2206
2207 #define MAX_COUNT 1016
2208 #define MAX_POOL_SIZE (MAX_COUNT/4)
2209 static pool_node pool_vector[MAX_POOL_SIZE];
2210 static int pool_size;
2211
2212 /* Dump out any constants accumulated in the final pass. These
2213 will only be labels. */
2214
2215 const char *
2216 mcore_output_jump_label_table (void)
2217 {
2218 int i;
2219
2220 if (pool_size)
2221 {
2222 fprintf (asm_out_file, "\t.align 2\n");
2223
2224 for (i = 0; i < pool_size; i++)
2225 {
2226 pool_node * p = pool_vector + i;
2227
2228 (*targetm.asm_out.internal_label) (asm_out_file, "L", CODE_LABEL_NUMBER (p->label));
2229
2230 output_asm_insn (".long %0", &p->value);
2231 }
2232
2233 pool_size = 0;
2234 }
2235
2236 return "";
2237 }
2238
2239 /* Check whether insn is a candidate for a conditional. */
2240
2241 static cond_type
2242 is_cond_candidate (rtx insn)
2243 {
2244 /* The only things we conditionalize are those that can be directly
2245 changed into a conditional. Only bother with SImode items. If
2246 we wanted to be a little more aggressive, we could also do other
2247 modes such as DImode with reg-reg move or load 0. */
2248 if (GET_CODE (insn) == INSN)
2249 {
2250 rtx pat = PATTERN (insn);
2251 rtx src, dst;
2252
2253 if (GET_CODE (pat) != SET)
2254 return COND_NO;
2255
2256 dst = XEXP (pat, 0);
2257
2258 if ((GET_CODE (dst) != REG &&
2259 GET_CODE (dst) != SUBREG) ||
2260 GET_MODE (dst) != SImode)
2261 return COND_NO;
2262
2263 src = XEXP (pat, 1);
2264
2265 if ((GET_CODE (src) == REG ||
2266 (GET_CODE (src) == SUBREG &&
2267 GET_CODE (SUBREG_REG (src)) == REG)) &&
2268 GET_MODE (src) == SImode)
2269 return COND_MOV_INSN;
2270 else if (GET_CODE (src) == CONST_INT &&
2271 INTVAL (src) == 0)
2272 return COND_CLR_INSN;
2273 else if (GET_CODE (src) == PLUS &&
2274 (GET_CODE (XEXP (src, 0)) == REG ||
2275 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2276 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2277 GET_MODE (XEXP (src, 0)) == SImode &&
2278 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2279 INTVAL (XEXP (src, 1)) == 1)
2280 return COND_INC_INSN;
2281 else if (((GET_CODE (src) == MINUS &&
2282 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2283 INTVAL( XEXP (src, 1)) == 1) ||
2284 (GET_CODE (src) == PLUS &&
2285 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2286 INTVAL (XEXP (src, 1)) == -1)) &&
2287 (GET_CODE (XEXP (src, 0)) == REG ||
2288 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2289 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2290 GET_MODE (XEXP (src, 0)) == SImode)
2291 return COND_DEC_INSN;
2292
2293 /* Some insns that we don't bother with:
2294 (set (rx:DI) (ry:DI))
2295 (set (rx:DI) (const_int 0))
2296 */
2297
2298 }
2299 else if (GET_CODE (insn) == JUMP_INSN &&
2300 GET_CODE (PATTERN (insn)) == SET &&
2301 GET_CODE (XEXP (PATTERN (insn), 1)) == LABEL_REF)
2302 return COND_BRANCH_INSN;
2303
2304 return COND_NO;
2305 }
2306
2307 /* Emit a conditional version of insn and replace the old insn with the
2308 new one. Return the new insn if emitted. */
2309
2310 static rtx
2311 emit_new_cond_insn (rtx insn, int cond)
2312 {
2313 rtx c_insn = 0;
2314 rtx pat, dst, src;
2315 cond_type num;
2316
2317 if ((num = is_cond_candidate (insn)) == COND_NO)
2318 return NULL;
2319
2320 pat = PATTERN (insn);
2321
2322 if (GET_CODE (insn) == INSN)
2323 {
2324 dst = SET_DEST (pat);
2325 src = SET_SRC (pat);
2326 }
2327 else
2328 {
2329 dst = JUMP_LABEL (insn);
2330 src = NULL_RTX;
2331 }
2332
2333 switch (num)
2334 {
2335 case COND_MOV_INSN:
2336 case COND_CLR_INSN:
2337 if (cond)
2338 c_insn = gen_movt0 (dst, src, dst);
2339 else
2340 c_insn = gen_movt0 (dst, dst, src);
2341 break;
2342
2343 case COND_INC_INSN:
2344 if (cond)
2345 c_insn = gen_incscc (dst, dst);
2346 else
2347 c_insn = gen_incscc_false (dst, dst);
2348 break;
2349
2350 case COND_DEC_INSN:
2351 if (cond)
2352 c_insn = gen_decscc (dst, dst);
2353 else
2354 c_insn = gen_decscc_false (dst, dst);
2355 break;
2356
2357 case COND_BRANCH_INSN:
2358 if (cond)
2359 c_insn = gen_branch_true (dst);
2360 else
2361 c_insn = gen_branch_false (dst);
2362 break;
2363
2364 default:
2365 return NULL;
2366 }
2367
2368 /* Only copy the notes if they exist. */
2369 if (rtx_length [GET_CODE (c_insn)] >= 7 && rtx_length [GET_CODE (insn)] >= 7)
2370 {
2371 /* We really don't need to bother with the notes and links at this
2372 point, but go ahead and save the notes. This will help is_dead()
2373 when applying peepholes (links don't matter since they are not
2374 used any more beyond this point for the mcore). */
2375 REG_NOTES (c_insn) = REG_NOTES (insn);
2376 }
2377
2378 if (num == COND_BRANCH_INSN)
2379 {
2380 /* For jumps, we need to be a little bit careful and emit the new jump
2381 before the old one and to update the use count for the target label.
2382 This way, the barrier following the old (uncond) jump will get
2383 deleted, but the label won't. */
2384 c_insn = emit_jump_insn_before (c_insn, insn);
2385
2386 ++ LABEL_NUSES (dst);
2387
2388 JUMP_LABEL (c_insn) = dst;
2389 }
2390 else
2391 c_insn = emit_insn_after (c_insn, insn);
2392
2393 delete_insn (insn);
2394
2395 return c_insn;
2396 }
2397
2398 /* Attempt to change a basic block into a series of conditional insns. This
2399 works by taking the branch at the end of the 1st block and scanning for the
2400 end of the 2nd block. If all instructions in the 2nd block have cond.
2401 versions and the label at the start of block 3 is the same as the target
2402 from the branch at block 1, then conditionalize all insns in block 2 using
2403 the inverse condition of the branch at block 1. (Note I'm bending the
2404 definition of basic block here.)
2405
2406 e.g., change:
2407
2408 bt L2 <-- end of block 1 (delete)
2409 mov r7,r8
2410 addu r7,1
2411 br L3 <-- end of block 2
2412
2413 L2: ... <-- start of block 3 (NUSES==1)
2414 L3: ...
2415
2416 to:
2417
2418 movf r7,r8
2419 incf r7
2420 bf L3
2421
2422 L3: ...
2423
2424 We can delete the L2 label if NUSES==1 and re-apply the optimization
2425 starting at the last instruction of block 2. This may allow an entire
2426 if-then-else statement to be conditionalized. BRC */
2427 static rtx
2428 conditionalize_block (rtx first)
2429 {
2430 rtx insn;
2431 rtx br_pat;
2432 rtx end_blk_1_br = 0;
2433 rtx end_blk_2_insn = 0;
2434 rtx start_blk_3_lab = 0;
2435 int cond;
2436 int br_lab_num;
2437 int blk_size = 0;
2438
2439
2440 /* Check that the first insn is a candidate conditional jump. This is
2441 the one that we'll eliminate. If not, advance to the next insn to
2442 try. */
2443 if (GET_CODE (first) != JUMP_INSN ||
2444 GET_CODE (PATTERN (first)) != SET ||
2445 GET_CODE (XEXP (PATTERN (first), 1)) != IF_THEN_ELSE)
2446 return NEXT_INSN (first);
2447
2448 /* Extract some information we need. */
2449 end_blk_1_br = first;
2450 br_pat = PATTERN (end_blk_1_br);
2451
2452 /* Complement the condition since we use the reverse cond. for the insns. */
2453 cond = (GET_CODE (XEXP (XEXP (br_pat, 1), 0)) == EQ);
2454
2455 /* Determine what kind of branch we have. */
2456 if (GET_CODE (XEXP (XEXP (br_pat, 1), 1)) == LABEL_REF)
2457 {
2458 /* A normal branch, so extract label out of first arm. */
2459 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 1), 0));
2460 }
2461 else
2462 {
2463 /* An inverse branch, so extract the label out of the 2nd arm
2464 and complement the condition. */
2465 cond = (cond == 0);
2466 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 2), 0));
2467 }
2468
2469 /* Scan forward for the start of block 2: it must start with a
2470 label and that label must be the same as the branch target
2471 label from block 1. We don't care about whether block 2 actually
2472 ends with a branch or a label (an uncond. branch is
2473 conditionalizable). */
2474 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
2475 {
2476 enum rtx_code code;
2477
2478 code = GET_CODE (insn);
2479
2480 /* Look for the label at the start of block 3. */
2481 if (code == CODE_LABEL && CODE_LABEL_NUMBER (insn) == br_lab_num)
2482 break;
2483
2484 /* Skip barriers, notes, and conditionalizable insns. If the
2485 insn is not conditionalizable or makes this optimization fail,
2486 just return the next insn so we can start over from that point. */
2487 if (code != BARRIER && code != NOTE && !is_cond_candidate (insn))
2488 return NEXT_INSN (insn);
2489
2490 /* Remember the last real insn before the label (i.e. end of block 2). */
2491 if (code == JUMP_INSN || code == INSN)
2492 {
2493 blk_size ++;
2494 end_blk_2_insn = insn;
2495 }
2496 }
2497
2498 if (!insn)
2499 return insn;
2500
2501 /* It is possible for this optimization to slow performance if the blocks
2502 are long. This really depends upon whether the branch is likely taken
2503 or not. If the branch is taken, we slow performance in many cases. But,
2504 if the branch is not taken, we always help performance (for a single
2505 block; for a double block (i.e. when the optimization is re-applied)
2506 this is not true, since the 'right thing' depends on the overall length of
2507 the collapsed block). As a compromise, don't apply this optimization to
2508 blocks larger than size 2 (unlikely for the mcore) when speed is important.
2509 The best threshold depends on the latencies of the instructions (i.e.,
2510 the branch penalty). */
2511 if (optimize > 1 && blk_size > 2)
2512 return insn;
2513
2514 /* At this point, we've found the start of block 3 and we know that
2515 it is the destination of the branch from block 1. Also, all
2516 instructions in the block 2 are conditionalizable. So, apply the
2517 conditionalization and delete the branch. */
2518 start_blk_3_lab = insn;
2519
2520 for (insn = NEXT_INSN (end_blk_1_br); insn != start_blk_3_lab;
2521 insn = NEXT_INSN (insn))
2522 {
2523 rtx newinsn;
2524
2525 if (INSN_DELETED_P (insn))
2526 continue;
2527
2528 /* Try to form a conditional variant of the instruction and emit it. */
2529 if ((newinsn = emit_new_cond_insn (insn, cond)))
2530 {
2531 if (end_blk_2_insn == insn)
2532 end_blk_2_insn = newinsn;
2533
2534 insn = newinsn;
2535 }
2536 }
2537
2538 /* Note whether we will delete the label starting blk 3 when the jump
2539 gets deleted. If so, we want to re-apply this optimization at the
2540 last real instruction right before the label. */
2541 if (LABEL_NUSES (start_blk_3_lab) == 1)
2542 {
2543 start_blk_3_lab = 0;
2544 }
2545
2546 /* ??? We probably should redistribute the death notes for this insn, esp.
2547 the death of cc, but it doesn't really matter this late in the game.
2548 The peepholes all use is_dead() which will find the correct death
2549 regardless of whether there is a note. */
2550 delete_insn (end_blk_1_br);
2551
2552 if (! start_blk_3_lab)
2553 return end_blk_2_insn;
2554
2555 /* Return the insn right after the label at the start of block 3. */
2556 return NEXT_INSN (start_blk_3_lab);
2557 }
2558
2559 /* Apply the conditionalization of blocks optimization. This is the
2560 outer loop that traverses through the insns scanning for a branch
2561 that signifies an opportunity to apply the optimization. Note that
2562 this optimization is applied late. If we could apply it earlier,
2563 say before cse 2, it might expose more optimization opportunities,
2564 but the payback probably isn't really worth the effort (we'd have
2565 to update all reg/flow/notes/links/etc to make it work - and stick it
2566 in before cse 2). */
2567
2568 static void
2569 conditionalize_optimization (void)
2570 {
2571 rtx insn;
2572
2573 for (insn = get_insns (); insn; insn = conditionalize_block (insn))
2574 continue;
2575 }
2576
2577 static int saved_warn_return_type = -1;
2578 static int saved_warn_return_type_count = 0;
2579
2580 /* This is to handle loads from the constant pool. */
2581
2582 static void
2583 mcore_reorg (void)
2584 {
2585 /* Reset this variable. */
2586 current_function_anonymous_args = 0;
2587
2588 /* Restore the warn_return_type if it has been altered. */
2589 if (saved_warn_return_type != -1)
2590 {
2591 /* Only restore the value if we have reached another function.
2592 The test of warn_return_type occurs in finish_function () in
2593 c-decl.c a long time after the code for the function is generated,
2594 so we need a counter to tell us when we have finished parsing that
2595 function and can restore the flag. */
2596 if (--saved_warn_return_type_count == 0)
2597 {
2598 warn_return_type = saved_warn_return_type;
2599 saved_warn_return_type = -1;
2600 }
2601 }
2602
2603 if (optimize == 0)
2604 return;
2605
2606 /* Conditionalize blocks where we can. */
2607 conditionalize_optimization ();
2608
2609 /* Literal pool generation is now pushed off until the assembler. */
2610 }
2611
2612 \f
2613 /* Return true if X is something that can be moved directly into r15. */
2614
2615 bool
2616 mcore_r15_operand_p (rtx x)
2617 {
2618 switch (GET_CODE (x))
2619 {
2620 case CONST_INT:
2621 return mcore_const_ok_for_inline (INTVAL (x));
2622
2623 case REG:
2624 case SUBREG:
2625 case MEM:
2626 return 1;
2627
2628 default:
2629 return 0;
2630 }
2631 }
2632
2633 /* Implement SECONDARY_RELOAD_CLASS. If RCLASS contains r15, and we can't
2634 directly move X into it, use r1-r14 as a temporary. */
2635
2636 enum reg_class
2637 mcore_secondary_reload_class (enum reg_class rclass,
2638 enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
2639 {
2640 if (TEST_HARD_REG_BIT (reg_class_contents[rclass], 15)
2641 && !mcore_r15_operand_p (x))
2642 return LRW_REGS;
2643 return NO_REGS;
2644 }
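/* For example: a constant that mcore_const_ok_for_inline rejects cannot
   be moved straight into r15, so a reload of such a constant into any
   class containing r15 is routed through an LRW_REGS (r1-r14) temporary
   first.  */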
2645
2646 /* Return the reg_class to use when reloading the rtx X into the class
2647 RCLASS. If X is too complex to move directly into r15, prefer to
2648 use LRW_REGS instead. */
2649
2650 enum reg_class
2651 mcore_reload_class (rtx x, enum reg_class rclass)
2652 {
2653 if (reg_class_subset_p (LRW_REGS, rclass) && !mcore_r15_operand_p (x))
2654 return LRW_REGS;
2655
2656 return rclass;
2657 }
2658
2659 /* Tell me if a pair of reg/subreg rtx's actually refer to the same
2660 register. Note that the current version doesn't worry about whether
2661 they are the same mode or not (e.g., a QImode in r2 matches an HImode
2662 in r2, which matches an SImode in r2). We might think in the future about
2663 whether we want to be able to say something about modes. */
2664
2665 int
2666 mcore_is_same_reg (rtx x, rtx y)
2667 {
2668 /* Strip any and all of the subreg wrappers. */
2669 while (GET_CODE (x) == SUBREG)
2670 x = SUBREG_REG (x);
2671
2672 while (GET_CODE (y) == SUBREG)
2673 y = SUBREG_REG (y);
2674
2675 if (GET_CODE(x) == REG && GET_CODE(y) == REG && REGNO(x) == REGNO(y))
2676 return 1;
2677
2678 return 0;
2679 }
2680
2681 void
2682 mcore_override_options (void)
2683 {
2684 /* Only the m340 supports little endian code. */
2685 if (TARGET_LITTLE_END && ! TARGET_M340)
2686 target_flags |= MASK_M340;
2687 }
2688 \f
2689 /* Compute the number of word sized registers needed to
2690 hold a function argument of mode MODE and type TYPE. */
2691
2692 int
2693 mcore_num_arg_regs (enum machine_mode mode, const_tree type)
2694 {
2695 int size;
2696
2697 if (targetm.calls.must_pass_in_stack (mode, type))
2698 return 0;
2699
2700 if (type && mode == BLKmode)
2701 size = int_size_in_bytes (type);
2702 else
2703 size = GET_MODE_SIZE (mode);
2704
2705 return ROUND_ADVANCE (size);
2706 }
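/* For example, assuming UNITS_PER_WORD is 4 and ROUND_ADVANCE rounds a
   byte count up to whole words, a 10 byte BLKmode structure needs
   ROUND_ADVANCE (10) == 3 argument registers, while an SImode value
   needs exactly one.  */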
2707
2708 static rtx
2709 handle_structs_in_regs (enum machine_mode mode, const_tree type, int reg)
2710 {
2711 int size;
2712
2713 /* The MCore ABI defines that a structure whose size is not a whole multiple
2714 of words is passed packed into registers (or spilled onto the stack if
2715 not enough registers are available) with the last few bytes of the
2716 structure being packed, left-justified, into the last register/stack slot.
2717 GCC handles this correctly if the last word is in a stack slot, but we
2718 have to generate a special PARALLEL rtx if the last word is in an
2719 argument register. */
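/* For illustration, assuming the argument starts in hardware register 2
   (the first parameter register): a 6 byte BLKmode structure produces a
   PARALLEL holding (reg:SI 2) at byte offset 0 and (reg:SI 3) at byte
   offset 4, with the final two bytes left-justified in r3.  */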
2720 if (type
2721 && TYPE_MODE (type) == BLKmode
2722 && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST
2723 && (size = int_size_in_bytes (type)) > UNITS_PER_WORD
2724 && (size % UNITS_PER_WORD != 0)
2725 && (reg + mcore_num_arg_regs (mode, type) <= (FIRST_PARM_REG + NPARM_REGS)))
2726 {
2727 rtx arg_regs [NPARM_REGS];
2728 int nregs;
2729 rtx result;
2730 rtvec rtvec;
2731
2732 for (nregs = 0; size > 0; size -= UNITS_PER_WORD)
2733 {
2734 arg_regs [nregs] =
2735 gen_rtx_EXPR_LIST (SImode, gen_rtx_REG (SImode, reg ++),
2736 GEN_INT (nregs * UNITS_PER_WORD));
2737 nregs ++;
2738 }
2739
2740 /* We assume here that NPARM_REGS == 6. The assert checks this. */
2741 assert (ARRAY_SIZE (arg_regs) == 6);
2742 rtvec = gen_rtvec (nregs, arg_regs[0], arg_regs[1], arg_regs[2],
2743 arg_regs[3], arg_regs[4], arg_regs[5]);
2744
2745 result = gen_rtx_PARALLEL (mode, rtvec);
2746 return result;
2747 }
2748
2749 return gen_rtx_REG (mode, reg);
2750 }
2751
2752 rtx
2753 mcore_function_value (const_tree valtype, const_tree func)
2754 {
2755 enum machine_mode mode;
2756 int unsigned_p;
2757
2758 mode = TYPE_MODE (valtype);
2759
2760 /* Since we promote return types, we must promote the mode here too. */
2761 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1);
2762
2763 return handle_structs_in_regs (mode, valtype, FIRST_RET_REG);
2764 }
2765
2766 /* Define where to put the arguments to a function.
2767 Value is zero to push the argument on the stack,
2768 or a hard register in which to store the argument.
2769
2770 MODE is the argument's machine mode.
2771 TYPE is the data type of the argument (as a tree).
2772 This is null for libcalls where that information may
2773 not be available.
2774 CUM is a variable of type CUMULATIVE_ARGS which gives info about
2775 the preceding args and about the function being called.
2776 NAMED is nonzero if this argument is a named parameter
2777 (otherwise it is an extra parameter matching an ellipsis).
2778
2779 On MCore the first args are normally in registers
2780 and the rest are pushed. Any arg that starts within the first
2781 NPARM_REGS words is at least partially passed in a register unless
2782 its data type forbids. */
2783
2784 rtx
2785 mcore_function_arg (CUMULATIVE_ARGS cum, enum machine_mode mode,
2786 tree type, int named)
2787 {
2788 int arg_reg;
2789
2790 if (! named || mode == VOIDmode)
2791 return 0;
2792
2793 if (targetm.calls.must_pass_in_stack (mode, type))
2794 return 0;
2795
2796 arg_reg = ROUND_REG (cum, mode);
2797
2798 if (arg_reg < NPARM_REGS)
2799 return handle_structs_in_regs (mode, type, FIRST_PARM_REG + arg_reg);
2800
2801 return 0;
2802 }
2803
2804 /* Returns the number of bytes of argument registers required to hold *part*
2805 of a parameter of machine mode MODE and type TYPE (which may be NULL if
2806 the type is not known). If the argument fits entirely in the argument
2807 registers, or entirely on the stack, then 0 is returned. CUM is the
2808 number of argument registers already used by earlier parameters to
2809 the function. */
2810
2811 static int
2812 mcore_arg_partial_bytes (CUMULATIVE_ARGS *cum, enum machine_mode mode,
2813 tree type, bool named)
2814 {
2815 int reg = ROUND_REG (*cum, mode);
2816
2817 if (named == 0)
2818 return 0;
2819
2820 if (targetm.calls.must_pass_in_stack (mode, type))
2821 return 0;
2822
2823 /* REG is not the *hardware* register number of the register that holds
2824 the argument, it is the *argument* register number. So for example,
2825 the first argument to a function goes in argument register 0, which
2826 translates (for the MCore) into hardware register 2. The second
2827 argument goes into argument register 1, which translates into hardware
2828 register 3, and so on. NPARM_REGS is the number of argument registers
2829 supported by the target, not the maximum hardware register number of
2830 the target. */
2831 if (reg >= NPARM_REGS)
2832 return 0;
2833
2834 /* If the argument fits entirely in registers, return 0. */
2835 if (reg + mcore_num_arg_regs (mode, type) <= NPARM_REGS)
2836 return 0;
2837
2838 /* The argument overflows the number of available argument registers.
2839 Compute how many argument registers have not yet been assigned to
2840 hold an argument. */
2841 reg = NPARM_REGS - reg;
2842
2843 /* Return partially in registers and partially on the stack. */
2844 return reg * UNITS_PER_WORD;
2845 }
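/* For example, with NPARM_REGS == 6 and argument register 0 being
   hardware register 2: if four argument words are already in use
   (REG == 4) and the next argument needs three words, two of them are
   passed in r6 and r7 and the last word goes on the stack, so this
   function returns 2 * UNITS_PER_WORD bytes.  */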
2846 \f
2847 /* Return nonzero if SYMBOL is marked as being dllexport'd. */
2848
2849 int
2850 mcore_dllexport_name_p (const char * symbol)
2851 {
2852 return symbol[0] == '@' && symbol[1] == 'e' && symbol[2] == '.';
2853 }
2854
2855 /* Return nonzero if SYMBOL is marked as being dllimport'd. */
2856
2857 int
2858 mcore_dllimport_name_p (const char * symbol)
2859 {
2860 return symbol[0] == '@' && symbol[1] == 'i' && symbol[2] == '.';
2861 }
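/* These prefixes are attached by mcore_mark_dllexport and
   mcore_mark_dllimport below: a dllexport'd symbol foo is renamed
   "@e.foo", while a dllimport'd one becomes "@i.__imp_foo".  */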
2862
2863 /* Mark a DECL as being dllexport'd. */
2864
2865 static void
2866 mcore_mark_dllexport (tree decl)
2867 {
2868 const char * oldname;
2869 char * newname;
2870 rtx rtlname;
2871 tree idp;
2872
2873 rtlname = XEXP (DECL_RTL (decl), 0);
2874
2875 if (GET_CODE (rtlname) == MEM)
2876 rtlname = XEXP (rtlname, 0);
2877 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2878 oldname = XSTR (rtlname, 0);
2879
2880 if (mcore_dllexport_name_p (oldname))
2881 return; /* Already done. */
2882
2883 newname = XALLOCAVEC (char, strlen (oldname) + 4);
2884 sprintf (newname, "@e.%s", oldname);
2885
2886 /* We pass newname through get_identifier to ensure it has a unique
2887 address. RTL processing can sometimes peek inside the symbol ref
2888 and compare the string's addresses to see if two symbols are
2889 identical. */
2890 /* ??? At least I think that's why we do this. */
2891 idp = get_identifier (newname);
2892
2893 XEXP (DECL_RTL (decl), 0) =
2894 gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
2895 }
2896
2897 /* Mark a DECL as being dllimport'd. */
2898
2899 static void
2900 mcore_mark_dllimport (tree decl)
2901 {
2902 const char * oldname;
2903 char * newname;
2904 tree idp;
2905 rtx rtlname;
2906 rtx newrtl;
2907
2908 rtlname = XEXP (DECL_RTL (decl), 0);
2909
2910 if (GET_CODE (rtlname) == MEM)
2911 rtlname = XEXP (rtlname, 0);
2912 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2913 oldname = XSTR (rtlname, 0);
2914
2915 gcc_assert (!mcore_dllexport_name_p (oldname));
2916 if (mcore_dllimport_name_p (oldname))
2917 return; /* Already done. */
2918
2919 /* ??? One can well ask why we're making these checks here,
2920 and that would be a good question. */
2921
2922 /* Imported variables can't be initialized. */
2923 if (TREE_CODE (decl) == VAR_DECL
2924 && !DECL_VIRTUAL_P (decl)
2925 && DECL_INITIAL (decl))
2926 {
2927 error ("initialized variable %q+D is marked dllimport", decl);
2928 return;
2929 }
2930
2931 /* `extern' needn't be specified with dllimport.
2932 Specify `extern' now and hope for the best. Sigh. */
2933 if (TREE_CODE (decl) == VAR_DECL
2934 /* ??? Is this test for vtables needed? */
2935 && !DECL_VIRTUAL_P (decl))
2936 {
2937 DECL_EXTERNAL (decl) = 1;
2938 TREE_PUBLIC (decl) = 1;
2939 }
2940
2941 newname = XALLOCAVEC (char, strlen (oldname) + 11);
2942 sprintf (newname, "@i.__imp_%s", oldname);
2943
2944 /* We pass newname through get_identifier to ensure it has a unique
2945 address. RTL processing can sometimes peek inside the symbol ref
2946 and compare the string's addresses to see if two symbols are
2947 identical. */
2948 /* ??? At least I think that's why we do this. */
2949 idp = get_identifier (newname);
2950
2951 newrtl = gen_rtx_MEM (Pmode,
2952 gen_rtx_SYMBOL_REF (Pmode,
2953 IDENTIFIER_POINTER (idp)));
2954 XEXP (DECL_RTL (decl), 0) = newrtl;
2955 }
2956
2957 static int
2958 mcore_dllexport_p (tree decl)
2959 {
2960 if ( TREE_CODE (decl) != VAR_DECL
2961 && TREE_CODE (decl) != FUNCTION_DECL)
2962 return 0;
2963
2964 return lookup_attribute ("dllexport", DECL_ATTRIBUTES (decl)) != 0;
2965 }
2966
2967 static int
2968 mcore_dllimport_p (tree decl)
2969 {
2970 if ( TREE_CODE (decl) != VAR_DECL
2971 && TREE_CODE (decl) != FUNCTION_DECL)
2972 return 0;
2973
2974 return lookup_attribute ("dllimport", DECL_ATTRIBUTES (decl)) != 0;
2975 }
2976
2977 /* We must mark dll symbols specially. Definitions of dllexport'd objects
2978 install some info in the .drectve (PE) or .exports (ELF) sections. */
2979
2980 static void
2981 mcore_encode_section_info (tree decl, rtx rtl ATTRIBUTE_UNUSED, int first ATTRIBUTE_UNUSED)
2982 {
2983 /* Mark the decl so we can tell from the rtl whether the object is
2984 dllexport'd or dllimport'd. */
2985 if (mcore_dllexport_p (decl))
2986 mcore_mark_dllexport (decl);
2987 else if (mcore_dllimport_p (decl))
2988 mcore_mark_dllimport (decl);
2989
2990 /* It might be that DECL has already been marked as dllimport, but
2991 a subsequent definition nullified that. The attribute is gone
2992 but DECL_RTL still has @i.__imp_foo. We need to remove that. */
2993 else if ((TREE_CODE (decl) == FUNCTION_DECL
2994 || TREE_CODE (decl) == VAR_DECL)
2995 && DECL_RTL (decl) != NULL_RTX
2996 && GET_CODE (DECL_RTL (decl)) == MEM
2997 && GET_CODE (XEXP (DECL_RTL (decl), 0)) == MEM
2998 && GET_CODE (XEXP (XEXP (DECL_RTL (decl), 0), 0)) == SYMBOL_REF
2999 && mcore_dllimport_name_p (XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0)))
3000 {
3001 const char * oldname = XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0);
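/* Skip the 9 character "@i.__imp_" prefix to recover the symbol's
   original name.  */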
3002 tree idp = get_identifier (oldname + 9);
3003 rtx newrtl = gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
3004
3005 XEXP (DECL_RTL (decl), 0) = newrtl;
3006
3007 /* We previously set TREE_PUBLIC and DECL_EXTERNAL.
3008 ??? We leave these alone for now. */
3009 }
3010 }
3011
3012 /* Undo the effects of the above. */
3013
3014 static const char *
3015 mcore_strip_name_encoding (const char * str)
3016 {
3017 return str + (str[0] == '@' ? 3 : 0);
3018 }
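/* For example, "@e.foo" strips back to "foo", while "@i.__imp_foo"
   strips to "__imp_foo"; the "@?." encoding is always exactly three
   characters.  */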
3019
3020 /* MCore specific attribute support.
3021 dllexport - for exporting a function/variable that will live in a dll
3022 dllimport - for importing a function/variable from a dll
3023 naked - do not create a function prologue/epilogue. */
3024
3025 /* Handle a "naked" attribute; arguments as in
3026 struct attribute_spec.handler. */
3027
3028 static tree
3029 mcore_handle_naked_attribute (tree * node, tree name, tree args ATTRIBUTE_UNUSED,
3030 int flags ATTRIBUTE_UNUSED, bool * no_add_attrs)
3031 {
3032 if (TREE_CODE (*node) == FUNCTION_DECL)
3033 {
3034 /* PR14310 - don't complain about lack of return statement
3035 in naked functions. The solution here is a gross hack
3036 but this is the only way to solve the problem without
3037 adding a new feature to GCC. I did try submitting a patch
3038 that would add such a new feature, but it was (rightfully)
3039 rejected on the grounds that it was creeping featurism,
3040 hence this code. */
3041 if (warn_return_type)
3042 {
3043 saved_warn_return_type = warn_return_type;
3044 warn_return_type = 0;
3045 saved_warn_return_type_count = 2;
3046 }
3047 else if (saved_warn_return_type_count)
3048 saved_warn_return_type_count = 2;
3049 }
3050 else
3051 {
3052 warning (OPT_Wattributes, "%qE attribute only applies to functions",
3053 name);
3054 *no_add_attrs = true;
3055 }
3056
3057 return NULL_TREE;
3058 }
3059
3060 /* ??? It looks like this is PE specific? Oh well, this is what the
3061 old code did as well. */
3062
3063 static void
3064 mcore_unique_section (tree decl, int reloc ATTRIBUTE_UNUSED)
3065 {
3066 int len;
3067 const char * name;
3068 char * string;
3069 const char * prefix;
3070
3071 name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl));
3072
3073 /* Strip off any encoding in name. */
3074 name = (* targetm.strip_name_encoding) (name);
3075
3076 /* The object is put in, for example, section .text$foo.
3077 The linker will then ultimately place it in .text
3078 (everything from the $ on is stripped). */
3079 if (TREE_CODE (decl) == FUNCTION_DECL)
3080 prefix = ".text$";
3081 /* For compatibility with EPOC, we ignore the fact that the
3082 section might have relocs against it. */
3083 else if (decl_readonly_section (decl, 0))
3084 prefix = ".rdata$";
3085 else
3086 prefix = ".data$";
3087
3088 len = strlen (name) + strlen (prefix);
3089 string = XALLOCAVEC (char, len + 1);
3090
3091 sprintf (string, "%s%s", prefix, name);
3092
3093 DECL_SECTION_NAME (decl) = build_string (len, string);
3094 }
3095
3096 int
3097 mcore_naked_function_p (void)
3098 {
3099 return lookup_attribute ("naked", DECL_ATTRIBUTES (current_function_decl)) != NULL_TREE;
3100 }
3101
3102 #ifdef OBJECT_FORMAT_ELF
3103 static void
3104 mcore_asm_named_section (const char *name,
3105 unsigned int flags ATTRIBUTE_UNUSED,
3106 tree decl ATTRIBUTE_UNUSED)
3107 {
3108 fprintf (asm_out_file, "\t.section %s\n", name);
3109 }
3110 #endif /* OBJECT_FORMAT_ELF */
3111
3112 /* Worker function for TARGET_ASM_EXTERNAL_LIBCALL. */
3113
3114 static void
3115 mcore_external_libcall (rtx fun)
3116 {
3117 fprintf (asm_out_file, "\t.import\t");
3118 assemble_name (asm_out_file, XSTR (fun, 0));
3119 fprintf (asm_out_file, "\n");
3120 }
3121
3122 /* Worker function for TARGET_RETURN_IN_MEMORY. */
3123
3124 static bool
3125 mcore_return_in_memory (const_tree type, const_tree fntype ATTRIBUTE_UNUSED)
3126 {
3127 const HOST_WIDE_INT size = int_size_in_bytes (type);
3128 return (size == -1 || size > 2 * UNITS_PER_WORD);
3129 }
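/* In other words, assuming 4 byte words, aggregates larger than 8 bytes
   (2 * UNITS_PER_WORD) and values of variable size are returned in
   memory; anything smaller is returned in registers.  */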
3130
3131 /* Worker function for TARGET_ASM_TRAMPOLINE_TEMPLATE.
3132 Output assembler code for a block containing the constant parts
3133 of a trampoline, leaving space for the variable parts.
3134
3135 On the MCore, the trampoline looks like:
3136 lrw r1, function
3137 lrw r13, area
3138 jmp r13
3139 or r0, r0
3140 .literals */
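/* The four .short directives emitted below encode the instruction
   sequence shown above, and the two zero .long words are the literal
   slots: mcore_trampoline_init later stores the static chain value at
   offset 8 and the target function's address at offset 12.  */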
3141
3142 static void
3143 mcore_asm_trampoline_template (FILE *f)
3144 {
3145 fprintf (f, "\t.short 0x7102\n");
3146 fprintf (f, "\t.short 0x7d02\n");
3147 fprintf (f, "\t.short 0x00cd\n");
3148 fprintf (f, "\t.short 0x1e00\n");
3149 fprintf (f, "\t.long 0\n");
3150 fprintf (f, "\t.long 0\n");
3151 }
3152
3153 /* Worker function for TARGET_TRAMPOLINE_INIT. */
3154
3155 static void
3156 mcore_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value)
3157 {
3158 rtx fnaddr = XEXP (DECL_RTL (fndecl), 0);
3159 rtx mem;
3160
3161 emit_block_move (m_tramp, assemble_trampoline_template (),
3162 GEN_INT (2*UNITS_PER_WORD), BLOCK_OP_NORMAL);
3163
3164 mem = adjust_address (m_tramp, SImode, 8);
3165 emit_move_insn (mem, chain_value);
3166 mem = adjust_address (m_tramp, SImode, 12);
3167 emit_move_insn (mem, fnaddr);
3168 }