1 /* Output routines for Motorola MCore processor
2 Copyright (C) 1993-2015 Free Software Foundation, Inc.
3
4 This file is part of GCC.
5
6 GCC is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published
8 by the Free Software Foundation; either version 3, or (at your
9 option) any later version.
10
11 GCC is distributed in the hope that it will be useful, but WITHOUT
12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
14 License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
19
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "rtl.h"
25 #include "hash-set.h"
26 #include "machmode.h"
27 #include "vec.h"
28 #include "double-int.h"
29 #include "input.h"
30 #include "alias.h"
31 #include "symtab.h"
32 #include "wide-int.h"
33 #include "inchash.h"
34 #include "tree.h"
35 #include "fold-const.h"
36 #include "stor-layout.h"
37 #include "varasm.h"
38 #include "stringpool.h"
39 #include "calls.h"
40 #include "tm_p.h"
41 #include "mcore.h"
42 #include "regs.h"
43 #include "hard-reg-set.h"
44 #include "insn-config.h"
45 #include "conditions.h"
46 #include "output.h"
47 #include "insn-attr.h"
48 #include "flags.h"
49 #include "obstack.h"
50 #include "hashtab.h"
51 #include "function.h"
52 #include "statistics.h"
53 #include "real.h"
54 #include "fixed-value.h"
55 #include "expmed.h"
56 #include "dojump.h"
57 #include "explow.h"
58 #include "emit-rtl.h"
59 #include "stmt.h"
60 #include "expr.h"
61 #include "reload.h"
62 #include "recog.h"
63 #include "ggc.h"
64 #include "diagnostic-core.h"
65 #include "target.h"
66 #include "target-def.h"
67 #include "dominance.h"
68 #include "cfg.h"
69 #include "cfgrtl.h"
70 #include "cfganal.h"
71 #include "lcm.h"
72 #include "cfgbuild.h"
73 #include "cfgcleanup.h"
74 #include "predict.h"
75 #include "basic-block.h"
76 #include "df.h"
77 #include "builtins.h"
78
79 /* For dumping information about frame sizes. */
80 char * mcore_current_function_name = 0;
81 long mcore_current_compilation_timestamp = 0;
82
83 /* Global variables for machine-dependent things. */
84
85 /* Provides the class number of the smallest class containing
86 reg number. */
87 const enum reg_class regno_reg_class[FIRST_PSEUDO_REGISTER] =
88 {
89 GENERAL_REGS, ONLYR1_REGS, LRW_REGS, LRW_REGS,
90 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
91 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
92 LRW_REGS, LRW_REGS, LRW_REGS, GENERAL_REGS,
93 GENERAL_REGS, C_REGS, NO_REGS, NO_REGS,
94 };
95
96 struct mcore_frame
97 {
98 int arg_size; /* Stdarg spills (bytes). */
99 int reg_size; /* Non-volatile reg saves (bytes). */
100 int reg_mask; /* Non-volatile reg saves. */
101 int local_size; /* Locals. */
102 int outbound_size; /* Arg overflow on calls out. */
103 int pad_outbound;
104 int pad_local;
105 int pad_reg;
106 /* Describe the steps we'll use to grow it. */
107 #define MAX_STACK_GROWS 4 /* Gives us some spare space. */
108 int growth[MAX_STACK_GROWS];
109 int arg_offset;
110 int reg_offset;
111 int reg_growth;
112 int local_growth;
113 };
114
115 typedef enum
116 {
117 COND_NO,
118 COND_MOV_INSN,
119 COND_CLR_INSN,
120 COND_INC_INSN,
121 COND_DEC_INSN,
122 COND_BRANCH_INSN
123 }
124 cond_type;
125
126 static void output_stack_adjust (int, int);
127 static int calc_live_regs (int *);
128 static int try_constant_tricks (HOST_WIDE_INT, HOST_WIDE_INT *, HOST_WIDE_INT *);
129 static const char * output_inline_const (machine_mode, rtx *);
130 static void layout_mcore_frame (struct mcore_frame *);
131 static void mcore_setup_incoming_varargs (cumulative_args_t, machine_mode, tree, int *, int);
132 static cond_type is_cond_candidate (rtx);
133 static rtx_insn *emit_new_cond_insn (rtx, int);
134 static rtx_insn *conditionalize_block (rtx_insn *);
135 static void conditionalize_optimization (void);
136 static void mcore_reorg (void);
137 static rtx handle_structs_in_regs (machine_mode, const_tree, int);
138 static void mcore_mark_dllexport (tree);
139 static void mcore_mark_dllimport (tree);
140 static int mcore_dllexport_p (tree);
141 static int mcore_dllimport_p (tree);
142 static tree mcore_handle_naked_attribute (tree *, tree, tree, int, bool *);
143 #ifdef OBJECT_FORMAT_ELF
144 static void mcore_asm_named_section (const char *,
145 unsigned int, tree);
146 #endif
147 static void mcore_print_operand (FILE *, rtx, int);
148 static void mcore_print_operand_address (FILE *, rtx);
149 static bool mcore_print_operand_punct_valid_p (unsigned char code);
150 static void mcore_unique_section (tree, int);
151 static void mcore_encode_section_info (tree, rtx, int);
152 static const char *mcore_strip_name_encoding (const char *);
153 static int mcore_const_costs (rtx, RTX_CODE);
154 static int mcore_and_cost (rtx);
155 static int mcore_ior_cost (rtx);
156 static bool mcore_rtx_costs (rtx, int, int, int,
157 int *, bool);
158 static void mcore_external_libcall (rtx);
159 static bool mcore_return_in_memory (const_tree, const_tree);
160 static int mcore_arg_partial_bytes (cumulative_args_t,
161 machine_mode,
162 tree, bool);
163 static rtx mcore_function_arg (cumulative_args_t,
164 machine_mode,
165 const_tree, bool);
166 static void mcore_function_arg_advance (cumulative_args_t,
167 machine_mode,
168 const_tree, bool);
169 static unsigned int mcore_function_arg_boundary (machine_mode,
170 const_tree);
171 static void mcore_asm_trampoline_template (FILE *);
172 static void mcore_trampoline_init (rtx, tree, rtx);
173 static bool mcore_warn_func_return (tree);
174 static void mcore_option_override (void);
175 static bool mcore_legitimate_constant_p (machine_mode, rtx);
176 \f
177 /* MCore specific attributes. */
178
179 static const struct attribute_spec mcore_attribute_table[] =
180 {
181 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler,
182 affects_type_identity } */
183 { "dllexport", 0, 0, true, false, false, NULL, false },
184 { "dllimport", 0, 0, true, false, false, NULL, false },
185 { "naked", 0, 0, true, false, false, mcore_handle_naked_attribute,
186 false },
187 { NULL, 0, 0, false, false, false, NULL, false }
188 };
189 \f
190 /* Initialize the GCC target structure. */
191 #undef TARGET_ASM_EXTERNAL_LIBCALL
192 #define TARGET_ASM_EXTERNAL_LIBCALL mcore_external_libcall
193
194 #if TARGET_DLLIMPORT_DECL_ATTRIBUTES
195 #undef TARGET_MERGE_DECL_ATTRIBUTES
196 #define TARGET_MERGE_DECL_ATTRIBUTES merge_dllimport_decl_attributes
197 #endif
198
199 #ifdef OBJECT_FORMAT_ELF
200 #undef TARGET_ASM_UNALIGNED_HI_OP
201 #define TARGET_ASM_UNALIGNED_HI_OP "\t.short\t"
202 #undef TARGET_ASM_UNALIGNED_SI_OP
203 #define TARGET_ASM_UNALIGNED_SI_OP "\t.long\t"
204 #endif
205
206 #undef TARGET_PRINT_OPERAND
207 #define TARGET_PRINT_OPERAND mcore_print_operand
208 #undef TARGET_PRINT_OPERAND_ADDRESS
209 #define TARGET_PRINT_OPERAND_ADDRESS mcore_print_operand_address
210 #undef TARGET_PRINT_OPERAND_PUNCT_VALID_P
211 #define TARGET_PRINT_OPERAND_PUNCT_VALID_P mcore_print_operand_punct_valid_p
212
213 #undef TARGET_ATTRIBUTE_TABLE
214 #define TARGET_ATTRIBUTE_TABLE mcore_attribute_table
215 #undef TARGET_ASM_UNIQUE_SECTION
216 #define TARGET_ASM_UNIQUE_SECTION mcore_unique_section
217 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
218 #define TARGET_ASM_FUNCTION_RODATA_SECTION default_no_function_rodata_section
219 #undef TARGET_ENCODE_SECTION_INFO
220 #define TARGET_ENCODE_SECTION_INFO mcore_encode_section_info
221 #undef TARGET_STRIP_NAME_ENCODING
222 #define TARGET_STRIP_NAME_ENCODING mcore_strip_name_encoding
223 #undef TARGET_RTX_COSTS
224 #define TARGET_RTX_COSTS mcore_rtx_costs
225 #undef TARGET_ADDRESS_COST
226 #define TARGET_ADDRESS_COST hook_int_rtx_mode_as_bool_0
227 #undef TARGET_MACHINE_DEPENDENT_REORG
228 #define TARGET_MACHINE_DEPENDENT_REORG mcore_reorg
229
230 #undef TARGET_PROMOTE_FUNCTION_MODE
231 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
232 #undef TARGET_PROMOTE_PROTOTYPES
233 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
234
235 #undef TARGET_RETURN_IN_MEMORY
236 #define TARGET_RETURN_IN_MEMORY mcore_return_in_memory
237 #undef TARGET_MUST_PASS_IN_STACK
238 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
239 #undef TARGET_PASS_BY_REFERENCE
240 #define TARGET_PASS_BY_REFERENCE hook_pass_by_reference_must_pass_in_stack
241 #undef TARGET_ARG_PARTIAL_BYTES
242 #define TARGET_ARG_PARTIAL_BYTES mcore_arg_partial_bytes
243 #undef TARGET_FUNCTION_ARG
244 #define TARGET_FUNCTION_ARG mcore_function_arg
245 #undef TARGET_FUNCTION_ARG_ADVANCE
246 #define TARGET_FUNCTION_ARG_ADVANCE mcore_function_arg_advance
247 #undef TARGET_FUNCTION_ARG_BOUNDARY
248 #define TARGET_FUNCTION_ARG_BOUNDARY mcore_function_arg_boundary
249
250 #undef TARGET_SETUP_INCOMING_VARARGS
251 #define TARGET_SETUP_INCOMING_VARARGS mcore_setup_incoming_varargs
252
253 #undef TARGET_ASM_TRAMPOLINE_TEMPLATE
254 #define TARGET_ASM_TRAMPOLINE_TEMPLATE mcore_asm_trampoline_template
255 #undef TARGET_TRAMPOLINE_INIT
256 #define TARGET_TRAMPOLINE_INIT mcore_trampoline_init
257
258 #undef TARGET_OPTION_OVERRIDE
259 #define TARGET_OPTION_OVERRIDE mcore_option_override
260
261 #undef TARGET_LEGITIMATE_CONSTANT_P
262 #define TARGET_LEGITIMATE_CONSTANT_P mcore_legitimate_constant_p
263
264 #undef TARGET_WARN_FUNC_RETURN
265 #define TARGET_WARN_FUNC_RETURN mcore_warn_func_return
266
267 struct gcc_target targetm = TARGET_INITIALIZER;
268 \f
269 /* Adjust the stack by SIZE bytes in the direction given by DIRECTION
(negative grows the stack, probing incrementally for large adjustments). */
270 static void
271 output_stack_adjust (int direction, int size)
272 {
273 /* If extending stack a lot, we do it incrementally. */
274 if (direction < 0 && size > mcore_stack_increment && mcore_stack_increment > 0)
275 {
276 rtx tmp = gen_rtx_REG (SImode, 1);
277 rtx memref;
278
279 emit_insn (gen_movsi (tmp, GEN_INT (mcore_stack_increment)));
280 do
281 {
282 emit_insn (gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, tmp));
283 memref = gen_rtx_MEM (SImode, stack_pointer_rtx);
284 MEM_VOLATILE_P (memref) = 1;
285 emit_insn (gen_movsi (memref, stack_pointer_rtx));
286 size -= mcore_stack_increment;
287 }
288 while (size > mcore_stack_increment);
289
290 /* SIZE is now the residual for the last adjustment,
291 which doesn't require a probe. */
292 }
293
294 if (size)
295 {
296 rtx insn;
297 rtx val = GEN_INT (size);
298
299 if (size > 32)
300 {
301 rtx nval = gen_rtx_REG (SImode, 1);
302 emit_insn (gen_movsi (nval, val));
303 val = nval;
304 }
305
306 if (direction > 0)
307 insn = gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
308 else
309 insn = gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
310
311 emit_insn (insn);
312 }
313 }
314
315 /* Work out the registers which need to be saved,
316 both as a mask and a count. */
317
318 static int
319 calc_live_regs (int * count)
320 {
321 int reg;
322 int live_regs_mask = 0;
323
324 * count = 0;
325
326 for (reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
327 {
328 if (df_regs_ever_live_p (reg) && !call_used_regs[reg])
329 {
330 (*count)++;
331 live_regs_mask |= (1 << reg);
332 }
333 }
334
335 return live_regs_mask;
336 }
337
338 /* Print the operand address in x to the stream. */
339
340 static void
341 mcore_print_operand_address (FILE * stream, rtx x)
342 {
343 switch (GET_CODE (x))
344 {
345 case REG:
346 fprintf (stream, "(%s)", reg_names[REGNO (x)]);
347 break;
348
349 case PLUS:
350 {
351 rtx base = XEXP (x, 0);
352 rtx index = XEXP (x, 1);
353
354 if (GET_CODE (base) != REG)
355 {
356 /* Ensure that BASE is a register (one of them must be). */
357 rtx temp = base;
358 base = index;
359 index = temp;
360 }
361
362 switch (GET_CODE (index))
363 {
364 case CONST_INT:
365 fprintf (stream, "(%s," HOST_WIDE_INT_PRINT_DEC ")",
366 reg_names[REGNO(base)], INTVAL (index));
367 break;
368
369 default:
370 gcc_unreachable ();
371 }
372 }
373
374 break;
375
376 default:
377 output_addr_const (stream, x);
378 break;
379 }
380 }
381
382 static bool
383 mcore_print_operand_punct_valid_p (unsigned char code)
384 {
385 return (code == '.' || code == '#' || code == '*' || code == '^'
386 || code == '!');
387 }
388
389 /* Print operand x (an rtx) in assembler syntax to file stream
390 according to modifier code.
391
392 'R' print the next register or memory location along, i.e. the lsw in
393 a double word value
394 'O' print a constant without the #
395 'M' print a constant as its negative
396 'P' print log2 of a power of two
397 'Q' print log2 of an inverse of a power of two
398 'U' print register for ldm/stm instruction
399 'X' print byte number for xtrbN instruction
'N' print the width of a mask constant (log2 of the value + 1; 32 for -1)
'x' print a constant in hexadecimal. */
400
401 static void
402 mcore_print_operand (FILE * stream, rtx x, int code)
403 {
404 switch (code)
405 {
406 case 'N':
407 if (INTVAL(x) == -1)
408 fprintf (asm_out_file, "32");
409 else
410 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) + 1));
411 break;
412 case 'P':
413 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) & 0xffffffff));
414 break;
415 case 'Q':
416 fprintf (asm_out_file, "%d", exact_log2 (~INTVAL (x)));
417 break;
418 case 'O':
419 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, INTVAL (x));
420 break;
421 case 'M':
422 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, - INTVAL (x));
423 break;
424 case 'R':
425 /* Next location along in memory or register. */
426 switch (GET_CODE (x))
427 {
428 case REG:
429 fputs (reg_names[REGNO (x) + 1], (stream));
430 break;
431 case MEM:
432 mcore_print_operand_address
433 (stream, XEXP (adjust_address (x, SImode, 4), 0));
434 break;
435 default:
436 gcc_unreachable ();
437 }
438 break;
439 case 'U':
440 fprintf (asm_out_file, "%s-%s", reg_names[REGNO (x)],
441 reg_names[REGNO (x) + 3]);
442 break;
443 case 'x':
444 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_HEX, INTVAL (x));
445 break;
446 case 'X':
447 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, 3 - INTVAL (x) / 8);
448 break;
449
450 default:
451 switch (GET_CODE (x))
452 {
453 case REG:
454 fputs (reg_names[REGNO (x)], (stream));
455 break;
456 case MEM:
457 output_address (XEXP (x, 0));
458 break;
459 default:
460 output_addr_const (stream, x);
461 break;
462 }
463 break;
464 }
465 }
466
467 /* What does a constant cost? */
468
469 static int
470 mcore_const_costs (rtx exp, enum rtx_code code)
471 {
472 HOST_WIDE_INT val = INTVAL (exp);
473
474 /* Easy constants. */
475 if ( CONST_OK_FOR_I (val)
476 || CONST_OK_FOR_M (val)
477 || CONST_OK_FOR_N (val)
478 || (code == PLUS && CONST_OK_FOR_L (val)))
479 return 1;
480 else if (code == AND
481 && ( CONST_OK_FOR_M (~val)
482 || CONST_OK_FOR_N (~val)))
483 return 2;
484 else if (code == PLUS
485 && ( CONST_OK_FOR_I (-val)
486 || CONST_OK_FOR_M (-val)
487 || CONST_OK_FOR_N (-val)))
488 return 2;
489
490 return 5;
491 }
492
493 /* What does an AND instruction cost? We compute this because immediates
494 may have been relaxed, and we want CSE to commonize relaxed immediates
495 rather than emit bad code (multiple reloads of the same constant). */
496
497 static int
498 mcore_and_cost (rtx x)
499 {
500 HOST_WIDE_INT val;
501
502 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
503 return 2;
504
505 val = INTVAL (XEXP (x, 1));
506
507 /* Do it directly. */
508 if (CONST_OK_FOR_K (val) || CONST_OK_FOR_M (~val))
509 return 2;
510 /* Takes one instruction to load. */
511 else if (const_ok_for_mcore (val))
512 return 3;
513 /* Takes two instructions to load. */
514 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
515 return 4;
516
517 /* Takes a lrw to load. */
518 return 5;
519 }
520
521 /* What does an IOR cost? See mcore_and_cost(). */
522
523 static int
524 mcore_ior_cost (rtx x)
525 {
526 HOST_WIDE_INT val;
527
528 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
529 return 2;
530
531 val = INTVAL (XEXP (x, 1));
532
533 /* Do it directly with bclri. */
534 if (CONST_OK_FOR_M (val))
535 return 2;
536 /* Takes one instruction to load. */
537 else if (const_ok_for_mcore (val))
538 return 3;
539 /* Takes two instructions to load. */
540 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
541 return 4;
542
543 /* Takes a lrw to load. */
544 return 5;
545 }
546
547 static bool
548 mcore_rtx_costs (rtx x, int code, int outer_code, int opno ATTRIBUTE_UNUSED,
549 int * total, bool speed ATTRIBUTE_UNUSED)
550 {
551 switch (code)
552 {
553 case CONST_INT:
554 *total = mcore_const_costs (x, (enum rtx_code) outer_code);
555 return true;
556 case CONST:
557 case LABEL_REF:
558 case SYMBOL_REF:
559 *total = 5;
560 return true;
561 case CONST_DOUBLE:
562 *total = 10;
563 return true;
564
565 case AND:
566 *total = COSTS_N_INSNS (mcore_and_cost (x));
567 return true;
568
569 case IOR:
570 *total = COSTS_N_INSNS (mcore_ior_cost (x));
571 return true;
572
573 case DIV:
574 case UDIV:
575 case MOD:
576 case UMOD:
577 case FLOAT:
578 case FIX:
579 *total = COSTS_N_INSNS (100);
580 return true;
581
582 default:
583 return false;
584 }
585 }
586
587 /* Prepare the operands for a comparison. Return whether the branch/setcc
588 should use the inverted condition. */
589
590 bool
591 mcore_gen_compare (enum rtx_code code, rtx op0, rtx op1)
592 {
593 rtx cc_reg = gen_rtx_REG (CCmode, CC_REG);
594 bool invert;
595
596 if (GET_CODE (op1) == CONST_INT)
597 {
598 HOST_WIDE_INT val = INTVAL (op1);
599
600 switch (code)
601 {
602 case GTU:
603 /* Unsigned > 0 is the same as != 0; everything else is converted
604 below to LEU (reversed cmphs). */
605 if (val == 0)
606 code = NE;
607 break;
608
609 /* Check whether (LE A imm) can become (LT A imm + 1),
610 or (GT A imm) can become (GE A imm + 1). */
611 case GT:
612 case LE:
613 if (CONST_OK_FOR_J (val + 1))
614 {
615 op1 = GEN_INT (val + 1);
616 code = code == LE ? LT : GE;
617 }
618 break;
619
620 default:
621 break;
622 }
623 }
624
625 if (CONSTANT_P (op1) && GET_CODE (op1) != CONST_INT)
626 op1 = force_reg (SImode, op1);
627
628 /* cmpnei: 0-31 (K immediate)
629 cmplti: 1-32 (J immediate, 0 using btsti x,31). */
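/* For example, an EQ comparison against the constant 5 (within the K
   range) is emitted as a compare-not-equal against 5 with INVERT
   returned as true, so the caller uses the complemented condition.  */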
630 invert = false;
631 switch (code)
632 {
633 case EQ: /* Use inverted condition, cmpne. */
634 code = NE;
635 invert = true;
636 /* Drop through. */
637
638 case NE: /* Use normal condition, cmpne. */
639 if (GET_CODE (op1) == CONST_INT && ! CONST_OK_FOR_K (INTVAL (op1)))
640 op1 = force_reg (SImode, op1);
641 break;
642
643 case LE: /* Use inverted condition, reversed cmplt. */
644 code = GT;
645 invert = true;
646 /* Drop through. */
647
648 case GT: /* Use normal condition, reversed cmplt. */
649 if (GET_CODE (op1) == CONST_INT)
650 op1 = force_reg (SImode, op1);
651 break;
652
653 case GE: /* Use inverted condition, cmplt. */
654 code = LT;
655 invert = true;
656 /* Drop through. */
657
658 case LT: /* Use normal condition, cmplt. */
659 if (GET_CODE (op1) == CONST_INT &&
660 /* covered by btsti x,31. */
661 INTVAL (op1) != 0 &&
662 ! CONST_OK_FOR_J (INTVAL (op1)))
663 op1 = force_reg (SImode, op1);
664 break;
665
666 case GTU: /* Use inverted condition, cmple. */
667 /* We coped with unsigned > 0 above. */
668 gcc_assert (GET_CODE (op1) != CONST_INT || INTVAL (op1) != 0);
669 code = LEU;
670 invert = true;
671 /* Drop through. */
672
673 case LEU: /* Use normal condition, reversed cmphs. */
674 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
675 op1 = force_reg (SImode, op1);
676 break;
677
678 case LTU: /* Use inverted condition, cmphs. */
679 code = GEU;
680 invert = true;
681 /* Drop through. */
682
683 case GEU: /* Use normal condition, cmphs. */
684 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
685 op1 = force_reg (SImode, op1);
686 break;
687
688 default:
689 break;
690 }
691
692 emit_insn (gen_rtx_SET (cc_reg, gen_rtx_fmt_ee (code, CCmode, op0, op1)));
693 return invert;
694 }
695
696 int
697 mcore_symbolic_address_p (rtx x)
698 {
699 switch (GET_CODE (x))
700 {
701 case SYMBOL_REF:
702 case LABEL_REF:
703 return 1;
704 case CONST:
705 x = XEXP (x, 0);
706 return ( (GET_CODE (XEXP (x, 0)) == SYMBOL_REF
707 || GET_CODE (XEXP (x, 0)) == LABEL_REF)
708 && GET_CODE (XEXP (x, 1)) == CONST_INT);
709 default:
710 return 0;
711 }
712 }
713
714 /* Functions to output assembly code for a function call. */
715
716 char *
717 mcore_output_call (rtx operands[], int index)
718 {
719 static char buffer[20];
720 rtx addr = operands [index];
721
722 if (REG_P (addr))
723 {
724 if (TARGET_CG_DATA)
725 {
726 gcc_assert (mcore_current_function_name);
727
728 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
729 "unknown", 1);
730 }
731
732 sprintf (buffer, "jsr\t%%%d", index);
733 }
734 else
735 {
736 if (TARGET_CG_DATA)
737 {
738 gcc_assert (mcore_current_function_name);
739 gcc_assert (GET_CODE (addr) == SYMBOL_REF);
740
741 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
742 XSTR (addr, 0), 0);
743 }
744
745 sprintf (buffer, "jbsr\t%%%d", index);
746 }
747
748 return buffer;
749 }
750
751 /* Can we load a constant with a single instruction? */
752
753 int
754 const_ok_for_mcore (HOST_WIDE_INT value)
755 {
756 if (value >= 0 && value <= 127)
757 return 1;
758
759 /* Try exact power of two. */
760 if (CONST_OK_FOR_M (value))
761 return 1;
762
763 /* Try exact power of two - 1. */
764 if (CONST_OK_FOR_N (value) && value != -1)
765 return 1;
766
767 return 0;
768 }
769
770 /* Can we load a constant inline with up to 2 instructions? */
771
772 int
773 mcore_const_ok_for_inline (HOST_WIDE_INT value)
774 {
775 HOST_WIDE_INT x, y;
776
777 return try_constant_tricks (value, & x, & y) > 0;
778 }
779
780 /* Are we loading the constant using a 'not'? */
781
782 int
783 mcore_const_trick_uses_not (HOST_WIDE_INT value)
784 {
785 HOST_WIDE_INT x, y;
786
787 return try_constant_tricks (value, & x, & y) == 2;
788 }
789
790 /* Try tricks to load a constant inline and return the trick number if
791 success (0 is non-inlinable).
792
793 0: not inlinable
794 1: single instruction (do the usual thing)
795 2: single insn followed by a 'not'
796 3: single insn followed by an addi
797 4: single insn followed by a subi
798 5: single insn followed by rsubi
799 6: single insn followed by bseti
800 7: single insn followed by bclri
801 8: single insn followed by rotli
802 9: single insn followed by lsli
803 10: single insn followed by ixh
804 11: single insn followed by ixw. */
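/* For example (the multi-insn tricks assume TARGET_HARDLIT): 127 is
   loadable directly (trick 1); -128, whose complement is 127, becomes a
   movi of 127 followed by a not (trick 2); 130 becomes a load of 128 (a
   single bgeni) followed by an addi of 2 (trick 3).  */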
805
806 static int
807 try_constant_tricks (HOST_WIDE_INT value, HOST_WIDE_INT * x, HOST_WIDE_INT * y)
808 {
809 HOST_WIDE_INT i;
810 unsigned HOST_WIDE_INT bit, shf, rot;
811
812 if (const_ok_for_mcore (value))
813 return 1; /* Do the usual thing. */
814
815 if (! TARGET_HARDLIT)
816 return 0;
817
818 if (const_ok_for_mcore (~value))
819 {
820 *x = ~value;
821 return 2;
822 }
823
824 for (i = 1; i <= 32; i++)
825 {
826 if (const_ok_for_mcore (value - i))
827 {
828 *x = value - i;
829 *y = i;
830
831 return 3;
832 }
833
834 if (const_ok_for_mcore (value + i))
835 {
836 *x = value + i;
837 *y = i;
838
839 return 4;
840 }
841 }
842
843 bit = 0x80000000ULL;
844
845 for (i = 0; i <= 31; i++)
846 {
847 if (const_ok_for_mcore (i - value))
848 {
849 *x = i - value;
850 *y = i;
851
852 return 5;
853 }
854
855 if (const_ok_for_mcore (value & ~bit))
856 {
857 *y = bit;
858 *x = value & ~bit;
859 return 6;
860 }
861
862 if (const_ok_for_mcore (value | bit))
863 {
864 *y = ~bit;
865 *x = value | bit;
866
867 return 7;
868 }
869
870 bit >>= 1;
871 }
872
873 shf = value;
874 rot = value;
875
876 for (i = 1; i < 31; i++)
877 {
878 int c;
879
880 /* MCore has rotate left. */
881 c = rot << 31;
882 rot >>= 1;
883 rot &= 0x7FFFFFFF;
884 rot |= c; /* Simulate rotate. */
885
886 if (const_ok_for_mcore (rot))
887 {
888 *y = i;
889 *x = rot;
890
891 return 8;
892 }
893
894 if (shf & 1)
895 shf = 0; /* Can't use logical shift, low order bit is one. */
896
897 shf >>= 1;
898
899 if (shf != 0 && const_ok_for_mcore (shf))
900 {
901 *y = i;
902 *x = shf;
903
904 return 9;
905 }
906 }
907
908 if ((value % 3) == 0 && const_ok_for_mcore (value / 3))
909 {
910 *x = value / 3;
911
912 return 10;
913 }
914
915 if ((value % 5) == 0 && const_ok_for_mcore (value / 5))
916 {
917 *x = value / 5;
918
919 return 11;
920 }
921
922 return 0;
923 }
924
925 /* Check whether REG is dead at insn FIRST. This is done by searching ahead
926 for either the next use (i.e., REG is live), a death note, or a set of
927 REG. Don't just use dead_or_set_p() since reload does not always mark
928 deaths (especially if PRESERVE_DEATH_NOTES_REGNO_P is not defined). We
929 can ignore subregs by extracting the actual register. BRC */
930
931 int
932 mcore_is_dead (rtx_insn *first, rtx reg)
933 {
934 rtx_insn *insn;
935
936 /* For mcore, subregs can't live independently of their parent regs. */
937 if (GET_CODE (reg) == SUBREG)
938 reg = SUBREG_REG (reg);
939
940 /* Dies immediately. */
941 if (dead_or_set_p (first, reg))
942 return 1;
943
944 /* Look for conclusive evidence of live/death, otherwise we have
945 to assume that it is live. */
946 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
947 {
948 if (JUMP_P (insn))
949 return 0; /* We lose track, assume it is alive. */
950
951 else if (CALL_P (insn))
952 {
953 /* Calls might use it for the target or for register parms. */
954 if (reg_referenced_p (reg, PATTERN (insn))
955 || find_reg_fusage (insn, USE, reg))
956 return 0;
957 else if (dead_or_set_p (insn, reg))
958 return 1;
959 }
960 else if (NONJUMP_INSN_P (insn))
961 {
962 if (reg_referenced_p (reg, PATTERN (insn)))
963 return 0;
964 else if (dead_or_set_p (insn, reg))
965 return 1;
966 }
967 }
968
969 /* No conclusive evidence either way, we cannot take the chance
970 that control flow hid the use from us -- "I'm not dead yet". */
971 return 0;
972 }
973
974 /* Count the number of ones in mask. */
975
976 int
977 mcore_num_ones (HOST_WIDE_INT mask)
978 {
979 /* A trick to count set bits recently posted on comp.compilers. */
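/* Each step below sums adjacent bit fields in parallel: after the first
   line every 2-bit field holds the count of set bits it covers, after
   the second every 4-bit field does, and so on until the partial sums
   are folded into the final count.  */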
980 mask = (mask >> 1 & 0x55555555) + (mask & 0x55555555);
981 mask = ((mask >> 2) & 0x33333333) + (mask & 0x33333333);
982 mask = ((mask >> 4) + mask) & 0x0f0f0f0f;
983 mask = ((mask >> 8) + mask);
984
985 return (mask + (mask >> 16)) & 0xff;
986 }
987
988 /* Count the number of zeros in mask. */
989
990 int
991 mcore_num_zeros (HOST_WIDE_INT mask)
992 {
993 return 32 - mcore_num_ones (mask);
994 }
995
996 /* Determine byte being masked. */
997
998 int
999 mcore_byte_offset (unsigned int mask)
1000 {
1001 if (mask == 0x00ffffffL)
1002 return 0;
1003 else if (mask == 0xff00ffffL)
1004 return 1;
1005 else if (mask == 0xffff00ffL)
1006 return 2;
1007 else if (mask == 0xffffff00L)
1008 return 3;
1009
1010 return -1;
1011 }
1012
1013 /* Determine halfword being masked. */
1014
1015 int
1016 mcore_halfword_offset (unsigned int mask)
1017 {
1018 if (mask == 0x0000ffffL)
1019 return 0;
1020 else if (mask == 0xffff0000L)
1021 return 1;
1022
1023 return -1;
1024 }
1025
1026 /* Output a series of bseti's corresponding to mask. */
1027
1028 const char *
1029 mcore_output_bseti (rtx dst, int mask)
1030 {
1031 rtx out_operands[2];
1032 int bit;
1033
1034 out_operands[0] = dst;
1035
1036 for (bit = 0; bit < 32; bit++)
1037 {
1038 if ((mask & 0x1) == 0x1)
1039 {
1040 out_operands[1] = GEN_INT (bit);
1041
1042 output_asm_insn ("bseti\t%0,%1", out_operands);
1043 }
1044 mask >>= 1;
1045 }
1046
1047 return "";
1048 }
1049
1050 /* Output a series of bclri's corresponding to mask. */
1051
1052 const char *
1053 mcore_output_bclri (rtx dst, int mask)
1054 {
1055 rtx out_operands[2];
1056 int bit;
1057
1058 out_operands[0] = dst;
1059
1060 for (bit = 0; bit < 32; bit++)
1061 {
1062 if ((mask & 0x1) == 0x0)
1063 {
1064 out_operands[1] = GEN_INT (bit);
1065
1066 output_asm_insn ("bclri\t%0,%1", out_operands);
1067 }
1068
1069 mask >>= 1;
1070 }
1071
1072 return "";
1073 }
1074
1075 /* Output a conditional move of two constants that are within +/- 1 of
1076 each other. See the "movtK" patterns in mcore.md. I'm not sure this
1077 is really worth the effort. */
1078
1079 const char *
1080 mcore_output_cmov (rtx operands[], int cmp_t, const char * test)
1081 {
1082 HOST_WIDE_INT load_value;
1083 HOST_WIDE_INT adjust_value;
1084 rtx out_operands[4];
1085
1086 out_operands[0] = operands[0];
1087
1088 /* Check to see which constant is loadable. */
1089 if (const_ok_for_mcore (INTVAL (operands[1])))
1090 {
1091 out_operands[1] = operands[1];
1092 out_operands[2] = operands[2];
1093 }
1094 else if (const_ok_for_mcore (INTVAL (operands[2])))
1095 {
1096 out_operands[1] = operands[2];
1097 out_operands[2] = operands[1];
1098
1099 /* Complement test since constants are swapped. */
1100 cmp_t = (cmp_t == 0);
1101 }
1102 load_value = INTVAL (out_operands[1]);
1103 adjust_value = INTVAL (out_operands[2]);
1104
1105 /* First output the test if folded into the pattern. */
1106
1107 if (test)
1108 output_asm_insn (test, operands);
1109
1110 /* Load the constant - for now, only support constants that can be
1111 generated with a single instruction. Maybe add general inlinable
1112 constants later (this will increase the number of patterns since the
1113 instruction sequence has a different length attribute). */
1114 if (load_value >= 0 && load_value <= 127)
1115 output_asm_insn ("movi\t%0,%1", out_operands);
1116 else if (CONST_OK_FOR_M (load_value))
1117 output_asm_insn ("bgeni\t%0,%P1", out_operands);
1118 else if (CONST_OK_FOR_N (load_value))
1119 output_asm_insn ("bmaski\t%0,%N1", out_operands);
1120
1121 /* Output the constant adjustment. */
1122 if (load_value > adjust_value)
1123 {
1124 if (cmp_t)
1125 output_asm_insn ("decf\t%0", out_operands);
1126 else
1127 output_asm_insn ("dect\t%0", out_operands);
1128 }
1129 else
1130 {
1131 if (cmp_t)
1132 output_asm_insn ("incf\t%0", out_operands);
1133 else
1134 output_asm_insn ("inct\t%0", out_operands);
1135 }
1136
1137 return "";
1138 }
1139
1140 /* Outputs the peephole for moving a constant that gets not'ed followed
1141 by an and (i.e. combine the not and the and into andn). BRC */
1142
1143 const char *
1144 mcore_output_andn (rtx insn ATTRIBUTE_UNUSED, rtx operands[])
1145 {
1146 HOST_WIDE_INT x, y;
1147 rtx out_operands[3];
1148 const char * load_op;
1149 char buf[256];
1150 int trick_no;
1151
1152 trick_no = try_constant_tricks (INTVAL (operands[1]), &x, &y);
1153 gcc_assert (trick_no == 2);
1154
1155 out_operands[0] = operands[0];
1156 out_operands[1] = GEN_INT (x);
1157 out_operands[2] = operands[2];
1158
1159 if (x >= 0 && x <= 127)
1160 load_op = "movi\t%0,%1";
1161
1162 /* Try exact power of two. */
1163 else if (CONST_OK_FOR_M (x))
1164 load_op = "bgeni\t%0,%P1";
1165
1166 /* Try exact power of two - 1. */
1167 else if (CONST_OK_FOR_N (x))
1168 load_op = "bmaski\t%0,%N1";
1169
1170 else
1171 {
1172 load_op = "BADMOVI-andn\t%0, %1";
1173 gcc_unreachable ();
1174 }
1175
1176 sprintf (buf, "%s\n\tandn\t%%2,%%0", load_op);
1177 output_asm_insn (buf, out_operands);
1178
1179 return "";
1180 }
1181
1182 /* Output an inline constant. */
1183
1184 static const char *
1185 output_inline_const (machine_mode mode, rtx operands[])
1186 {
1187 HOST_WIDE_INT x = 0, y = 0;
1188 int trick_no;
1189 rtx out_operands[3];
1190 char buf[256];
1191 char load_op[256];
1192 const char *dst_fmt;
1193 HOST_WIDE_INT value;
1194
1195 value = INTVAL (operands[1]);
1196
1197 trick_no = try_constant_tricks (value, &x, &y);
1198 /* lrw's are handled separately: Large inlinable constants never get
1199 turned into lrw's. Our caller uses try_constant_tricks to back
1200 off to an lrw rather than calling this routine. */
1201 gcc_assert (trick_no != 0);
1202
1203 if (trick_no == 1)
1204 x = value;
1205
1206 /* operands: 0 = dst, 1 = load immed., 2 = immed. adjustment. */
1207 out_operands[0] = operands[0];
1208 out_operands[1] = GEN_INT (x);
1209
1210 if (trick_no > 2)
1211 out_operands[2] = GEN_INT (y);
1212
1213 /* Select dst format based on mode. */
1214 if (mode == DImode && (! TARGET_LITTLE_END))
1215 dst_fmt = "%R0";
1216 else
1217 dst_fmt = "%0";
1218
1219 if (x >= 0 && x <= 127)
1220 sprintf (load_op, "movi\t%s,%%1", dst_fmt);
1221
1222 /* Try exact power of two. */
1223 else if (CONST_OK_FOR_M (x))
1224 sprintf (load_op, "bgeni\t%s,%%P1", dst_fmt);
1225
1226 /* Try exact power of two - 1. */
1227 else if (CONST_OK_FOR_N (x))
1228 sprintf (load_op, "bmaski\t%s,%%N1", dst_fmt);
1229
1230 else
1231 {
1232 sprintf (load_op, "BADMOVI-inline_const %s, %%1", dst_fmt);
1233 gcc_unreachable ();
1234 }
1235
1236 switch (trick_no)
1237 {
1238 case 1:
1239 strcpy (buf, load_op);
1240 break;
1241 case 2: /* not */
1242 sprintf (buf, "%s\n\tnot\t%s\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1243 break;
1244 case 3: /* add */
1245 sprintf (buf, "%s\n\taddi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1246 break;
1247 case 4: /* sub */
1248 sprintf (buf, "%s\n\tsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1249 break;
1250 case 5: /* rsub */
1251 /* Never happens unless -mrsubi, see try_constant_tricks(). */
1252 sprintf (buf, "%s\n\trsubi\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1253 break;
1254 case 6: /* bseti */
1255 sprintf (buf, "%s\n\tbseti\t%s,%%P2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1256 break;
1257 case 7: /* bclr */
1258 sprintf (buf, "%s\n\tbclri\t%s,%%Q2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1259 break;
1260 case 8: /* rotl */
1261 sprintf (buf, "%s\n\trotli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1262 break;
1263 case 9: /* lsl */
1264 sprintf (buf, "%s\n\tlsli\t%s,%%2\t// %ld 0x%lx", load_op, dst_fmt, value, value);
1265 break;
1266 case 10: /* ixh */
1267 sprintf (buf, "%s\n\tixh\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1268 break;
1269 case 11: /* ixw */
1270 sprintf (buf, "%s\n\tixw\t%s,%s\t// %ld 0x%lx", load_op, dst_fmt, dst_fmt, value, value);
1271 break;
1272 default:
1273 return "";
1274 }
1275
1276 output_asm_insn (buf, out_operands);
1277
1278 return "";
1279 }
1280
1281 /* Output a move of a value that is one word or smaller. */
1282
1283 const char *
1284 mcore_output_move (rtx insn ATTRIBUTE_UNUSED, rtx operands[],
1285 machine_mode mode ATTRIBUTE_UNUSED)
1286 {
1287 rtx dst = operands[0];
1288 rtx src = operands[1];
1289
1290 if (GET_CODE (dst) == REG)
1291 {
1292 if (GET_CODE (src) == REG)
1293 {
1294 if (REGNO (src) == CC_REG) /* r-c */
1295 return "mvc\t%0";
1296 else
1297 return "mov\t%0,%1"; /* r-r*/
1298 }
1299 else if (GET_CODE (src) == MEM)
1300 {
1301 if (GET_CODE (XEXP (src, 0)) == LABEL_REF)
1302 return "lrw\t%0,[%1]"; /* a-R */
1303 else
1304 switch (GET_MODE (src)) /* r-m */
1305 {
1306 case SImode:
1307 return "ldw\t%0,%1";
1308 case HImode:
1309 return "ld.h\t%0,%1";
1310 case QImode:
1311 return "ld.b\t%0,%1";
1312 default:
1313 gcc_unreachable ();
1314 }
1315 }
1316 else if (GET_CODE (src) == CONST_INT)
1317 {
1318 HOST_WIDE_INT x, y;
1319
1320 if (CONST_OK_FOR_I (INTVAL (src))) /* r-I */
1321 return "movi\t%0,%1";
1322 else if (CONST_OK_FOR_M (INTVAL (src))) /* r-M */
1323 return "bgeni\t%0,%P1\t// %1 %x1";
1324 else if (CONST_OK_FOR_N (INTVAL (src))) /* r-N */
1325 return "bmaski\t%0,%N1\t// %1 %x1";
1326 else if (try_constant_tricks (INTVAL (src), &x, &y)) /* R-P */
1327 return output_inline_const (SImode, operands); /* 1-2 insns */
1328 else
1329 return "lrw\t%0,%x1\t// %1"; /* Get it from literal pool. */
1330 }
1331 else
1332 return "lrw\t%0, %1"; /* Into the literal pool. */
1333 }
1334 else if (GET_CODE (dst) == MEM) /* m-r */
1335 switch (GET_MODE (dst))
1336 {
1337 case SImode:
1338 return "stw\t%1,%0";
1339 case HImode:
1340 return "st.h\t%1,%0";
1341 case QImode:
1342 return "st.b\t%1,%0";
1343 default:
1344 gcc_unreachable ();
1345 }
1346
1347 gcc_unreachable ();
1348 }
1349
1350 /* Return a sequence of instructions to perform DI or DF move.
1351 Since the MCORE cannot move a DI or DF in one instruction, we have
1352 to take care when we see overlapping source and dest registers. */
1353
1354 const char *
1355 mcore_output_movedouble (rtx operands[], machine_mode mode ATTRIBUTE_UNUSED)
1356 {
1357 rtx dst = operands[0];
1358 rtx src = operands[1];
1359
1360 if (GET_CODE (dst) == REG)
1361 {
1362 if (GET_CODE (src) == REG)
1363 {
1364 int dstreg = REGNO (dst);
1365 int srcreg = REGNO (src);
1366
1367 /* Ensure the second source is not overwritten. */
1368 if (srcreg + 1 == dstreg)
1369 return "mov %R0,%R1\n\tmov %0,%1";
1370 else
1371 return "mov %0,%1\n\tmov %R0,%R1";
1372 }
1373 else if (GET_CODE (src) == MEM)
1374 {
1375 rtx memexp = XEXP (src, 0);
1376 int dstreg = REGNO (dst);
1377 int basereg = -1;
1378
1379 if (GET_CODE (memexp) == LABEL_REF)
1380 return "lrw\t%0,[%1]\n\tlrw\t%R0,[%R1]";
1381 else if (GET_CODE (memexp) == REG)
1382 basereg = REGNO (memexp);
1383 else if (GET_CODE (memexp) == PLUS)
1384 {
1385 if (GET_CODE (XEXP (memexp, 0)) == REG)
1386 basereg = REGNO (XEXP (memexp, 0));
1387 else if (GET_CODE (XEXP (memexp, 1)) == REG)
1388 basereg = REGNO (XEXP (memexp, 1));
1389 else
1390 gcc_unreachable ();
1391 }
1392 else
1393 gcc_unreachable ();
1394
1395 /* ??? length attribute is wrong here. */
1396 if (dstreg == basereg)
1397 {
1398 /* Just load them in reverse order. */
1399 return "ldw\t%R0,%R1\n\tldw\t%0,%1";
1400
1401 /* XXX: alternative: move basereg to basereg+1
1402 and then fall through. */
1403 }
1404 else
1405 return "ldw\t%0,%1\n\tldw\t%R0,%R1";
1406 }
1407 else if (GET_CODE (src) == CONST_INT)
1408 {
1409 if (TARGET_LITTLE_END)
1410 {
1411 if (CONST_OK_FOR_I (INTVAL (src)))
1412 output_asm_insn ("movi %0,%1", operands);
1413 else if (CONST_OK_FOR_M (INTVAL (src)))
1414 output_asm_insn ("bgeni %0,%P1", operands);
1415 else if (CONST_OK_FOR_N (INTVAL (src)))
1416 output_asm_insn ("bmaski %0,%N1", operands);
1417 else
1418 gcc_unreachable ();
1419
1420 if (INTVAL (src) < 0)
1421 return "bmaski %R0,32";
1422 else
1423 return "movi %R0,0";
1424 }
1425 else
1426 {
1427 if (CONST_OK_FOR_I (INTVAL (src)))
1428 output_asm_insn ("movi %R0,%1", operands);
1429 else if (CONST_OK_FOR_M (INTVAL (src)))
1430 output_asm_insn ("bgeni %R0,%P1", operands);
1431 else if (CONST_OK_FOR_N (INTVAL (src)))
1432 output_asm_insn ("bmaski %R0,%N1", operands);
1433 else
1434 gcc_unreachable ();
1435
1436 if (INTVAL (src) < 0)
1437 return "bmaski %0,32";
1438 else
1439 return "movi %0,0";
1440 }
1441 }
1442 else
1443 gcc_unreachable ();
1444 }
1445 else if (GET_CODE (dst) == MEM && GET_CODE (src) == REG)
1446 return "stw\t%1,%0\n\tstw\t%R1,%R0";
1447 else
1448 gcc_unreachable ();
1449 }
1450
1451 /* Predicates used by the templates. */
1452
1453 int
1454 mcore_arith_S_operand (rtx op)
1455 {
1456 if (GET_CODE (op) == CONST_INT && CONST_OK_FOR_M (~INTVAL (op)))
1457 return 1;
1458
1459 return 0;
1460 }
1461
1462 /* Expand insert bit field. BRC */
1463
1464 int
1465 mcore_expand_insv (rtx operands[])
1466 {
1467 int width = INTVAL (operands[1]);
1468 int posn = INTVAL (operands[2]);
1469 int mask;
1470 rtx mreg, sreg, ereg;
1471
1472 /* To get width 1 insv, the test in store_bit_field() (expmed.c, line 191)
1473 for width==1 must be removed. Look around line 368. This is something
1474 we really want the md part to do. */
1475 if (width == 1 && GET_CODE (operands[3]) == CONST_INT)
1476 {
1477 /* Do directly with bseti or bclri. */
1478 /* RBE: 2/97 consider only low bit of constant. */
1479 if ((INTVAL (operands[3]) & 1) == 0)
1480 {
1481 mask = ~(1 << posn);
1482 emit_insn (gen_rtx_SET (operands[0],
1483 gen_rtx_AND (SImode, operands[0],
1484 GEN_INT (mask))));
1485 }
1486 else
1487 {
1488 mask = 1 << posn;
1489 emit_insn (gen_rtx_SET (operands[0],
1490 gen_rtx_IOR (SImode, operands[0],
1491 GEN_INT (mask))));
1492 }
1493
1494 return 1;
1495 }
1496
1497 /* Look at some bit-field placements that we aren't interested
1498 in handling ourselves, unless specifically directed to do so. */
1499 if (! TARGET_W_FIELD)
1500 return 0; /* Generally, give up about now. */
1501
1502 if (width == 8 && posn % 8 == 0)
1503 /* Byte sized and aligned; let caller break it up. */
1504 return 0;
1505
1506 if (width == 16 && posn % 16 == 0)
1507 /* Short sized and aligned; let caller break it up. */
1508 return 0;
1509
1510 /* The general case - we can do this a little bit better than what the
1511 machine independent part tries. This will get rid of all the subregs
1512 that mess up constant folding in combine when working with relaxed
1513 immediates. */
1514
1515 /* If setting the entire field, do it directly. */
1516 if (GET_CODE (operands[3]) == CONST_INT
1517 && INTVAL (operands[3]) == ((1 << width) - 1))
1518 {
1519 mreg = force_reg (SImode, GEN_INT (INTVAL (operands[3]) << posn));
1520 emit_insn (gen_rtx_SET (operands[0],
1521 gen_rtx_IOR (SImode, operands[0], mreg)));
1522 return 1;
1523 }
1524
1525 /* Generate the clear mask. */
1526 mreg = force_reg (SImode, GEN_INT (~(((1 << width) - 1) << posn)));
1527
1528 /* Clear the field, to overlay it later with the source. */
1529 emit_insn (gen_rtx_SET (operands[0],
1530 gen_rtx_AND (SImode, operands[0], mreg)));
1531
1532 /* If the source is constant 0, we've nothing to add back. */
1533 if (GET_CODE (operands[3]) == CONST_INT && INTVAL (operands[3]) == 0)
1534 return 1;
1535
1536 /* XXX: Should we worry about more games with constant values?
1537 We've covered the high profile: set/clear single-bit and many-bit
1538 fields. How often do we see "arbitrary bit pattern" constants? */
1539 sreg = copy_to_mode_reg (SImode, operands[3]);
1540
1541 /* Extract src as same width as dst (needed for signed values). We
1542 always have to do this since we widen everything to SImode.
1543 We don't have to mask if we're shifting this up against the
1544 MSB of the register (i.e., the shift will push out any high-order
1545 bits). */
1546 if (width + posn != (int) GET_MODE_BITSIZE (SImode))
1547 {
1548 ereg = force_reg (SImode, GEN_INT ((1 << width) - 1));
1549 emit_insn (gen_rtx_SET (sreg, gen_rtx_AND (SImode, sreg, ereg)));
1550 }
1551
1552 /* Insert source value in dest. */
1553 if (posn != 0)
1554 emit_insn (gen_rtx_SET (sreg, gen_rtx_ASHIFT (SImode, sreg,
1555 GEN_INT (posn))));
1556
1557 emit_insn (gen_rtx_SET (operands[0],
1558 gen_rtx_IOR (SImode, operands[0], sreg)));
1559
1560 return 1;
1561 }
1562 \f
1563 /* ??? Block move stuff stolen from m88k. This code has not been
1564 verified for correctness. */
1565
1566 /* Emit code to perform a block move. Choose the best method.
1567
1568 OPERANDS[0] is the destination.
1569 OPERANDS[1] is the source.
1570 OPERANDS[2] is the size.
1571 OPERANDS[3] is the alignment safe to use. */
1572
1573 /* Emit code to perform a block move with an offset sequence of ldw/stw
1574 instructions (..., ldw 0, stw 1, ldw 1, stw 0, ...). SIZE and ALIGN are
1575 known constants. DST_MEM and SRC_MEM are the destination and source
1576 memory references. */
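/* For example, an 8-byte copy with 4-byte alignment goes through two
   temporaries in the interleaved order: load word 0, load word 4,
   store word 0, store word 4.  */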
1577
1578 static const machine_mode mode_from_align[] =
1579 {
1580 VOIDmode, QImode, HImode, VOIDmode, SImode,
1581 };
1582
1583 static void
1584 block_move_sequence (rtx dst_mem, rtx src_mem, int size, int align)
1585 {
1586 rtx temp[2];
1587 machine_mode mode[2];
1588 int amount[2];
1589 bool active[2];
1590 int phase = 0;
1591 int next;
1592 int offset_ld = 0;
1593 int offset_st = 0;
1594 rtx x;
1595
1596 x = XEXP (dst_mem, 0);
1597 if (!REG_P (x))
1598 {
1599 x = force_reg (Pmode, x);
1600 dst_mem = replace_equiv_address (dst_mem, x);
1601 }
1602
1603 x = XEXP (src_mem, 0);
1604 if (!REG_P (x))
1605 {
1606 x = force_reg (Pmode, x);
1607 src_mem = replace_equiv_address (src_mem, x);
1608 }
1609
1610 active[0] = active[1] = false;
1611
1612 do
1613 {
1614 next = phase;
1615 phase ^= 1;
1616
1617 if (size > 0)
1618 {
1619 int next_amount;
1620
1621 next_amount = (size >= 4 ? 4 : (size >= 2 ? 2 : 1));
1622 next_amount = MIN (next_amount, align);
1623
1624 amount[next] = next_amount;
1625 mode[next] = mode_from_align[next_amount];
1626 temp[next] = gen_reg_rtx (mode[next]);
1627
1628 x = adjust_address (src_mem, mode[next], offset_ld);
1629 emit_insn (gen_rtx_SET (temp[next], x));
1630
1631 offset_ld += next_amount;
1632 size -= next_amount;
1633 active[next] = true;
1634 }
1635
1636 if (active[phase])
1637 {
1638 active[phase] = false;
1639
1640 x = adjust_address (dst_mem, mode[phase], offset_st);
1641 emit_insn (gen_rtx_SET (x, temp[phase]));
1642
1643 offset_st += amount[phase];
1644 }
1645 }
1646 while (active[next]);
1647 }
1648
1649 bool
1650 mcore_expand_block_move (rtx *operands)
1651 {
1652 HOST_WIDE_INT align, bytes, max;
1653
1654 if (GET_CODE (operands[2]) != CONST_INT)
1655 return false;
1656
1657 bytes = INTVAL (operands[2]);
1658 align = INTVAL (operands[3]);
1659
1660 if (bytes <= 0)
1661 return false;
1662 if (align > 4)
1663 align = 4;
1664
1665 switch (align)
1666 {
1667 case 4:
1668 if (bytes & 1)
1669 max = 4*4;
1670 else if (bytes & 3)
1671 max = 8*4;
1672 else
1673 max = 16*4;
1674 break;
1675 case 2:
1676 max = 4*2;
1677 break;
1678 case 1:
1679 max = 4*1;
1680 break;
1681 default:
1682 gcc_unreachable ();
1683 }
1684
1685 if (bytes <= max)
1686 {
1687 block_move_sequence (operands[0], operands[1], bytes, align);
1688 return true;
1689 }
1690
1691 return false;
1692 }
1693 \f
1694
1695 /* Code to generate prologue and epilogue sequences. */
1696 static int number_of_regs_before_varargs;
1697
1698 /* Set by TARGET_SETUP_INCOMING_VARARGS to indicate to prolog that this is
1699 for a varargs function. */
1700 static int current_function_anonymous_args;
1701
1702 #define STACK_BYTES (STACK_BOUNDARY/BITS_PER_UNIT)
1703 #define STORE_REACH (64) /* Maximum displacement of a word store, + 4. */
1704 #define ADDI_REACH (32) /* Maximum addi operand. */
1705
1706 static void
1707 layout_mcore_frame (struct mcore_frame * infp)
1708 {
1709 int n;
1710 unsigned int i;
1711 int nbytes;
1712 int regarg;
1713 int localregarg;
1714 int outbounds;
1715 unsigned int growths;
1716 int step;
1717
1718 /* Might have to spill bytes to re-assemble a big argument that
1719 was passed partially in registers and partially on the stack. */
1720 nbytes = crtl->args.pretend_args_size;
1721
1722 /* Determine how much space for spilled anonymous args (e.g., stdarg). */
1723 if (current_function_anonymous_args)
1724 nbytes += (NPARM_REGS - number_of_regs_before_varargs) * UNITS_PER_WORD;
1725
1726 infp->arg_size = nbytes;
1727
1728 /* How much space we need to save the non-volatile registers we clobber. */
1729 infp->reg_mask = calc_live_regs (& n);
1730 infp->reg_size = n * 4;
1731
1732 /* And the rest of it... locals and space for overflowed outbounds. */
1733 infp->local_size = get_frame_size ();
1734 infp->outbound_size = crtl->outgoing_args_size;
1735
1736 /* Make sure we have a whole number of words for the locals. */
1737 if (infp->local_size % STACK_BYTES)
1738 infp->local_size = (infp->local_size + STACK_BYTES - 1) & ~ (STACK_BYTES -1);
1739
1740 /* The only thing we know we have to pad is the outbound space, since
1741 we've aligned our locals assuming that the base of locals is aligned. */
1742 infp->pad_local = 0;
1743 infp->pad_reg = 0;
1744 infp->pad_outbound = 0;
1745 if (infp->outbound_size % STACK_BYTES)
1746 infp->pad_outbound = STACK_BYTES - (infp->outbound_size % STACK_BYTES);
1747
1748 /* Now we see how we want to stage the prologue so that it does
1749 the most appropriate stack growth and register saves to either:
1750 (1) run fast,
1751 (2) reduce instruction space, or
1752 (3) reduce stack space. */
1753 for (i = 0; i < ARRAY_SIZE (infp->growth); i++)
1754 infp->growth[i] = 0;
1755
1756 regarg = infp->reg_size + infp->arg_size;
1757 localregarg = infp->local_size + regarg;
1758 outbounds = infp->outbound_size + infp->pad_outbound;
1759 growths = 0;
1760
1761 /* XXX: Consider one where we consider localregarg + outbound too! */
1762
1763 /* If the frame is <= 32 bytes and a stm would save <= 2 registers,
1764 use stw's with offsets and buy the frame in one shot. */
1765 if (localregarg <= ADDI_REACH
1766 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1767 {
1768 /* Make sure we'll be aligned. */
1769 if (localregarg % STACK_BYTES)
1770 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1771
1772 step = localregarg + infp->pad_reg;
1773 infp->reg_offset = infp->local_size;
1774
1775 if (outbounds + step <= ADDI_REACH && !frame_pointer_needed)
1776 {
1777 step += outbounds;
1778 infp->reg_offset += outbounds;
1779 outbounds = 0;
1780 }
1781
1782 infp->arg_offset = step - 4;
1783 infp->growth[growths++] = step;
1784 infp->reg_growth = growths;
1785 infp->local_growth = growths;
1786
1787 /* If we haven't already folded it in. */
1788 if (outbounds)
1789 infp->growth[growths++] = outbounds;
1790
1791 goto finish;
1792 }
1793
1794 /* Frame can't be done with a single subi, but can be done with 2
1795 insns. If the 'stm' is getting <= 2 registers, we use stw's and
1796 shift some of the stack purchase into the first subi, so both are
1797 single instructions. */
1798 if (localregarg <= STORE_REACH
1799 && (infp->local_size > ADDI_REACH)
1800 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1801 {
1802 int all;
1803
1804 /* Make sure we'll be aligned; use either pad_reg or pad_local. */
1805 if (localregarg % STACK_BYTES)
1806 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1807
1808 all = localregarg + infp->pad_reg + infp->pad_local;
1809 step = ADDI_REACH; /* As much up front as we can. */
1810 if (step > all)
1811 step = all;
1812
1813 /* XXX: Consider whether step will still be aligned; we believe so. */
1814 infp->arg_offset = step - 4;
1815 infp->growth[growths++] = step;
1816 infp->reg_growth = growths;
1817 infp->reg_offset = step - infp->pad_reg - infp->reg_size;
1818 all -= step;
1819
1820 /* Can we fold in any space required for outbounds? */
1821 if (outbounds + all <= ADDI_REACH && !frame_pointer_needed)
1822 {
1823 all += outbounds;
1824 outbounds = 0;
1825 }
1826
1827 /* Get the rest of the locals in place. */
1828 step = all;
1829 infp->growth[growths++] = step;
1830 infp->local_growth = growths;
1831 all -= step;
1832
1833 gcc_assert (all == 0);
1834
1835 /* Finish off if we need to do so. */
1836 if (outbounds)
1837 infp->growth[growths++] = outbounds;
1838
1839 goto finish;
1840 }
1841
1842 /* Registers + args is nicely aligned, so we'll buy that in one shot.
1843 Then we buy the rest of the frame in 1 or 2 steps depending on
1844 whether we need a frame pointer. */
1845 if ((regarg % STACK_BYTES) == 0)
1846 {
1847 infp->growth[growths++] = regarg;
1848 infp->reg_growth = growths;
1849 infp->arg_offset = regarg - 4;
1850 infp->reg_offset = 0;
1851
1852 if (infp->local_size % STACK_BYTES)
1853 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1854
1855 step = infp->local_size + infp->pad_local;
1856
1857 if (!frame_pointer_needed)
1858 {
1859 step += outbounds;
1860 outbounds = 0;
1861 }
1862
1863 infp->growth[growths++] = step;
1864 infp->local_growth = growths;
1865
1866 /* If there's any left to be done. */
1867 if (outbounds)
1868 infp->growth[growths++] = outbounds;
1869
1870 goto finish;
1871 }
1872
1873 /* XXX: optimizations that we'll want to play with....
1874 -- regarg is not aligned, but it's a small number of registers;
1875 use some of localsize so that regarg is aligned and then
1876 save the registers. */
1877
1878 /* Simple encoding; plods down the stack buying the pieces as it goes.
1879 -- does not optimize space consumption.
1880 -- does not attempt to optimize instruction counts.
1881 -- but it is safe for all alignments. */
1882 if (regarg % STACK_BYTES != 0)
1883 infp->pad_reg = STACK_BYTES - (regarg % STACK_BYTES);
1884
1885 infp->growth[growths++] = infp->arg_size + infp->reg_size + infp->pad_reg;
1886 infp->reg_growth = growths;
1887 infp->arg_offset = infp->growth[0] - 4;
1888 infp->reg_offset = 0;
1889
1890 if (frame_pointer_needed)
1891 {
1892 if (infp->local_size % STACK_BYTES != 0)
1893 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1894
1895 infp->growth[growths++] = infp->local_size + infp->pad_local;
1896 infp->local_growth = growths;
1897
1898 infp->growth[growths++] = outbounds;
1899 }
1900 else
1901 {
1902 if ((infp->local_size + outbounds) % STACK_BYTES != 0)
1903 infp->pad_local = STACK_BYTES - ((infp->local_size + outbounds) % STACK_BYTES);
1904
1905 infp->growth[growths++] = infp->local_size + infp->pad_local + outbounds;
1906 infp->local_growth = growths;
1907 }
1908
1909 /* Anything else that we've forgotten? Plus a few consistency checks. */
1910 finish:
1911 gcc_assert (infp->reg_offset >= 0);
1912 gcc_assert (growths <= MAX_STACK_GROWS);
1913
1914 for (i = 0; i < growths; i++)
1915 gcc_assert (!(infp->growth[i] % STACK_BYTES));
1916 }
1917
1918 /* Define the offset between two registers, one to be eliminated, and
1919 the other its replacement, at the start of a routine. */
1920
1921 int
1922 mcore_initial_elimination_offset (int from, int to)
1923 {
1924 int above_frame;
1925 int below_frame;
1926 struct mcore_frame fi;
1927
1928 layout_mcore_frame (& fi);
1929
1930 /* fp to ap */
1931 above_frame = fi.local_size + fi.pad_local + fi.reg_size + fi.pad_reg;
1932 /* sp to fp */
1933 below_frame = fi.outbound_size + fi.pad_outbound;
1934
1935 if (from == ARG_POINTER_REGNUM && to == FRAME_POINTER_REGNUM)
1936 return above_frame;
1937
1938 if (from == ARG_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1939 return above_frame + below_frame;
1940
1941 if (from == FRAME_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1942 return below_frame;
1943
1944 gcc_unreachable ();
1945 }
1946
1947 /* Keep track of some information about varargs for the prolog. */
1948
1949 static void
1950 mcore_setup_incoming_varargs (cumulative_args_t args_so_far_v,
1951 machine_mode mode, tree type,
1952 int * ptr_pretend_size ATTRIBUTE_UNUSED,
1953 int second_time ATTRIBUTE_UNUSED)
1954 {
1955 CUMULATIVE_ARGS *args_so_far = get_cumulative_args (args_so_far_v);
1956
1957 current_function_anonymous_args = 1;
1958
1959 /* We need to know how many argument registers are used before
1960 the varargs start, so that we can push the remaining argument
1961 registers during the prologue. */
1962 number_of_regs_before_varargs = *args_so_far + mcore_num_arg_regs (mode, type);
1963
1964 /* There is a bug somewhere in the arg handling code.
1965 Until I can find it this workaround always pushes the
1966 last named argument onto the stack. */
1967 number_of_regs_before_varargs = *args_so_far;
1968
1969 /* The last named argument may be split between argument registers
1970 and the stack. Allow for this here. */
1971 if (number_of_regs_before_varargs > NPARM_REGS)
1972 number_of_regs_before_varargs = NPARM_REGS;
1973 }
1974
1975 void
1976 mcore_expand_prolog (void)
1977 {
1978 struct mcore_frame fi;
1979 int space_allocated = 0;
1980 int growth = 0;
1981
1982 /* Find out what we're doing. */
1983 layout_mcore_frame (&fi);
1984
1985 space_allocated = fi.arg_size + fi.reg_size + fi.local_size +
1986 fi.outbound_size + fi.pad_outbound + fi.pad_local + fi.pad_reg;
1987
1988 if (TARGET_CG_DATA)
1989 {
1990 /* Emit a symbol for this routine's frame size. */
1991 rtx x;
1992
1993 x = DECL_RTL (current_function_decl);
1994
1995 gcc_assert (GET_CODE (x) == MEM);
1996
1997 x = XEXP (x, 0);
1998
1999 gcc_assert (GET_CODE (x) == SYMBOL_REF);
2000
2001 free (mcore_current_function_name);
2002
2003 mcore_current_function_name = xstrdup (XSTR (x, 0));
2004
2005 ASM_OUTPUT_CG_NODE (asm_out_file, mcore_current_function_name, space_allocated);
2006
2007 if (cfun->calls_alloca)
2008 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name, "alloca", 1);
2009
2010 /* 970425: RBE:
2011 We're looking at how the 8byte alignment affects stack layout
2012 and where we had to pad things. This emits information we can
2013 extract which tells us about frame sizes and the like. */
2014 fprintf (asm_out_file,
2015 "\t.equ\t__$frame$info$_%s_$_%d_%d_x%x_%d_%d_%d,0\n",
2016 mcore_current_function_name,
2017 fi.arg_size, fi.reg_size, fi.reg_mask,
2018 fi.local_size, fi.outbound_size,
2019 frame_pointer_needed);
2020 }
2021
2022 if (mcore_naked_function_p ())
2023 return;
2024
2025 /* Handle stdarg+regsaves in one shot: can't be more than 64 bytes. */
2026 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2027
2028 /* If we have a parameter passed partially in regs and partially in memory,
2029 the registers will have been stored to memory already in function.c. So
2030 we only need to do something here for varargs functions. */
2031 if (fi.arg_size != 0 && crtl->args.pretend_args_size == 0)
2032 {
2033 int offset;
2034 int rn = FIRST_PARM_REG + NPARM_REGS - 1;
2035 int remaining = fi.arg_size;
2036
2037 for (offset = fi.arg_offset; remaining >= 4; offset -= 4, rn--, remaining -= 4)
2038 {
2039 emit_insn (gen_movsi
2040 (gen_rtx_MEM (SImode,
2041 plus_constant (Pmode, stack_pointer_rtx,
2042 offset)),
2043 gen_rtx_REG (SImode, rn)));
2044 }
2045 }
2046
2047 /* Do we need another stack adjustment before we do the register saves? */
2048 if (growth < fi.reg_growth)
2049 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2050
2051 if (fi.reg_size != 0)
2052 {
2053 int i;
2054 int offs = fi.reg_offset;
2055
2056 for (i = 15; i >= 0; i--)
2057 {
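	  /* If the save area starts with a contiguous run of registers that
	     ends at r15 (both r14 and r15 appear in reg_mask), save the whole
	     run with a single store-multiple instead of individual stores. */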
2058 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2059 {
2060 int first_reg = 15;
2061
2062 while (fi.reg_mask & (1 << first_reg))
2063 first_reg--;
2064 first_reg++;
2065
2066 emit_insn (gen_store_multiple (gen_rtx_MEM (SImode, stack_pointer_rtx),
2067 gen_rtx_REG (SImode, first_reg),
2068 GEN_INT (16 - first_reg)));
2069
2070 i -= (15 - first_reg);
2071 offs += (16 - first_reg) * 4;
2072 }
2073 else if (fi.reg_mask & (1 << i))
2074 {
2075 emit_insn (gen_movsi
2076 (gen_rtx_MEM (SImode,
2077 plus_constant (Pmode, stack_pointer_rtx,
2078 offs)),
2079 gen_rtx_REG (SImode, i)));
2080 offs += 4;
2081 }
2082 }
2083 }
2084
2085 /* Figure the locals + outbounds. */
2086 if (frame_pointer_needed)
2087 {
2088 /* If we haven't already grown the stack up to where 'fp' will point. */
2089 if (growth < fi.local_growth)
2090 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2091
2092 emit_insn (gen_movsi (frame_pointer_rtx, stack_pointer_rtx));
2093
2094 /* ... and then go any remaining distance for outbounds, etc. */
2095 if (fi.growth[growth])
2096 output_stack_adjust (-1, fi.growth[growth++]);
2097 }
2098 else
2099 {
2100 if (growth < fi.local_growth)
2101 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2102 if (fi.growth[growth])
2103 output_stack_adjust (-1, fi.growth[growth++]);
2104 }
2105 }
2106
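/* Expand the epilogue: restore the stack pointer (directly from the frame
   pointer when one was used), reload the callee-saved registers that the
   prologue stored, and give back the remaining stack space. */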
2107 void
2108 mcore_expand_epilog (void)
2109 {
2110 struct mcore_frame fi;
2111 int i;
2112 int offs;
2113 int growth = MAX_STACK_GROWS - 1;
2114
2115
2116 /* Find out what we're doing. */
2117 layout_mcore_frame (&fi);
2118
2119 if (mcore_naked_function_p ())
2120 return;
2121
2122 /* If we had a frame pointer, restore the sp from that. */
2123 if (frame_pointer_needed)
2124 {
2125 emit_insn (gen_movsi (stack_pointer_rtx, frame_pointer_rtx));
2126 growth = fi.local_growth - 1;
2127 }
2128 else
2129 {
2130 /* XXX: this loop should accumulate the adjustments and release the stack in one step. */
2131 while (growth >= fi.local_growth)
2132 {
2133 if (fi.growth[growth] != 0)
2134 output_stack_adjust (1, fi.growth[growth]);
2135 growth--;
2136 }
2137 }
2138
2139 /* Make sure we've shrunk the stack back to the point where the registers
2140 were laid down. This is typically 0/1 iterations. Then pull the
2141 register save information back off the stack. */
2142 while (growth >= fi.reg_growth)
2143 output_stack_adjust (1, fi.growth[growth--]);
2144
2145 offs = fi.reg_offset;
2146
2147 for (i = 15; i >= 0; i--)
2148 {
2149 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2150 {
2151 int first_reg;
2152
2153 /* Find the starting register. */
2154 first_reg = 15;
2155
2156 while (fi.reg_mask & (1 << first_reg))
2157 first_reg--;
2158
2159 first_reg++;
2160
2161 emit_insn (gen_load_multiple (gen_rtx_REG (SImode, first_reg),
2162 gen_rtx_MEM (SImode, stack_pointer_rtx),
2163 GEN_INT (16 - first_reg)));
2164
2165 i -= (15 - first_reg);
2166 offs += (16 - first_reg) * 4;
2167 }
2168 else if (fi.reg_mask & (1 << i))
2169 {
2170 emit_insn (gen_movsi
2171 (gen_rtx_REG (SImode, i),
2172 gen_rtx_MEM (SImode,
2173 plus_constant (Pmode, stack_pointer_rtx,
2174 offs))));
2175 offs += 4;
2176 }
2177 }
2178
2179 /* Give back anything else. */
2180 /* XXX: Should accumulate total and then give it back. */
2181 while (growth >= 0)
2182 output_stack_adjust (1, fi.growth[growth--]);
2183 }
2184 \f
2185 /* This code is borrowed from the SH port. */
2186
2187 /* The MCORE cannot load a large constant into a register; constants have to
2188 come from a pc relative load. The reference of a pc relative load
2189 instruction must be less than 1k in front of the instruction. This
2190 means that we often have to dump a constant inside a function, and
2191 generate code to branch around it.
2192
2193 It is important to minimize this, since the branches will slow things
2194 down and make things bigger.
2195
2196 Worst case code looks like:
2197
2198 lrw L1,r0
2199 br L2
2200 align
2201 L1: .long value
2202 L2:
2203 ..
2204
2205 lrw L3,r0
2206 br L4
2207 align
2208 L3: .long value
2209 L4:
2210 ..
2211
2212 We fix this by performing a scan before scheduling, which notices which
2213 instructions need to have their operands fetched from the constant table
2214 and builds the table.
2215
2216 The algorithm is:
2217
2218 Scan to find an instruction which needs a pcrel move. Look forward and
2219 find the last barrier which is within MAX_COUNT bytes of the requirement.
2220 If there isn't one, make one. Process all the instructions between
2221 that point and the barrier.
2222
2223 In the above example, we can tell that L3 is within 1k of L1, so
2224 the first move can be shrunk from the 2 insn+constant sequence into
2225 just 1 insn, and the constant moved to L3 to make:
2226
2227 lrw L1,r0
2228 ..
2229 lrw L3,r0
2230 br L4
2231 align
2232 L3:.long value
2233 L4:.long value
2234
2235 Then the second move becomes the target for the shortening process. */
2236
2237 typedef struct
2238 {
2239 rtx value; /* Value in table. */
2240 rtx label; /* Label of value. */
2241 } pool_node;
2242
2243 /* The maximum number of constants that can fit into one pool, since
2244 the pc relative range is 0...1020 bytes and constants are at least 4
2245 bytes long. We subtract 4 from the range to allow for the case where
2246 we need to add a branch/align before the constant pool. */
2247
2248 #define MAX_COUNT 1016
2249 #define MAX_POOL_SIZE (MAX_COUNT/4)
2250 static pool_node pool_vector[MAX_POOL_SIZE];
2251 static int pool_size;
2252
2253 /* Dump out any constants accumulated in the final pass. These
2254 will only be labels. */
2255
2256 const char *
2257 mcore_output_jump_label_table (void)
2258 {
2259 int i;
2260
2261 if (pool_size)
2262 {
2263 fprintf (asm_out_file, "\t.align 2\n");
2264
2265 for (i = 0; i < pool_size; i++)
2266 {
2267 pool_node * p = pool_vector + i;
2268
2269 (*targetm.asm_out.internal_label) (asm_out_file, "L", CODE_LABEL_NUMBER (p->label));
2270
2271 output_asm_insn (".long %0", &p->value);
2272 }
2273
2274 pool_size = 0;
2275 }
2276
2277 return "";
2278 }
2279
2280 /* Check whether insn is a candidate for a conditional. */
2281
2282 static cond_type
2283 is_cond_candidate (rtx insn)
2284 {
2285 /* The only things we conditionalize are those that can be directly
2286 changed into a conditional. Only bother with SImode items. If
2287 we wanted to be a little more aggressive, we could also do other
2288 modes such as DImode with reg-reg move or load 0. */
2289 if (NONJUMP_INSN_P (insn))
2290 {
2291 rtx pat = PATTERN (insn);
2292 rtx src, dst;
2293
2294 if (GET_CODE (pat) != SET)
2295 return COND_NO;
2296
2297 dst = XEXP (pat, 0);
2298
2299 if ((GET_CODE (dst) != REG &&
2300 GET_CODE (dst) != SUBREG) ||
2301 GET_MODE (dst) != SImode)
2302 return COND_NO;
2303
2304 src = XEXP (pat, 1);
2305
2306 if ((GET_CODE (src) == REG ||
2307 (GET_CODE (src) == SUBREG &&
2308 GET_CODE (SUBREG_REG (src)) == REG)) &&
2309 GET_MODE (src) == SImode)
2310 return COND_MOV_INSN;
2311 else if (GET_CODE (src) == CONST_INT &&
2312 INTVAL (src) == 0)
2313 return COND_CLR_INSN;
2314 else if (GET_CODE (src) == PLUS &&
2315 (GET_CODE (XEXP (src, 0)) == REG ||
2316 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2317 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2318 GET_MODE (XEXP (src, 0)) == SImode &&
2319 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2320 INTVAL (XEXP (src, 1)) == 1)
2321 return COND_INC_INSN;
2322 else if (((GET_CODE (src) == MINUS &&
2323 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2324 INTVAL (XEXP (src, 1)) == 1) ||
2325 (GET_CODE (src) == PLUS &&
2326 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2327 INTVAL (XEXP (src, 1)) == -1)) &&
2328 (GET_CODE (XEXP (src, 0)) == REG ||
2329 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2330 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2331 GET_MODE (XEXP (src, 0)) == SImode)
2332 return COND_DEC_INSN;
2333
2334 /* Some insns that we don't bother with:
2335 (set (rx:DI) (ry:DI))
2336 (set (rx:DI) (const_int 0))
2337 */
2338
2339 }
2340 else if (JUMP_P (insn)
2341 && GET_CODE (PATTERN (insn)) == SET
2342 && GET_CODE (XEXP (PATTERN (insn), 1)) == LABEL_REF)
2343 return COND_BRANCH_INSN;
2344
2345 return COND_NO;
2346 }
2347
2348 /* Emit a conditional version of insn and replace the old insn with the
2349 new one. Return the new insn if emitted. */
2350
2351 static rtx_insn *
2352 emit_new_cond_insn (rtx insn, int cond)
2353 {
2354 rtx c_insn = 0;
2355 rtx pat, dst, src;
2356 cond_type num;
2357
2358 if ((num = is_cond_candidate (insn)) == COND_NO)
2359 return NULL;
2360
2361 pat = PATTERN (insn);
2362
2363 if (NONJUMP_INSN_P (insn))
2364 {
2365 dst = SET_DEST (pat);
2366 src = SET_SRC (pat);
2367 }
2368 else
2369 {
2370 dst = JUMP_LABEL (insn);
2371 src = NULL_RTX;
2372 }
2373
2374 switch (num)
2375 {
2376 case COND_MOV_INSN:
2377 case COND_CLR_INSN:
2378 if (cond)
2379 c_insn = gen_movt0 (dst, src, dst);
2380 else
2381 c_insn = gen_movt0 (dst, dst, src);
2382 break;
2383
2384 case COND_INC_INSN:
2385 if (cond)
2386 c_insn = gen_incscc (dst, dst);
2387 else
2388 c_insn = gen_incscc_false (dst, dst);
2389 break;
2390
2391 case COND_DEC_INSN:
2392 if (cond)
2393 c_insn = gen_decscc (dst, dst);
2394 else
2395 c_insn = gen_decscc_false (dst, dst);
2396 break;
2397
2398 case COND_BRANCH_INSN:
2399 if (cond)
2400 c_insn = gen_branch_true (dst);
2401 else
2402 c_insn = gen_branch_false (dst);
2403 break;
2404
2405 default:
2406 return NULL;
2407 }
2408
2409 /* Only copy the notes if they exist. */
2410 if (rtx_length [GET_CODE (c_insn)] >= 7 && rtx_length [GET_CODE (insn)] >= 7)
2411 {
2412 /* We really don't need to bother with the notes and links at this
2413 point, but go ahead and save the notes. This will help is_dead()
2414 when applying peepholes (links don't matter since they are not
2415 used any more beyond this point for the mcore). */
2416 REG_NOTES (c_insn) = REG_NOTES (insn);
2417 }
2418
2419 if (num == COND_BRANCH_INSN)
2420 {
2421 /* For jumps, we need to be a little bit careful and emit the new jump
2422 before the old one and to update the use count for the target label.
2423 This way, the barrier following the old (uncond) jump will get
2424 deleted, but the label won't. */
2425 c_insn = emit_jump_insn_before (c_insn, insn);
2426
2427 ++ LABEL_NUSES (dst);
2428
2429 JUMP_LABEL (c_insn) = dst;
2430 }
2431 else
2432 c_insn = emit_insn_after (c_insn, insn);
2433
2434 delete_insn (insn);
2435
2436 return as_a <rtx_insn *> (c_insn);
2437 }
2438
2439 /* Attempt to change a basic block into a series of conditional insns. This
2440 works by taking the branch at the end of the 1st block and scanning for the
2441 end of the 2nd block. If all instructions in the 2nd block have cond.
2442 versions and the label at the start of block 3 is the same as the target
2443 from the branch at block 1, then conditionalize all insns in block 2 using
2444 the inverse condition of the branch at block 1. (Note I'm bending the
2445 definition of basic block here.)
2446
2447 e.g., change:
2448
2449 bt L2 <-- end of block 1 (delete)
2450 mov r7,r8
2451 addu r7,1
2452 br L3 <-- end of block 2
2453
2454 L2: ... <-- start of block 3 (NUSES==1)
2455 L3: ...
2456
2457 to:
2458
2459 movf r7,r8
2460 incf r7
2461 bf L3
2462
2463 L3: ...
2464
2465 we can delete the L2 label if NUSES==1 and re-apply the optimization
2466 starting at the last instruction of block 2. This may allow an entire
2467 if-then-else statement to be conditionalized. BRC */
2468 static rtx_insn *
2469 conditionalize_block (rtx_insn *first)
2470 {
2471 rtx_insn *insn;
2472 rtx br_pat;
2473 rtx_insn *end_blk_1_br = 0;
2474 rtx_insn *end_blk_2_insn = 0;
2475 rtx_insn *start_blk_3_lab = 0;
2476 int cond;
2477 int br_lab_num;
2478 int blk_size = 0;
2479
2480
2481 /* Check that the first insn is a candidate conditional jump. This is
2482 the one that we'll eliminate. If not, advance to the next insn to
2483 try. */
2484 if (! JUMP_P (first)
2485 || GET_CODE (PATTERN (first)) != SET
2486 || GET_CODE (XEXP (PATTERN (first), 1)) != IF_THEN_ELSE)
2487 return NEXT_INSN (first);
2488
2489 /* Extract some information we need. */
2490 end_blk_1_br = first;
2491 br_pat = PATTERN (end_blk_1_br);
2492
2493 /* Complement the condition since we use the reverse cond. for the insns. */
2494 cond = (GET_CODE (XEXP (XEXP (br_pat, 1), 0)) == EQ);
2495
2496 /* Determine what kind of branch we have. */
2497 if (GET_CODE (XEXP (XEXP (br_pat, 1), 1)) == LABEL_REF)
2498 {
2499 /* A normal branch, so extract label out of first arm. */
2500 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 1), 0));
2501 }
2502 else
2503 {
2504 /* An inverse branch, so extract the label out of the 2nd arm
2505 and complement the condition. */
2506 cond = (cond == 0);
2507 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 2), 0));
2508 }
2509
2510 /* Scan forward for the start of block 2: it must start with a
2511 label and that label must be the same as the branch target
2512 label from block 1. We don't care about whether block 2 actually
2513 ends with a branch or a label (an uncond. branch is
2514 conditionalizable). */
2515 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
2516 {
2517 enum rtx_code code;
2518
2519 code = GET_CODE (insn);
2520
2521 /* Look for the label at the start of block 3. */
2522 if (code == CODE_LABEL && CODE_LABEL_NUMBER (insn) == br_lab_num)
2523 break;
2524
2525 /* Skip barriers, notes, and conditionalizable insns. If the
2526 insn is not conditionalizable or makes this optimization fail,
2527 just return the next insn so we can start over from that point. */
2528 if (code != BARRIER && code != NOTE && !is_cond_candidate (insn))
2529 return NEXT_INSN (insn);
2530
2531 /* Remember the last real insn before the label (i.e. end of block 2). */
2532 if (code == JUMP_INSN || code == INSN)
2533 {
2534 blk_size ++;
2535 end_blk_2_insn = insn;
2536 }
2537 }
2538
2539 if (!insn)
2540 return insn;
2541
2542 /* It is possible for this optimization to slow performance if the blocks
2543 are long. This really depends upon whether the branch is likely taken
2544 or not. If the branch is taken, we slow performance in many cases. But,
2545 if the branch is not taken, we always help performance (for a single
2546 block, but for a double block (i.e. when the optimization is re-applied)
2547 this is not true since the 'right thing' depends on the overall length of
2548 the collapsed block). As a compromise, don't apply this optimization on
2549 blocks larger than size 2 (unlikely for the mcore) when speed is important.
2550 The best threshold depends on the latencies of the instructions (i.e.,
2551 the branch penalty). */
2552 if (optimize > 1 && blk_size > 2)
2553 return insn;
2554
2555 /* At this point, we've found the start of block 3 and we know that
2556 it is the destination of the branch from block 1. Also, all
2557 instructions in block 2 are conditionalizable. So, apply the
2558 conditionalization and delete the branch. */
2559 start_blk_3_lab = insn;
2560
2561 for (insn = NEXT_INSN (end_blk_1_br); insn != start_blk_3_lab;
2562 insn = NEXT_INSN (insn))
2563 {
2564 rtx_insn *newinsn;
2565
2566 if (insn->deleted ())
2567 continue;
2568
2569 /* Try to form a conditional variant of the instruction and emit it. */
2570 if ((newinsn = emit_new_cond_insn (insn, cond)))
2571 {
2572 if (end_blk_2_insn == insn)
2573 end_blk_2_insn = newinsn;
2574
2575 insn = newinsn;
2576 }
2577 }
2578
2579 /* Note whether we will delete the label starting blk 3 when the jump
2580 gets deleted. If so, we want to re-apply this optimization at the
2581 last real instruction right before the label. */
2582 if (LABEL_NUSES (start_blk_3_lab) == 1)
2583 {
2584 start_blk_3_lab = 0;
2585 }
2586
2587 /* ??? We probably should redistribute the death notes for this insn, esp.
2588 the death of cc, but it doesn't really matter this late in the game.
2589 The peepholes all use is_dead() which will find the correct death
2590 regardless of whether there is a note. */
2591 delete_insn (end_blk_1_br);
2592
2593 if (! start_blk_3_lab)
2594 return end_blk_2_insn;
2595
2596 /* Return the insn right after the label at the start of block 3. */
2597 return NEXT_INSN (start_blk_3_lab);
2598 }
2599
2600 /* Apply the conditionalization of blocks optimization. This is the
2601 outer loop that traverses through the insns scanning for a branch
2602 that signifies an opportunity to apply the optimization. Note that
2603 this optimization is applied late. If we could apply it earlier,
2604 say before cse 2, it may expose more optimization opportunities,
2605 but the payback probably isn't really worth the effort (we'd have
2606 to update all reg/flow/notes/links/etc. to make it work, and stick it
2607 in before cse 2). */
2608
2609 static void
2610 conditionalize_optimization (void)
2611 {
2612 rtx_insn *insn;
2613
2614 for (insn = get_insns (); insn; insn = conditionalize_block (insn))
2615 continue;
2616 }
2617
2618 /* This is to handle loads from the constant pool. */
2619
2620 static void
2621 mcore_reorg (void)
2622 {
2623 /* Reset this variable. */
2624 current_function_anonymous_args = 0;
2625
2626 if (optimize == 0)
2627 return;
2628
2629 /* Conditionalize blocks where we can. */
2630 conditionalize_optimization ();
2631
2632 /* Literal pool generation is now pushed off until the assembler. */
2633 }
2634
2635 \f
2636 /* Return true if X is something that can be moved directly into r15. */
2637
2638 bool
2639 mcore_r15_operand_p (rtx x)
2640 {
2641 switch (GET_CODE (x))
2642 {
2643 case CONST_INT:
2644 return mcore_const_ok_for_inline (INTVAL (x));
2645
2646 case REG:
2647 case SUBREG:
2648 case MEM:
2649 return 1;
2650
2651 default:
2652 return 0;
2653 }
2654 }
2655
2656 /* Implement SECONDARY_RELOAD_CLASS. If RCLASS contains r15, and we can't
2657 directly move X into it, use r1-r14 as a temporary. */
2658
2659 enum reg_class
2660 mcore_secondary_reload_class (enum reg_class rclass,
2661 machine_mode mode ATTRIBUTE_UNUSED, rtx x)
2662 {
2663 if (TEST_HARD_REG_BIT (reg_class_contents[rclass], 15)
2664 && !mcore_r15_operand_p (x))
2665 return LRW_REGS;
2666 return NO_REGS;
2667 }
2668
2669 /* Return the reg_class to use when reloading the rtx X into the class
2670 RCLASS. If X is too complex to move directly into r15, prefer to
2671 use LRW_REGS instead. */
2672
2673 enum reg_class
2674 mcore_reload_class (rtx x, enum reg_class rclass)
2675 {
2676 if (reg_class_subset_p (LRW_REGS, rclass) && !mcore_r15_operand_p (x))
2677 return LRW_REGS;
2678
2679 return rclass;
2680 }
2681
2682 /* Return nonzero if a pair of reg/subreg rtxs actually refer to the same
2683 register. Note that the current version doesn't worry about whether
2684 they are the same mode or not (e.g., a QImode in r2 matches an HImode
2685 in r2 matches an SImode in r2). Might think in the future about whether
2686 we want to be able to say something about modes. */
2687
2688 int
2689 mcore_is_same_reg (rtx x, rtx y)
2690 {
2691 /* Strip any and all of the subreg wrappers. */
2692 while (GET_CODE (x) == SUBREG)
2693 x = SUBREG_REG (x);
2694
2695 while (GET_CODE (y) == SUBREG)
2696 y = SUBREG_REG (y);
2697
2698 if (GET_CODE (x) == REG && GET_CODE (y) == REG && REGNO (x) == REGNO (y))
2699 return 1;
2700
2701 return 0;
2702 }
2703
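/* Adjust the target flags once the options have been parsed.  Only the
   M340 supports little endian code, so asking for little endian forces
   the M340 flag on. */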
2704 static void
2705 mcore_option_override (void)
2706 {
2707 /* Only the m340 supports little endian code. */
2708 if (TARGET_LITTLE_END && ! TARGET_M340)
2709 target_flags |= MASK_M340;
2710 }
2711
2712 \f
2713 /* Compute the number of word sized registers needed to
2714 hold a function argument of mode MODE and type TYPE. */
2715
2716 int
2717 mcore_num_arg_regs (machine_mode mode, const_tree type)
2718 {
2719 int size;
2720
2721 if (targetm.calls.must_pass_in_stack (mode, type))
2722 return 0;
2723
2724 if (type && mode == BLKmode)
2725 size = int_size_in_bytes (type);
2726 else
2727 size = GET_MODE_SIZE (mode);
2728
2729 return ROUND_ADVANCE (size);
2730 }
2731
2732 static rtx
2733 handle_structs_in_regs (machine_mode mode, const_tree type, int reg)
2734 {
2735 int size;
2736
2737 /* The MCore ABI defines that a structure whose size is not a whole multiple
2738 of words is passed packed into registers (or spilled onto the stack if
2739 not enough registers are available) with the last few bytes of the
2740 structure being packed, left-justified, into the last register/stack slot.
2741 GCC handles this correctly if the last word is in a stack slot, but we
2742 have to generate a special, PARALLEL RTX if the last word is in an
2743 argument register. */
2744 if (type
2745 && TYPE_MODE (type) == BLKmode
2746 && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST
2747 && (size = int_size_in_bytes (type)) > UNITS_PER_WORD
2748 && (size % UNITS_PER_WORD != 0)
2749 && (reg + mcore_num_arg_regs (mode, type) <= (FIRST_PARM_REG + NPARM_REGS)))
2750 {
2751 rtx arg_regs [NPARM_REGS];
2752 int nregs;
2753 rtx result;
2754 rtvec rtvec;
2755
2756 for (nregs = 0; size > 0; size -= UNITS_PER_WORD)
2757 {
2758 arg_regs [nregs] =
2759 gen_rtx_EXPR_LIST (SImode, gen_rtx_REG (SImode, reg ++),
2760 GEN_INT (nregs * UNITS_PER_WORD));
2761 nregs ++;
2762 }
2763
2764 /* We assume here that NPARM_REGS == 6. The assert checks this. */
2765 gcc_assert (ARRAY_SIZE (arg_regs) == 6);
2766 rtvec = gen_rtvec (nregs, arg_regs[0], arg_regs[1], arg_regs[2],
2767 arg_regs[3], arg_regs[4], arg_regs[5]);
2768
2769 result = gen_rtx_PARALLEL (mode, rtvec);
2770 return result;
2771 }
2772
2773 return gen_rtx_REG (mode, reg);
2774 }
2775
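/* Return the RTX describing where a function result of type VALTYPE is
   returned.  FUNC is the function being compiled or called.  The result
   comes back in FIRST_RET_REG, in the promoted mode, possibly wrapped in
   a PARALLEL by handle_structs_in_regs. */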
2776 rtx
2777 mcore_function_value (const_tree valtype, const_tree func)
2778 {
2779 machine_mode mode;
2780 int unsigned_p;
2781
2782 mode = TYPE_MODE (valtype);
2783
2784 /* Since we promote return types, we must promote the mode here too. */
2785 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1);
2786
2787 return handle_structs_in_regs (mode, valtype, FIRST_RET_REG);
2788 }
2789
2790 /* Define where to put the arguments to a function.
2791 Value is zero to push the argument on the stack,
2792 or a hard register in which to store the argument.
2793
2794 MODE is the argument's machine mode.
2795 TYPE is the data type of the argument (as a tree).
2796 This is null for libcalls where that information may
2797 not be available.
2798 CUM is a variable of type CUMULATIVE_ARGS which gives info about
2799 the preceding args and about the function being called.
2800 NAMED is nonzero if this argument is a named parameter
2801 (otherwise it is an extra parameter matching an ellipsis).
2802
2803 On the MCore the first args are normally in registers
2804 and the rest are pushed. Any arg that starts within the first
2805 NPARM_REGS words is at least partially passed in a register unless
2806 its data type forbids. */
2807
2808 static rtx
2809 mcore_function_arg (cumulative_args_t cum, machine_mode mode,
2810 const_tree type, bool named)
2811 {
2812 int arg_reg;
2813
2814 if (! named || mode == VOIDmode)
2815 return 0;
2816
2817 if (targetm.calls.must_pass_in_stack (mode, type))
2818 return 0;
2819
2820 arg_reg = ROUND_REG (*get_cumulative_args (cum), mode);
2821
2822 if (arg_reg < NPARM_REGS)
2823 return handle_structs_in_regs (mode, type, FIRST_PARM_REG + arg_reg);
2824
2825 return 0;
2826 }
2827
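/* Advance the argument counter past an argument of mode MODE and type
   TYPE.  Only named arguments consume argument registers. */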
2828 static void
2829 mcore_function_arg_advance (cumulative_args_t cum_v, machine_mode mode,
2830 const_tree type, bool named)
2831 {
2832 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
2833
2834 *cum = (ROUND_REG (*cum, mode)
2835 + (int)named * mcore_num_arg_regs (mode, type));
2836 }
2837
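/* Return the boundary, in bits, on which an argument of mode MODE must
   be aligned when it is passed. */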
2838 static unsigned int
2839 mcore_function_arg_boundary (machine_mode mode,
2840 const_tree type ATTRIBUTE_UNUSED)
2841 {
2842 /* Doubles must be aligned to an 8 byte boundary. */
2843 return (mode != BLKmode && GET_MODE_SIZE (mode) == 8
2844 ? BIGGEST_ALIGNMENT
2845 : PARM_BOUNDARY);
2846 }
2847
2848 /* Returns the number of bytes of argument registers required to hold *part*
2849 of a parameter of machine mode MODE and type TYPE (which may be NULL if
2850 the type is not known). If the argument fits entirely in the argument
2851 registers, or entirely on the stack, then 0 is returned. CUM is the
2852 number of argument registers already used by earlier parameters to
2853 the function. */
2854
2855 static int
2856 mcore_arg_partial_bytes (cumulative_args_t cum, machine_mode mode,
2857 tree type, bool named)
2858 {
2859 int reg = ROUND_REG (*get_cumulative_args (cum), mode);
2860
2861 if (named == 0)
2862 return 0;
2863
2864 if (targetm.calls.must_pass_in_stack (mode, type))
2865 return 0;
2866
2867 /* REG is not the *hardware* register number of the register that holds
2868 the argument, it is the *argument* register number. So for example,
2869 the first argument to a function goes in argument register 0, which
2870 translates (for the MCore) into hardware register 2. The second
2871 argument goes into argument register 1, which translates into hardware
2872 register 3, and so on. NPARM_REGS is the number of argument registers
2873 supported by the target, not the maximum hardware register number of
2874 the target. */
2875 if (reg >= NPARM_REGS)
2876 return 0;
2877
2878 /* If the argument fits entirely in registers, return 0. */
2879 if (reg + mcore_num_arg_regs (mode, type) <= NPARM_REGS)
2880 return 0;
2881
2882 /* The argument overflows the number of available argument registers.
2883 Compute how many argument registers have not yet been assigned to
2884 hold an argument. */
2885 reg = NPARM_REGS - reg;
2886
2887 /* Return partially in registers and partially on the stack. */
2888 return reg * UNITS_PER_WORD;
2889 }
2890 \f
2891 /* Return nonzero if SYMBOL is marked as being dllexport'd. */
2892
2893 int
2894 mcore_dllexport_name_p (const char * symbol)
2895 {
2896 return symbol[0] == '@' && symbol[1] == 'e' && symbol[2] == '.';
2897 }
2898
2899 /* Return nonzero if SYMBOL is marked as being dllimport'd. */
2900
2901 int
2902 mcore_dllimport_name_p (const char * symbol)
2903 {
2904 return symbol[0] == '@' && symbol[1] == 'i' && symbol[2] == '.';
2905 }
2906
2907 /* Mark a DECL as being dllexport'd. */
2908
2909 static void
2910 mcore_mark_dllexport (tree decl)
2911 {
2912 const char * oldname;
2913 char * newname;
2914 rtx rtlname;
2915 tree idp;
2916
2917 rtlname = XEXP (DECL_RTL (decl), 0);
2918
2919 if (GET_CODE (rtlname) == MEM)
2920 rtlname = XEXP (rtlname, 0);
2921 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2922 oldname = XSTR (rtlname, 0);
2923
2924 if (mcore_dllexport_name_p (oldname))
2925 return; /* Already done. */
2926
2927 newname = XALLOCAVEC (char, strlen (oldname) + 4);
2928 sprintf (newname, "@e.%s", oldname);
2929
2930 /* We pass newname through get_identifier to ensure it has a unique
2931 address. RTL processing can sometimes peek inside the symbol ref
2932 and compare the string's addresses to see if two symbols are
2933 identical. */
2934 /* ??? At least I think that's why we do this. */
2935 idp = get_identifier (newname);
2936
2937 XEXP (DECL_RTL (decl), 0) =
2938 gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
2939 }
2940
2941 /* Mark a DECL as being dllimport'd. */
2942
2943 static void
2944 mcore_mark_dllimport (tree decl)
2945 {
2946 const char * oldname;
2947 char * newname;
2948 tree idp;
2949 rtx rtlname;
2950 rtx newrtl;
2951
2952 rtlname = XEXP (DECL_RTL (decl), 0);
2953
2954 if (GET_CODE (rtlname) == MEM)
2955 rtlname = XEXP (rtlname, 0);
2956 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2957 oldname = XSTR (rtlname, 0);
2958
2959 gcc_assert (!mcore_dllexport_name_p (oldname));
2960 if (mcore_dllimport_name_p (oldname))
2961 return; /* Already done. */
2962
2963 /* ??? One can well ask why we're making these checks here,
2964 and that would be a good question. */
2965
2966 /* Imported variables can't be initialized. */
2967 if (TREE_CODE (decl) == VAR_DECL
2968 && !DECL_VIRTUAL_P (decl)
2969 && DECL_INITIAL (decl))
2970 {
2971 error ("initialized variable %q+D is marked dllimport", decl);
2972 return;
2973 }
2974
2975 /* `extern' needn't be specified with dllimport.
2976 Specify `extern' now and hope for the best. Sigh. */
2977 if (TREE_CODE (decl) == VAR_DECL
2978 /* ??? Is this test for vtables needed? */
2979 && !DECL_VIRTUAL_P (decl))
2980 {
2981 DECL_EXTERNAL (decl) = 1;
2982 TREE_PUBLIC (decl) = 1;
2983 }
2984
2985 newname = XALLOCAVEC (char, strlen (oldname) + 11);
2986 sprintf (newname, "@i.__imp_%s", oldname);
2987
2988 /* We pass newname through get_identifier to ensure it has a unique
2989 address. RTL processing can sometimes peek inside the symbol ref
2990 and compare the string's addresses to see if two symbols are
2991 identical. */
2992 /* ??? At least I think that's why we do this. */
2993 idp = get_identifier (newname);
2994
2995 newrtl = gen_rtx_MEM (Pmode,
2996 gen_rtx_SYMBOL_REF (Pmode,
2997 IDENTIFIER_POINTER (idp)));
2998 XEXP (DECL_RTL (decl), 0) = newrtl;
2999 }
3000
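/* Return nonzero if DECL is a function or variable that carries the
   dllexport attribute. */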
3001 static int
3002 mcore_dllexport_p (tree decl)
3003 {
3004 if ( TREE_CODE (decl) != VAR_DECL
3005 && TREE_CODE (decl) != FUNCTION_DECL)
3006 return 0;
3007
3008 return lookup_attribute ("dllexport", DECL_ATTRIBUTES (decl)) != 0;
3009 }
3010
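/* Return nonzero if DECL is a function or variable that carries the
   dllimport attribute. */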
3011 static int
3012 mcore_dllimport_p (tree decl)
3013 {
3014 if ( TREE_CODE (decl) != VAR_DECL
3015 && TREE_CODE (decl) != FUNCTION_DECL)
3016 return 0;
3017
3018 return lookup_attribute ("dllimport", DECL_ATTRIBUTES (decl)) != 0;
3019 }
3020
3021 /* We must mark dll symbols specially. Definitions of dllexport'd objects
3022 install some info in the .drectve (PE) or .exports (ELF) sections. */
3023
3024 static void
3025 mcore_encode_section_info (tree decl, rtx rtl ATTRIBUTE_UNUSED, int first ATTRIBUTE_UNUSED)
3026 {
3027 /* Mark the decl so we can tell from the rtl whether the object is
3028 dllexport'd or dllimport'd. */
3029 if (mcore_dllexport_p (decl))
3030 mcore_mark_dllexport (decl);
3031 else if (mcore_dllimport_p (decl))
3032 mcore_mark_dllimport (decl);
3033
3034 /* It might be that DECL has already been marked as dllimport, but
3035 a subsequent definition nullified that. The attribute is gone
3036 but DECL_RTL still has @i.__imp_foo. We need to remove that. */
3037 else if ((TREE_CODE (decl) == FUNCTION_DECL
3038 || TREE_CODE (decl) == VAR_DECL)
3039 && DECL_RTL (decl) != NULL_RTX
3040 && GET_CODE (DECL_RTL (decl)) == MEM
3041 && GET_CODE (XEXP (DECL_RTL (decl), 0)) == MEM
3042 && GET_CODE (XEXP (XEXP (DECL_RTL (decl), 0), 0)) == SYMBOL_REF
3043 && mcore_dllimport_name_p (XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0)))
3044 {
3045 const char * oldname = XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0);
3046 tree idp = get_identifier (oldname + 9);
3047 rtx newrtl = gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
3048
3049 XEXP (DECL_RTL (decl), 0) = newrtl;
3050
3051 /* We previously set TREE_PUBLIC and DECL_EXTERNAL.
3052 ??? We leave these alone for now. */
3053 }
3054 }
3055
3056 /* Undo the effects of the above. */
3057
3058 static const char *
3059 mcore_strip_name_encoding (const char * str)
3060 {
3061 return str + (str[0] == '@' ? 3 : 0);
3062 }
3063
3064 /* MCore specific attribute support.
3065 dllexport - for exporting a function/variable that will live in a dll
3066 dllimport - for importing a function/variable from a dll
3067 naked - do not create a function prologue/epilogue. */
3068
3069 /* Handle a "naked" attribute; arguments as in
3070 struct attribute_spec.handler. */
3071
3072 static tree
3073 mcore_handle_naked_attribute (tree * node, tree name, tree args ATTRIBUTE_UNUSED,
3074 int flags ATTRIBUTE_UNUSED, bool * no_add_attrs)
3075 {
3076 if (TREE_CODE (*node) != FUNCTION_DECL)
3077 {
3078 warning (OPT_Wattributes, "%qE attribute only applies to functions",
3079 name);
3080 *no_add_attrs = true;
3081 }
3082
3083 return NULL_TREE;
3084 }
3085
3086 /* ??? It looks like this is PE specific? Oh well, this is what the
3087 old code did as well. */
3088
3089 static void
3090 mcore_unique_section (tree decl, int reloc ATTRIBUTE_UNUSED)
3091 {
3092 int len;
3093 const char * name;
3094 char * string;
3095 const char * prefix;
3096
3097 name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl));
3098
3099 /* Strip off any encoding in name. */
3100 name = (* targetm.strip_name_encoding) (name);
3101
3102 /* The object is put in, for example, section .text$foo.
3103 The linker will then ultimately place it in .text
3104 (everything from the $ on is stripped). */
3105 if (TREE_CODE (decl) == FUNCTION_DECL)
3106 prefix = ".text$";
3107 /* For compatibility with EPOC, we ignore the fact that the
3108 section might have relocs against it. */
3109 else if (decl_readonly_section (decl, 0))
3110 prefix = ".rdata$";
3111 else
3112 prefix = ".data$";
3113
3114 len = strlen (name) + strlen (prefix);
3115 string = XALLOCAVEC (char, len + 1);
3116
3117 sprintf (string, "%s%s", prefix, name);
3118
3119 set_decl_section_name (decl, string);
3120 }
3121
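/* Return nonzero if the current function carries the naked attribute,
   in which case no prologue or epilogue is generated for it. */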
3122 int
3123 mcore_naked_function_p (void)
3124 {
3125 return lookup_attribute ("naked", DECL_ATTRIBUTES (current_function_decl)) != NULL_TREE;
3126 }
3127
3128 static bool
3129 mcore_warn_func_return (tree decl)
3130 {
3131 /* Naked functions are implemented entirely in assembly, including the
3132 return sequence, so suppress warnings about this. */
3133 return lookup_attribute ("naked", DECL_ATTRIBUTES (decl)) == NULL_TREE;
3134 }
3135
3136 #ifdef OBJECT_FORMAT_ELF
3137 static void
3138 mcore_asm_named_section (const char *name,
3139 unsigned int flags ATTRIBUTE_UNUSED,
3140 tree decl ATTRIBUTE_UNUSED)
3141 {
3142 fprintf (asm_out_file, "\t.section %s\n", name);
3143 }
3144 #endif /* OBJECT_FORMAT_ELF */
3145
3146 /* Worker function for TARGET_ASM_EXTERNAL_LIBCALL. */
3147
3148 static void
3149 mcore_external_libcall (rtx fun)
3150 {
3151 fprintf (asm_out_file, "\t.import\t");
3152 assemble_name (asm_out_file, XSTR (fun, 0));
3153 fprintf (asm_out_file, "\n");
3154 }
3155
3156 /* Worker function for TARGET_RETURN_IN_MEMORY. */
3157
3158 static bool
3159 mcore_return_in_memory (const_tree type, const_tree fntype ATTRIBUTE_UNUSED)
3160 {
3161 const HOST_WIDE_INT size = int_size_in_bytes (type);
3162 return (size == -1 || size > 2 * UNITS_PER_WORD);
3163 }
3164
3165 /* Worker function for TARGET_ASM_TRAMPOLINE_TEMPLATE.
3166 Output assembler code for a block containing the constant parts
3167 of a trampoline, leaving space for the variable parts.
3168
3169 On the MCore, the trampoline looks like:
3170 lrw r1, function
3171 lrw r13, area
3172 jmp r13
3173 or r0, r0
3174 .literals */
3175
3176 static void
3177 mcore_asm_trampoline_template (FILE *f)
3178 {
3179 fprintf (f, "\t.short 0x7102\n");
3180 fprintf (f, "\t.short 0x7d02\n");
3181 fprintf (f, "\t.short 0x00cd\n");
3182 fprintf (f, "\t.short 0x1e00\n");
3183 fprintf (f, "\t.long 0\n");
3184 fprintf (f, "\t.long 0\n");
3185 }
3186
3187 /* Worker function for TARGET_TRAMPOLINE_INIT. */
3188
3189 static void
3190 mcore_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value)
3191 {
3192 rtx fnaddr = XEXP (DECL_RTL (fndecl), 0);
3193 rtx mem;
3194
3195 emit_block_move (m_tramp, assemble_trampoline_template (),
3196 GEN_INT (2*UNITS_PER_WORD), BLOCK_OP_NORMAL);
3197
3198 mem = adjust_address (m_tramp, SImode, 8);
3199 emit_move_insn (mem, chain_value);
3200 mem = adjust_address (m_tramp, SImode, 12);
3201 emit_move_insn (mem, fnaddr);
3202 }
3203
3204 /* Implement TARGET_LEGITIMATE_CONSTANT_P
3205
3206 On the MCore, allow anything but a double. */
3207
3208 static bool
3209 mcore_legitimate_constant_p (machine_mode mode ATTRIBUTE_UNUSED, rtx x)
3210 {
3211 return GET_CODE (x) != CONST_DOUBLE;
3212 }