1 /* Output routines for Motorola MCore processor
2 Copyright (C) 1993, 1999, 2000, 2001, 2002, 2003, 2004, 2005
3 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published
9 by the Free Software Foundation; either version 2, or (at your
10 option) any later version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT
13 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
14 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
15 License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to
19 the Free Software Foundation, 51 Franklin Street, Fifth Floor,
20 Boston, MA 02110-1301, USA. */
21
22 #include "config.h"
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
26 #include "rtl.h"
27 #include "tree.h"
28 #include "tm_p.h"
29 #include "assert.h"
30 #include "mcore.h"
31 #include "regs.h"
32 #include "hard-reg-set.h"
33 #include "real.h"
34 #include "insn-config.h"
35 #include "conditions.h"
36 #include "output.h"
37 #include "insn-attr.h"
38 #include "flags.h"
39 #include "obstack.h"
40 #include "expr.h"
41 #include "reload.h"
42 #include "recog.h"
43 #include "function.h"
44 #include "ggc.h"
45 #include "toplev.h"
46 #include "target.h"
47 #include "target-def.h"
48
49 /* Maximum size we are allowed to grow the stack in a single operation.
50 If we want more, we must do it in increments of at most this size.
51 If this value is 0, we don't check at all. */
52 int mcore_stack_increment = STACK_UNITS_MAXSTEP;
53
54 /* For dumping information about frame sizes. */
55 char * mcore_current_function_name = 0;
56 long mcore_current_compilation_timestamp = 0;
57
58 /* Global variables for machine-dependent things. */
59
60 /* Saved operands from the last compare to use when we generate an scc
61 or bcc insn. */
62 rtx arch_compare_op0;
63 rtx arch_compare_op1;
64
65 /* Provides the class number of the smallest class containing
66 reg number. */
67 const int regno_reg_class[FIRST_PSEUDO_REGISTER] =
68 {
69 GENERAL_REGS, ONLYR1_REGS, LRW_REGS, LRW_REGS,
70 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
71 LRW_REGS, LRW_REGS, LRW_REGS, LRW_REGS,
72 LRW_REGS, LRW_REGS, LRW_REGS, GENERAL_REGS,
73 GENERAL_REGS, C_REGS, NO_REGS, NO_REGS,
74 };
75
76 /* Provide reg_class from a letter such as appears in the machine
77 description. */
78 const enum reg_class reg_class_from_letter[] =
79 {
80 /* a */ LRW_REGS, /* b */ ONLYR1_REGS, /* c */ C_REGS, /* d */ NO_REGS,
81 /* e */ NO_REGS, /* f */ NO_REGS, /* g */ NO_REGS, /* h */ NO_REGS,
82 /* i */ NO_REGS, /* j */ NO_REGS, /* k */ NO_REGS, /* l */ NO_REGS,
83 /* m */ NO_REGS, /* n */ NO_REGS, /* o */ NO_REGS, /* p */ NO_REGS,
84 /* q */ NO_REGS, /* r */ GENERAL_REGS, /* s */ NO_REGS, /* t */ NO_REGS,
85 /* u */ NO_REGS, /* v */ NO_REGS, /* w */ NO_REGS, /* x */ ALL_REGS,
86 /* y */ NO_REGS, /* z */ NO_REGS
87 };
88
89 struct mcore_frame
90 {
91 int arg_size; /* Stdarg spills (bytes). */
92 int reg_size; /* Non-volatile reg saves (bytes). */
93 int reg_mask; /* Non-volatile reg saves. */
94 int local_size; /* Locals. */
95 int outbound_size; /* Arg overflow on calls out. */
96 int pad_outbound;
97 int pad_local;
98 int pad_reg;
99 /* Describe the steps we'll use to grow it. */
100 #define MAX_STACK_GROWS 4 /* Gives us some spare space. */
101 int growth[MAX_STACK_GROWS];
102 int arg_offset;
103 int reg_offset;
104 int reg_growth;
105 int local_growth;
106 };
107
108 typedef enum
109 {
110 COND_NO,
111 COND_MOV_INSN,
112 COND_CLR_INSN,
113 COND_INC_INSN,
114 COND_DEC_INSN,
115 COND_BRANCH_INSN
116 }
117 cond_type;
118
119 static void output_stack_adjust (int, int);
120 static int calc_live_regs (int *);
121 static int try_constant_tricks (long, int *, int *);
122 static const char * output_inline_const (enum machine_mode, rtx *);
123 static void layout_mcore_frame (struct mcore_frame *);
124 static void mcore_setup_incoming_varargs (CUMULATIVE_ARGS *, enum machine_mode, tree, int *, int);
125 static cond_type is_cond_candidate (rtx);
126 static rtx emit_new_cond_insn (rtx, int);
127 static rtx conditionalize_block (rtx);
128 static void conditionalize_optimization (void);
129 static void mcore_reorg (void);
130 static rtx handle_structs_in_regs (enum machine_mode, tree, int);
131 static void mcore_mark_dllexport (tree);
132 static void mcore_mark_dllimport (tree);
133 static int mcore_dllexport_p (tree);
134 static int mcore_dllimport_p (tree);
135 const struct attribute_spec mcore_attribute_table[];
136 static tree mcore_handle_naked_attribute (tree *, tree, tree, int, bool *);
137 #ifdef OBJECT_FORMAT_ELF
138 static void mcore_asm_named_section (const char *,
139 unsigned int, tree);
140 #endif
141 static void mcore_unique_section (tree, int);
142 static void mcore_encode_section_info (tree, rtx, int);
143 static const char *mcore_strip_name_encoding (const char *);
144 static int mcore_const_costs (rtx, RTX_CODE);
145 static int mcore_and_cost (rtx);
146 static int mcore_ior_cost (rtx);
147 static bool mcore_rtx_costs (rtx, int, int, int *);
148 static void mcore_external_libcall (rtx);
149 static bool mcore_return_in_memory (tree, tree);
150 static int mcore_arg_partial_bytes (CUMULATIVE_ARGS *,
151 enum machine_mode,
152 tree, bool);
153
154 \f
155 /* Initialize the GCC target structure. */
156 #undef TARGET_ASM_EXTERNAL_LIBCALL
157 #define TARGET_ASM_EXTERNAL_LIBCALL mcore_external_libcall
158
159 #if TARGET_DLLIMPORT_DECL_ATTRIBUTES
160 #undef TARGET_MERGE_DECL_ATTRIBUTES
161 #define TARGET_MERGE_DECL_ATTRIBUTES merge_dllimport_decl_attributes
162 #endif
163
164 #ifdef OBJECT_FORMAT_ELF
165 #undef TARGET_ASM_UNALIGNED_HI_OP
166 #define TARGET_ASM_UNALIGNED_HI_OP "\t.short\t"
167 #undef TARGET_ASM_UNALIGNED_SI_OP
168 #define TARGET_ASM_UNALIGNED_SI_OP "\t.long\t"
169 #endif
170
171 #undef TARGET_ATTRIBUTE_TABLE
172 #define TARGET_ATTRIBUTE_TABLE mcore_attribute_table
173 #undef TARGET_ASM_UNIQUE_SECTION
174 #define TARGET_ASM_UNIQUE_SECTION mcore_unique_section
175 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
176 #define TARGET_ASM_FUNCTION_RODATA_SECTION default_no_function_rodata_section
177 #undef TARGET_DEFAULT_TARGET_FLAGS
178 #define TARGET_DEFAULT_TARGET_FLAGS TARGET_DEFAULT
179 #undef TARGET_ENCODE_SECTION_INFO
180 #define TARGET_ENCODE_SECTION_INFO mcore_encode_section_info
181 #undef TARGET_STRIP_NAME_ENCODING
182 #define TARGET_STRIP_NAME_ENCODING mcore_strip_name_encoding
183 #undef TARGET_RTX_COSTS
184 #define TARGET_RTX_COSTS mcore_rtx_costs
185 #undef TARGET_ADDRESS_COST
186 #define TARGET_ADDRESS_COST hook_int_rtx_0
187 #undef TARGET_MACHINE_DEPENDENT_REORG
188 #define TARGET_MACHINE_DEPENDENT_REORG mcore_reorg
189
190 #undef TARGET_PROMOTE_FUNCTION_ARGS
191 #define TARGET_PROMOTE_FUNCTION_ARGS hook_bool_tree_true
192 #undef TARGET_PROMOTE_FUNCTION_RETURN
193 #define TARGET_PROMOTE_FUNCTION_RETURN hook_bool_tree_true
194 #undef TARGET_PROMOTE_PROTOTYPES
195 #define TARGET_PROMOTE_PROTOTYPES hook_bool_tree_true
196
197 #undef TARGET_RETURN_IN_MEMORY
198 #define TARGET_RETURN_IN_MEMORY mcore_return_in_memory
199 #undef TARGET_MUST_PASS_IN_STACK
200 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
201 #undef TARGET_PASS_BY_REFERENCE
202 #define TARGET_PASS_BY_REFERENCE hook_pass_by_reference_must_pass_in_stack
203 #undef TARGET_ARG_PARTIAL_BYTES
204 #define TARGET_ARG_PARTIAL_BYTES mcore_arg_partial_bytes
205
206 #undef TARGET_SETUP_INCOMING_VARARGS
207 #define TARGET_SETUP_INCOMING_VARARGS mcore_setup_incoming_varargs
208
209 struct gcc_target targetm = TARGET_INITIALIZER;
210 \f
211 /* Emit insns to adjust the stack by SIZE bytes in the given DIRECTION.  */
212 static void
213 output_stack_adjust (int direction, int size)
214 {
215 /* If extending stack a lot, we do it incrementally. */
216 if (direction < 0 && size > mcore_stack_increment && mcore_stack_increment > 0)
217 {
218 rtx tmp = gen_rtx_REG (SImode, 1);
219 rtx memref;
220
221 emit_insn (gen_movsi (tmp, GEN_INT (mcore_stack_increment)));
222 do
223 {
224 emit_insn (gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, tmp));
225 memref = gen_rtx_MEM (SImode, stack_pointer_rtx);
226 MEM_VOLATILE_P (memref) = 1;
227 emit_insn (gen_movsi (memref, stack_pointer_rtx));
228 size -= mcore_stack_increment;
229 }
230 while (size > mcore_stack_increment);
231
232 /* SIZE is now the residual for the last adjustment,
233 which doesn't require a probe. */
234 }
235
236 if (size)
237 {
238 rtx insn;
239 rtx val = GEN_INT (size);
240
241 if (size > 32)
242 {
243 rtx nval = gen_rtx_REG (SImode, 1);
244 emit_insn (gen_movsi (nval, val));
245 val = nval;
246 }
247
248 if (direction > 0)
249 insn = gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
250 else
251 insn = gen_subsi3 (stack_pointer_rtx, stack_pointer_rtx, val);
252
253 emit_insn (insn);
254 }
255 }
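
/* Illustrative sketch (not part of the original source): assuming the stack
   increment is 4096 bytes, output_stack_adjust (-1, 9000) emits RTL along
   the lines of
       r1 = 4096
       sp = sp - r1 ; *(sp) = sp    (probe the newly allocated region)
       sp = sp - r1 ; *(sp) = sp    (probe again)
       r1 = 808
       sp = sp - r1                 (residual adjustment, no probe)
   while adjustments of 32 bytes or less keep the constant in the add/sub
   insn itself instead of going through r1.  */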
256
257 /* Work out the registers which need to be saved,
258 both as a mask and a count. */
259
260 static int
261 calc_live_regs (int * count)
262 {
263 int reg;
264 int live_regs_mask = 0;
265
266 * count = 0;
267
268 for (reg = 0; reg < FIRST_PSEUDO_REGISTER; reg++)
269 {
270 if (regs_ever_live[reg] && !call_used_regs[reg])
271 {
272 (*count)++;
273 live_regs_mask |= (1 << reg);
274 }
275 }
276
277 return live_regs_mask;
278 }
279
280 /* Print the operand address in X to STREAM.  */
281
282 void
283 mcore_print_operand_address (FILE * stream, rtx x)
284 {
285 switch (GET_CODE (x))
286 {
287 case REG:
288 fprintf (stream, "(%s)", reg_names[REGNO (x)]);
289 break;
290
291 case PLUS:
292 {
293 rtx base = XEXP (x, 0);
294 rtx index = XEXP (x, 1);
295
296 if (GET_CODE (base) != REG)
297 {
298 /* Ensure that BASE is a register (one of them must be). */
299 rtx temp = base;
300 base = index;
301 index = temp;
302 }
303
304 switch (GET_CODE (index))
305 {
306 case CONST_INT:
307 fprintf (stream, "(%s," HOST_WIDE_INT_PRINT_DEC ")",
308 reg_names[REGNO(base)], INTVAL (index));
309 break;
310
311 default:
312 gcc_unreachable ();
313 }
314 }
315
316 break;
317
318 default:
319 output_addr_const (stream, x);
320 break;
321 }
322 }
323
324 /* Print operand X (an rtx) in assembler syntax to file STREAM
325 according to modifier CODE.
326
327 'R' print the next register or memory location along, i.e. the lsw in
328 a double word value
'N' print the log2 of one more than a constant, or 32 if the constant is -1
329 'O' print a constant without the #
330 'M' print a constant as its negative
331 'P' print log2 of a power of two
332 'Q' print log2 of an inverse of a power of two
333 'U' print register range for ldm/stm instructions
'x' print a constant in hexadecimal
334 'X' print byte number for xtrbN instruction. */
335
336 void
337 mcore_print_operand (FILE * stream, rtx x, int code)
338 {
339 switch (code)
340 {
341 case 'N':
342 if (INTVAL(x) == -1)
343 fprintf (asm_out_file, "32");
344 else
345 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x) + 1));
346 break;
347 case 'P':
348 fprintf (asm_out_file, "%d", exact_log2 (INTVAL (x)));
349 break;
350 case 'Q':
351 fprintf (asm_out_file, "%d", exact_log2 (~INTVAL (x)));
352 break;
353 case 'O':
354 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, INTVAL (x));
355 break;
356 case 'M':
357 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, - INTVAL (x));
358 break;
359 case 'R':
360 /* Next location along in memory or register. */
361 switch (GET_CODE (x))
362 {
363 case REG:
364 fputs (reg_names[REGNO (x) + 1], (stream));
365 break;
366 case MEM:
367 mcore_print_operand_address
368 (stream, XEXP (adjust_address (x, SImode, 4), 0));
369 break;
370 default:
371 gcc_unreachable ();
372 }
373 break;
374 case 'U':
375 fprintf (asm_out_file, "%s-%s", reg_names[REGNO (x)],
376 reg_names[REGNO (x) + 3]);
377 break;
378 case 'x':
379 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_HEX, INTVAL (x));
380 break;
381 case 'X':
382 fprintf (asm_out_file, HOST_WIDE_INT_PRINT_DEC, 3 - INTVAL (x) / 8);
383 break;
384
385 default:
386 switch (GET_CODE (x))
387 {
388 case REG:
389 fputs (reg_names[REGNO (x)], (stream));
390 break;
391 case MEM:
392 output_address (XEXP (x, 0));
393 break;
394 default:
395 output_addr_const (stream, x);
396 break;
397 }
398 break;
399 }
400 }
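
/* For example, given (const_int 64): %P prints 6, %O prints 64, %M prints
   -64 and %x prints 0x40.  Given (const_int 63), %N prints 6 (log2 of 63+1),
   and given (const_int 16), %X prints 1 (the byte selected by xtrb).  For a
   register operand r4, %U prints "r4-r7" and %R prints r5.  */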
401
402 /* What does a constant cost?  */
403
404 static int
405 mcore_const_costs (rtx exp, enum rtx_code code)
406 {
407 int val = INTVAL (exp);
408
409 /* Easy constants. */
410 if ( CONST_OK_FOR_I (val)
411 || CONST_OK_FOR_M (val)
412 || CONST_OK_FOR_N (val)
413 || (code == PLUS && CONST_OK_FOR_L (val)))
414 return 1;
415 else if (code == AND
416 && ( CONST_OK_FOR_M (~val)
417 || CONST_OK_FOR_N (~val)))
418 return 2;
419 else if (code == PLUS
420 && ( CONST_OK_FOR_I (-val)
421 || CONST_OK_FOR_M (-val)
422 || CONST_OK_FOR_N (-val)))
423 return 2;
424
425 return 5;
426 }
427
428 /* What does an AND instruction cost?  We compute this because immediates
429 may have been relaxed.  We want CSE to eliminate duplicated relaxed
430 immediates; otherwise we get bad code (multiple reloads of the same constant). */
431
432 static int
433 mcore_and_cost (rtx x)
434 {
435 int val;
436
437 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
438 return 2;
439
440 val = INTVAL (XEXP (x, 1));
441
442 /* Do it directly. */
443 if (CONST_OK_FOR_K (val) || CONST_OK_FOR_M (~val))
444 return 2;
445 /* Takes one instruction to load. */
446 else if (const_ok_for_mcore (val))
447 return 3;
448 /* Takes two instructions to load. */
449 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
450 return 4;
451
452 /* Takes a lrw to load. */
453 return 5;
454 }
455
456 /* What does an IOR cost?  See mcore_and_cost ().  */
457
458 static int
459 mcore_ior_cost (rtx x)
460 {
461 int val;
462
463 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
464 return 2;
465
466 val = INTVAL (XEXP (x, 1));
467
468 /* Do it directly with bseti.  */
469 if (CONST_OK_FOR_M (val))
470 return 2;
471 /* Takes one instruction to load. */
472 else if (const_ok_for_mcore (val))
473 return 3;
474 /* Takes two instructions to load. */
475 else if (TARGET_HARDLIT && mcore_const_ok_for_inline (val))
476 return 4;
477
478 /* Takes a lrw to load. */
479 return 5;
480 }
481
482 static bool
483 mcore_rtx_costs (rtx x, int code, int outer_code, int * total)
484 {
485 switch (code)
486 {
487 case CONST_INT:
488 *total = mcore_const_costs (x, outer_code);
489 return true;
490 case CONST:
491 case LABEL_REF:
492 case SYMBOL_REF:
493 *total = 5;
494 return true;
495 case CONST_DOUBLE:
496 *total = 10;
497 return true;
498
499 case AND:
500 *total = COSTS_N_INSNS (mcore_and_cost (x));
501 return true;
502
503 case IOR:
504 *total = COSTS_N_INSNS (mcore_ior_cost (x));
505 return true;
506
507 case DIV:
508 case UDIV:
509 case MOD:
510 case UMOD:
511 case FLOAT:
512 case FIX:
513 *total = COSTS_N_INSNS (100);
514 return true;
515
516 default:
517 return false;
518 }
519 }
520
521 /* Check to see if a comparison against a constant can be made more efficient
522 by incrementing/decrementing the constant to get one that is more efficient
523 to load. */
524
525 int
526 mcore_modify_comparison (enum rtx_code code)
527 {
528 rtx op1 = arch_compare_op1;
529
530 if (GET_CODE (op1) == CONST_INT)
531 {
532 int val = INTVAL (op1);
533
534 switch (code)
535 {
536 case LE:
537 if (CONST_OK_FOR_J (val + 1))
538 {
539 arch_compare_op1 = GEN_INT (val + 1);
540 return 1;
541 }
542 break;
543
544 default:
545 break;
546 }
547 }
548
549 return 0;
550 }
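
/* For example, a signed (x <= 30) test can be recast as (x < 31); the
   incremented constant 31 still fits the J immediate range of cmplti, so no
   separate constant load is needed.  */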
551
552 /* Prepare the operands for a comparison. */
553
554 rtx
555 mcore_gen_compare_reg (enum rtx_code code)
556 {
557 rtx op0 = arch_compare_op0;
558 rtx op1 = arch_compare_op1;
559 rtx cc_reg = gen_rtx_REG (CCmode, CC_REG);
560
561 if (CONSTANT_P (op1) && GET_CODE (op1) != CONST_INT)
562 op1 = force_reg (SImode, op1);
563
564 /* cmpnei: 0-31 (K immediate)
565 cmplti: 1-32 (J immediate, 0 using btsti x,31). */
566 switch (code)
567 {
568 case EQ: /* Use inverted condition, cmpne. */
569 code = NE;
570 /* Drop through. */
571
572 case NE: /* Use normal condition, cmpne. */
573 if (GET_CODE (op1) == CONST_INT && ! CONST_OK_FOR_K (INTVAL (op1)))
574 op1 = force_reg (SImode, op1);
575 break;
576
577 case LE: /* Use inverted condition, reversed cmplt. */
578 code = GT;
579 /* Drop through. */
580
581 case GT: /* Use normal condition, reversed cmplt. */
582 if (GET_CODE (op1) == CONST_INT)
583 op1 = force_reg (SImode, op1);
584 break;
585
586 case GE: /* Use inverted condition, cmplt. */
587 code = LT;
588 /* Drop through. */
589
590 case LT: /* Use normal condition, cmplt. */
591 if (GET_CODE (op1) == CONST_INT &&
592 /* covered by btsti x,31. */
593 INTVAL (op1) != 0 &&
594 ! CONST_OK_FOR_J (INTVAL (op1)))
595 op1 = force_reg (SImode, op1);
596 break;
597
598 case GTU: /* Use inverted condition, cmple. */
599 /* Unsigned > 0 is the same as != 0, but we need to invert the
600 condition, so we want to set code = EQ. This cannot be done
601 however, as the mcore does not support such a test. Instead
602 we cope with this case in the "bgtu" pattern itself so we
603 should never reach this point. */
604 gcc_assert (GET_CODE (op1) != CONST_INT || INTVAL (op1) != 0);
605 code = LEU;
606 /* Drop through. */
607
608 case LEU: /* Use normal condition, reversed cmphs. */
609 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
610 op1 = force_reg (SImode, op1);
611 break;
612
613 case LTU: /* Use inverted condition, cmphs. */
614 code = GEU;
615 /* Drop through. */
616
617 case GEU: /* Use normal condition, cmphs. */
618 if (GET_CODE (op1) == CONST_INT && INTVAL (op1) != 0)
619 op1 = force_reg (SImode, op1);
620 break;
621
622 default:
623 break;
624 }
625
626 emit_insn (gen_rtx_SET (VOIDmode, cc_reg, gen_rtx_fmt_ee (code, CCmode, op0, op1)));
627
628 return cc_reg;
629 }
630
631 int
632 mcore_symbolic_address_p (rtx x)
633 {
634 switch (GET_CODE (x))
635 {
636 case SYMBOL_REF:
637 case LABEL_REF:
638 return 1;
639 case CONST:
640 x = XEXP (x, 0);
641 return ( (GET_CODE (XEXP (x, 0)) == SYMBOL_REF
642 || GET_CODE (XEXP (x, 0)) == LABEL_REF)
643 && GET_CODE (XEXP (x, 1)) == CONST_INT);
644 default:
645 return 0;
646 }
647 }
648
649 /* Functions to output assembly code for a function call. */
650
651 char *
652 mcore_output_call (rtx operands[], int index)
653 {
654 static char buffer[20];
655 rtx addr = operands [index];
656
657 if (REG_P (addr))
658 {
659 if (TARGET_CG_DATA)
660 {
661 gcc_assert (mcore_current_function_name);
662
663 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
664 "unknown", 1);
665 }
666
667 sprintf (buffer, "jsr\t%%%d", index);
668 }
669 else
670 {
671 if (TARGET_CG_DATA)
672 {
673 gcc_assert (mcore_current_function_name);
674 gcc_assert (GET_CODE (addr) == SYMBOL_REF);
675
676 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name,
677 XSTR (addr, 0), 0);
678 }
679
680 sprintf (buffer, "jbsr\t%%%d", index);
681 }
682
683 return buffer;
684 }
685
686 /* Can we load a constant with a single instruction?  */
687
688 int
689 const_ok_for_mcore (int value)
690 {
691 if (value >= 0 && value <= 127)
692 return 1;
693
694 /* Try exact power of two. */
695 if ((value & (value - 1)) == 0)
696 return 1;
697
698 /* Try exact power of two - 1. */
699 if ((value & (value + 1)) == 0)
700 return 1;
701
702 return 0;
703 }
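
/* For example, 100 (movi), 0x1000 (a power of two, bgeni) and 0xffff (a
   power of two minus one, bmaski) can each be loaded with one instruction,
   while 0x1234 cannot.  */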
704
705 /* Can we load a constant inline with up to 2 instructions?  */
706
707 int
708 mcore_const_ok_for_inline (long value)
709 {
710 int x, y;
711
712 return try_constant_tricks (value, & x, & y) > 0;
713 }
714
715 /* Are we loading the constant using a not?  */
716
717 int
718 mcore_const_trick_uses_not (long value)
719 {
720 int x, y;
721
722 return try_constant_tricks (value, & x, & y) == 2;
723 }
724
725 /* Try tricks to load a constant inline.  Return the trick number on
726 success (0 means the constant cannot be inlined).
727
728 0: not inlinable
729 1: single instruction (do the usual thing)
730 2: single insn followed by a 'not'
731 3: single insn followed by an addi
732 4: single insn followed by a subi
733 5: single insn followed by rsubi
734 6: single insn followed by bseti
735 7: single insn followed by bclri
736 8: single insn followed by rotli
737 9: single insn followed by lsli
738 10: single insn followed by ixh
739 11: single insn followed by ixw. */
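
/* Worked examples (illustrative, assuming TARGET_HARDLIT):
     0xfffffff0  ->  trick 2:  movi rd,15   ; not rd
     1000        ->  trick 4:  bmaski rd,10 ; subi rd,23   (1023 - 23)
     0x80000001  ->  trick 3:  bgeni rd,31  ; addi rd,1  */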
740
741 static int
742 try_constant_tricks (long value, int * x, int * y)
743 {
744 int i;
745 unsigned bit, shf, rot;
746
747 if (const_ok_for_mcore (value))
748 return 1; /* Do the usual thing. */
749
750 if (TARGET_HARDLIT)
751 {
752 if (const_ok_for_mcore (~value))
753 {
754 *x = ~value;
755 return 2;
756 }
757
758 for (i = 1; i <= 32; i++)
759 {
760 if (const_ok_for_mcore (value - i))
761 {
762 *x = value - i;
763 *y = i;
764
765 return 3;
766 }
767
768 if (const_ok_for_mcore (value + i))
769 {
770 *x = value + i;
771 *y = i;
772
773 return 4;
774 }
775 }
776
777 bit = 0x80000000L;
778
779 for (i = 0; i <= 31; i++)
780 {
781 if (const_ok_for_mcore (i - value))
782 {
783 *x = i - value;
784 *y = i;
785
786 return 5;
787 }
788
789 if (const_ok_for_mcore (value & ~bit))
790 {
791 *y = bit;
792 *x = value & ~bit;
793
794 return 6;
795 }
796
797 if (const_ok_for_mcore (value | bit))
798 {
799 *y = ~bit;
800 *x = value | bit;
801
802 return 7;
803 }
804
805 bit >>= 1;
806 }
807
808 shf = value;
809 rot = value;
810
811 for (i = 1; i < 31; i++)
812 {
813 int c;
814
815 /* MCore has rotate left. */
816 c = rot << 31;
817 rot >>= 1;
818 rot &= 0x7FFFFFFF;
819 rot |= c; /* Simulate rotate. */
820
821 if (const_ok_for_mcore (rot))
822 {
823 *y = i;
824 *x = rot;
825
826 return 8;
827 }
828
829 if (shf & 1)
830 shf = 0; /* Can't use logical shift, low order bit is one. */
831
832 shf >>= 1;
833
834 if (shf != 0 && const_ok_for_mcore (shf))
835 {
836 *y = i;
837 *x = shf;
838
839 return 9;
840 }
841 }
842
843 if ((value % 3) == 0 && const_ok_for_mcore (value / 3))
844 {
845 *x = value / 3;
846
847 return 10;
848 }
849
850 if ((value % 5) == 0 && const_ok_for_mcore (value / 5))
851 {
852 *x = value / 5;
853
854 return 11;
855 }
856 }
857
858 return 0;
859 }
860
861 /* Check whether REG is dead at insn FIRST.  This is done by searching ahead
862 for either the next use (i.e., REG is live), a death note, or a set of
863 REG.  Don't just use dead_or_set_p () since reload does not always mark
864 deaths (especially if PRESERVE_DEATH_NOTES_REGNO_P is not defined).  We
865 can ignore subregs by extracting the actual register.  BRC */
866
867 int
868 mcore_is_dead (rtx first, rtx reg)
869 {
870 rtx insn;
871
872 /* For mcore, subregs can't live independently of their parent regs. */
873 if (GET_CODE (reg) == SUBREG)
874 reg = SUBREG_REG (reg);
875
876 /* Dies immediately. */
877 if (dead_or_set_p (first, reg))
878 return 1;
879
880 /* Look for conclusive evidence of live/death, otherwise we have
881 to assume that it is live. */
882 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
883 {
884 if (GET_CODE (insn) == JUMP_INSN)
885 return 0; /* We lose track, assume it is alive. */
886
887 else if (GET_CODE(insn) == CALL_INSN)
888 {
889 /* Calls might use it for the target or for register parms.  */
890 if (reg_referenced_p (reg, PATTERN (insn))
891 || find_reg_fusage (insn, USE, reg))
892 return 0;
893 else if (dead_or_set_p (insn, reg))
894 return 1;
895 }
896 else if (GET_CODE (insn) == INSN)
897 {
898 if (reg_referenced_p (reg, PATTERN (insn)))
899 return 0;
900 else if (dead_or_set_p (insn, reg))
901 return 1;
902 }
903 }
904
905 /* No conclusive evidence either way, we cannot take the chance
906 that control flow hid the use from us -- "I'm not dead yet". */
907 return 0;
908 }
909
910 /* Count the number of ones in mask. */
911
912 int
913 mcore_num_ones (int mask)
914 {
915 /* A trick to count set bits recently posted on comp.compilers. */
916 mask = (mask >> 1 & 0x55555555) + (mask & 0x55555555);
917 mask = ((mask >> 2) & 0x33333333) + (mask & 0x33333333);
918 mask = ((mask >> 4) + mask) & 0x0f0f0f0f;
919 mask = ((mask >> 8) + mask);
920
921 return (mask + (mask >> 16)) & 0xff;
922 }
923
924 /* Count the number of zeros in mask. */
925
926 int
927 mcore_num_zeros (int mask)
928 {
929 return 32 - mcore_num_ones (mask);
930 }
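
/* For example, mcore_num_ones (0xf0f0f0f0) is 16 and mcore_num_zeros (0xff)
   is 24.  A naive bit-at-a-time equivalent of the reduction above, kept here
   purely for illustration (never compiled):  */
#if 0
static int
mcore_num_ones_slow (int mask)
{
  unsigned int m = mask;
  int count = 0;

  while (m)
    {
      count += m & 1;
      m >>= 1;
    }

  return count;
}
#endif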
931
932 /* Determine byte being masked. */
933
934 int
935 mcore_byte_offset (unsigned int mask)
936 {
937 if (mask == 0x00ffffffL)
938 return 0;
939 else if (mask == 0xff00ffffL)
940 return 1;
941 else if (mask == 0xffff00ffL)
942 return 2;
943 else if (mask == 0xffffff00L)
944 return 3;
945
946 return -1;
947 }
948
949 /* Determine halfword being masked. */
950
951 int
952 mcore_halfword_offset (unsigned int mask)
953 {
954 if (mask == 0x0000ffffL)
955 return 0;
956 else if (mask == 0xffff0000L)
957 return 1;
958
959 return -1;
960 }
961
962 /* Output a series of bseti's corresponding to mask. */
963
964 const char *
965 mcore_output_bseti (rtx dst, int mask)
966 {
967 rtx out_operands[2];
968 int bit;
969
970 out_operands[0] = dst;
971
972 for (bit = 0; bit < 32; bit++)
973 {
974 if ((mask & 0x1) == 0x1)
975 {
976 out_operands[1] = GEN_INT (bit);
977
978 output_asm_insn ("bseti\t%0,%1", out_operands);
979 }
980 mask >>= 1;
981 }
982
983 return "";
984 }
985
986 /* Output a series of bclri's corresponding to mask. */
987
988 const char *
989 mcore_output_bclri (rtx dst, int mask)
990 {
991 rtx out_operands[2];
992 int bit;
993
994 out_operands[0] = dst;
995
996 for (bit = 0; bit < 32; bit++)
997 {
998 if ((mask & 0x1) == 0x0)
999 {
1000 out_operands[1] = GEN_INT (bit);
1001
1002 output_asm_insn ("bclri\t%0,%1", out_operands);
1003 }
1004
1005 mask >>= 1;
1006 }
1007
1008 return "";
1009 }
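
/* For example, mcore_output_bseti with a mask of 0x00000011 emits
   "bseti rd,0" and "bseti rd,4", while mcore_output_bclri with a mask of
   0xfffffffe emits just "bclri rd,0" (each zero bit in the mask is
   cleared).  */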
1010
1011 /* Output a conditional move of two constants that are within +/- 1 of
1012 each other.  See the "movtK" patterns in mcore.md.  I'm not sure this
1013 is really worth the effort. */
1014
1015 const char *
1016 mcore_output_cmov (rtx operands[], int cmp_t, const char * test)
1017 {
1018 int load_value;
1019 int adjust_value;
1020 rtx out_operands[4];
1021
1022 out_operands[0] = operands[0];
1023
1024 /* Check to see which constant is loadable. */
1025 if (const_ok_for_mcore (INTVAL (operands[1])))
1026 {
1027 out_operands[1] = operands[1];
1028 out_operands[2] = operands[2];
1029 }
1030 else if (const_ok_for_mcore (INTVAL (operands[2])))
1031 {
1032 out_operands[1] = operands[2];
1033 out_operands[2] = operands[1];
1034
1035 /* Complement test since constants are swapped. */
1036 cmp_t = (cmp_t == 0);
1037 }
1038 load_value = INTVAL (out_operands[1]);
1039 adjust_value = INTVAL (out_operands[2]);
1040
1041 /* First output the test if folded into the pattern. */
1042
1043 if (test)
1044 output_asm_insn (test, operands);
1045
1046 /* Load the constant - for now, only support constants that can be
1047 generated with a single instruction.  Maybe add general inlinable
1048 constants later (this would increase the number of patterns, since the
1049 instruction sequence has a different length attribute).  */
1050 if (load_value >= 0 && load_value <= 127)
1051 output_asm_insn ("movi\t%0,%1", out_operands);
1052 else if ((load_value & (load_value - 1)) == 0)
1053 output_asm_insn ("bgeni\t%0,%P1", out_operands);
1054 else if ((load_value & (load_value + 1)) == 0)
1055 output_asm_insn ("bmaski\t%0,%N1", out_operands);
1056
1057 /* Output the constant adjustment. */
1058 if (load_value > adjust_value)
1059 {
1060 if (cmp_t)
1061 output_asm_insn ("decf\t%0", out_operands);
1062 else
1063 output_asm_insn ("dect\t%0", out_operands);
1064 }
1065 else
1066 {
1067 if (cmp_t)
1068 output_asm_insn ("incf\t%0", out_operands);
1069 else
1070 output_asm_insn ("inct\t%0", out_operands);
1071 }
1072
1073 return "";
1074 }
1075
1076 /* Outputs the peephole for moving a constant that gets not'ed followed
1077 by an and (i.e. combine the not and the and into andn). BRC */
1078
1079 const char *
1080 mcore_output_andn (rtx insn ATTRIBUTE_UNUSED, rtx operands[])
1081 {
1082 int x, y;
1083 rtx out_operands[3];
1084 const char * load_op;
1085 char buf[256];
1086 int trick_no;
1087
1088 trick_no = try_constant_tricks (INTVAL (operands[1]), &x, &y);
1089 gcc_assert (trick_no == 2);
1090
1091 out_operands[0] = operands[0];
1092 out_operands[1] = GEN_INT(x);
1093 out_operands[2] = operands[2];
1094
1095 if (x >= 0 && x <= 127)
1096 load_op = "movi\t%0,%1";
1097
1098 /* Try exact power of two. */
1099 else if ((x & (x - 1)) == 0)
1100 load_op = "bgeni\t%0,%P1";
1101
1102 /* Try exact power of two - 1. */
1103 else if ((x & (x + 1)) == 0)
1104 load_op = "bmaski\t%0,%N1";
1105
1106 else
1107 load_op = "BADMOVI\t%0,%1";
1108
1109 sprintf (buf, "%s\n\tandn\t%%2,%%0", load_op);
1110 output_asm_insn (buf, out_operands);
1111
1112 return "";
1113 }
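
/* For example (assuming TARGET_HARDLIT, so trick 2 applies), an AND with the
   constant 0xffffff00 comes out as "bmaski %0,8" followed by "andn %2,%0":
   the inverted constant 0xff is loaded into the scratch operand and then
   cleared out of operand 2.  */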
1114
1115 /* Output an inline constant. */
1116
1117 static const char *
1118 output_inline_const (enum machine_mode mode, rtx operands[])
1119 {
1120 int x = 0, y = 0;
1121 int trick_no;
1122 rtx out_operands[3];
1123 char buf[256];
1124 char load_op[256];
1125 const char *dst_fmt;
1126 int value;
1127
1128 value = INTVAL (operands[1]);
1129
1130 trick_no = try_constant_tricks (value, &x, &y);
1131 /* lrw's are handled separately: Large inlinable constants never get
1132 turned into lrw's. Our caller uses try_constant_tricks to back
1133 off to an lrw rather than calling this routine. */
1134 gcc_assert (trick_no != 0);
1135
1136 if (trick_no == 1)
1137 x = value;
1138
1139 /* operands: 0 = dst, 1 = load immed., 2 = immed. adjustment. */
1140 out_operands[0] = operands[0];
1141 out_operands[1] = GEN_INT (x);
1142
1143 if (trick_no > 2)
1144 out_operands[2] = GEN_INT (y);
1145
1146 /* Select dst format based on mode. */
1147 if (mode == DImode && (! TARGET_LITTLE_END))
1148 dst_fmt = "%R0";
1149 else
1150 dst_fmt = "%0";
1151
1152 if (x >= 0 && x <= 127)
1153 sprintf (load_op, "movi\t%s,%%1", dst_fmt);
1154
1155 /* Try exact power of two. */
1156 else if ((x & (x - 1)) == 0)
1157 sprintf (load_op, "bgeni\t%s,%%P1", dst_fmt);
1158
1159 /* Try exact power of two - 1. */
1160 else if ((x & (x + 1)) == 0)
1161 sprintf (load_op, "bmaski\t%s,%%N1", dst_fmt);
1162
1163 else
1164 sprintf (load_op, "BADMOVI\t%s,%%1", dst_fmt);
1165
1166 switch (trick_no)
1167 {
1168 case 1:
1169 strcpy (buf, load_op);
1170 break;
1171 case 2: /* not */
1172 sprintf (buf, "%s\n\tnot\t%s\t// %d 0x%x", load_op, dst_fmt, value, value);
1173 break;
1174 case 3: /* add */
1175 sprintf (buf, "%s\n\taddi\t%s,%%2\t// %d 0x%x", load_op, dst_fmt, value, value);
1176 break;
1177 case 4: /* sub */
1178 sprintf (buf, "%s\n\tsubi\t%s,%%2\t// %d 0x%x", load_op, dst_fmt, value, value);
1179 break;
1180 case 5: /* rsub */
1181 /* Never happens unless -mrsubi, see try_constant_tricks(). */
1182 sprintf (buf, "%s\n\trsubi\t%s,%%2\t// %d 0x%x", load_op, dst_fmt, value, value);
1183 break;
1184 case 6: /* bset */
1185 sprintf (buf, "%s\n\tbseti\t%s,%%P2\t// %d 0x%x", load_op, dst_fmt, value, value);
1186 break;
1187 case 7: /* bclr */
1188 sprintf (buf, "%s\n\tbclri\t%s,%%Q2\t// %d 0x%x", load_op, dst_fmt, value, value);
1189 break;
1190 case 8: /* rotl */
1191 sprintf (buf, "%s\n\trotli\t%s,%%2\t// %d 0x%x", load_op, dst_fmt, value, value);
1192 break;
1193 case 9: /* lsl */
1194 sprintf (buf, "%s\n\tlsli\t%s,%%2\t// %d 0x%x", load_op, dst_fmt, value, value);
1195 break;
1196 case 10: /* ixh */
1197 sprintf (buf, "%s\n\tixh\t%s,%s\t// %d 0x%x", load_op, dst_fmt, dst_fmt, value, value);
1198 break;
1199 case 11: /* ixw */
1200 sprintf (buf, "%s\n\tixw\t%s,%s\t// %d 0x%x", load_op, dst_fmt, dst_fmt, value, value);
1201 break;
1202 default:
1203 return "";
1204 }
1205
1206 output_asm_insn (buf, out_operands);
1207
1208 return "";
1209 }
1210
1211 /* Output a move of a word or less value. */
1212
1213 const char *
1214 mcore_output_move (rtx insn ATTRIBUTE_UNUSED, rtx operands[],
1215 enum machine_mode mode ATTRIBUTE_UNUSED)
1216 {
1217 rtx dst = operands[0];
1218 rtx src = operands[1];
1219
1220 if (GET_CODE (dst) == REG)
1221 {
1222 if (GET_CODE (src) == REG)
1223 {
1224 if (REGNO (src) == CC_REG) /* r-c */
1225 return "mvc\t%0";
1226 else
1227 return "mov\t%0,%1"; /* r-r*/
1228 }
1229 else if (GET_CODE (src) == MEM)
1230 {
1231 if (GET_CODE (XEXP (src, 0)) == LABEL_REF)
1232 return "lrw\t%0,[%1]"; /* a-R */
1233 else
1234 switch (GET_MODE (src)) /* r-m */
1235 {
1236 case SImode:
1237 return "ldw\t%0,%1";
1238 case HImode:
1239 return "ld.h\t%0,%1";
1240 case QImode:
1241 return "ld.b\t%0,%1";
1242 default:
1243 gcc_unreachable ();
1244 }
1245 }
1246 else if (GET_CODE (src) == CONST_INT)
1247 {
1248 int x, y;
1249
1250 if (CONST_OK_FOR_I (INTVAL (src))) /* r-I */
1251 return "movi\t%0,%1";
1252 else if (CONST_OK_FOR_M (INTVAL (src))) /* r-M */
1253 return "bgeni\t%0,%P1\t// %1 %x1";
1254 else if (CONST_OK_FOR_N (INTVAL (src))) /* r-N */
1255 return "bmaski\t%0,%N1\t// %1 %x1";
1256 else if (try_constant_tricks (INTVAL (src), &x, &y)) /* R-P */
1257 return output_inline_const (SImode, operands); /* 1-2 insns */
1258 else
1259 return "lrw\t%0,%x1\t// %1"; /* Get it from literal pool. */
1260 }
1261 else
1262 return "lrw\t%0, %1"; /* Into the literal pool. */
1263 }
1264 else if (GET_CODE (dst) == MEM) /* m-r */
1265 switch (GET_MODE (dst))
1266 {
1267 case SImode:
1268 return "stw\t%1,%0";
1269 case HImode:
1270 return "st.h\t%1,%0";
1271 case QImode:
1272 return "st.b\t%1,%0";
1273 default:
1274 gcc_unreachable ();
1275 }
1276
1277 gcc_unreachable ();
1278 }
1279
1280 /* Return a sequence of instructions to perform DI or DF move.
1281 Since the MCORE cannot move a DI or DF in one instruction, we have
1282 to take care when we see overlapping source and dest registers. */
1283
1284 const char *
1285 mcore_output_movedouble (rtx operands[], enum machine_mode mode ATTRIBUTE_UNUSED)
1286 {
1287 rtx dst = operands[0];
1288 rtx src = operands[1];
1289
1290 if (GET_CODE (dst) == REG)
1291 {
1292 if (GET_CODE (src) == REG)
1293 {
1294 int dstreg = REGNO (dst);
1295 int srcreg = REGNO (src);
1296
1297 /* Ensure the second source is not overwritten.  */
1298 if (srcreg + 1 == dstreg)
1299 return "mov %R0,%R1\n\tmov %0,%1";
1300 else
1301 return "mov %0,%1\n\tmov %R0,%R1";
1302 }
1303 else if (GET_CODE (src) == MEM)
1304 {
1305 rtx memexp = XEXP (src, 0);
1306 int dstreg = REGNO (dst);
1307 int basereg = -1;
1308
1309 if (GET_CODE (memexp) == LABEL_REF)
1310 return "lrw\t%0,[%1]\n\tlrw\t%R0,[%R1]";
1311 else if (GET_CODE (memexp) == REG)
1312 basereg = REGNO (memexp);
1313 else if (GET_CODE (memexp) == PLUS)
1314 {
1315 if (GET_CODE (XEXP (memexp, 0)) == REG)
1316 basereg = REGNO (XEXP (memexp, 0));
1317 else if (GET_CODE (XEXP (memexp, 1)) == REG)
1318 basereg = REGNO (XEXP (memexp, 1));
1319 else
1320 gcc_unreachable ();
1321 }
1322 else
1323 gcc_unreachable ();
1324
1325 /* ??? length attribute is wrong here. */
1326 if (dstreg == basereg)
1327 {
1328 /* Just load them in reverse order. */
1329 return "ldw\t%R0,%R1\n\tldw\t%0,%1";
1330
1331 /* XXX: alternative: move basereg to basereg+1
1332 and then fall through. */
1333 }
1334 else
1335 return "ldw\t%0,%1\n\tldw\t%R0,%R1";
1336 }
1337 else if (GET_CODE (src) == CONST_INT)
1338 {
1339 if (TARGET_LITTLE_END)
1340 {
1341 if (CONST_OK_FOR_I (INTVAL (src)))
1342 output_asm_insn ("movi %0,%1", operands);
1343 else if (CONST_OK_FOR_M (INTVAL (src)))
1344 output_asm_insn ("bgeni %0,%P1", operands);
1345 else if (INTVAL (src) == -1)
1346 output_asm_insn ("bmaski %0,32", operands);
1347 else if (CONST_OK_FOR_N (INTVAL (src)))
1348 output_asm_insn ("bmaski %0,%N1", operands);
1349 else
1350 gcc_unreachable ();
1351
1352 if (INTVAL (src) < 0)
1353 return "bmaski %R0,32";
1354 else
1355 return "movi %R0,0";
1356 }
1357 else
1358 {
1359 if (CONST_OK_FOR_I (INTVAL (src)))
1360 output_asm_insn ("movi %R0,%1", operands);
1361 else if (CONST_OK_FOR_M (INTVAL (src)))
1362 output_asm_insn ("bgeni %R0,%P1", operands);
1363 else if (INTVAL (src) == -1)
1364 output_asm_insn ("bmaski %R0,32", operands);
1365 else if (CONST_OK_FOR_N (INTVAL (src)))
1366 output_asm_insn ("bmaski %R0,%N1", operands);
1367 else
1368 gcc_unreachable ();
1369
1370 if (INTVAL (src) < 0)
1371 return "bmaski %0,32";
1372 else
1373 return "movi %0,0";
1374 }
1375 }
1376 else
1377 gcc_unreachable ();
1378 }
1379 else if (GET_CODE (dst) == MEM && GET_CODE (src) == REG)
1380 return "stw\t%1,%0\n\tstw\t%R1,%R0";
1381 else
1382 gcc_unreachable ();
1383 }
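
/* For example, copying the register pair (r1,r2) into (r2,r3): the source's
   second word sits in the destination's first register, so the two moves
   are emitted in reverse order ("mov r3,r2" then "mov r2,r1") and the
   overlapping word is not clobbered.  */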
1384
1385 /* Predicates used by the templates. */
1386
1387 int
1388 mcore_arith_S_operand (rtx op)
1389 {
1390 if (GET_CODE (op) == CONST_INT && CONST_OK_FOR_M (~INTVAL (op)))
1391 return 1;
1392
1393 return 0;
1394 }
1395
1396 /* Expand insert bit field. BRC */
1397
1398 int
1399 mcore_expand_insv (rtx operands[])
1400 {
1401 int width = INTVAL (operands[1]);
1402 int posn = INTVAL (operands[2]);
1403 int mask;
1404 rtx mreg, sreg, ereg;
1405
1406 /* To get width 1 insv, the test in store_bit_field() (expmed.c, line 191)
1407 for width==1 must be removed. Look around line 368. This is something
1408 we really want the md part to do. */
1409 if (width == 1 && GET_CODE (operands[3]) == CONST_INT)
1410 {
1411 /* Do directly with bseti or bclri. */
1412 /* RBE: 2/97 consider only low bit of constant. */
1413 if ((INTVAL(operands[3])&1) == 0)
1414 {
1415 mask = ~(1 << posn);
1416 emit_insn (gen_rtx_SET (SImode, operands[0],
1417 gen_rtx_AND (SImode, operands[0], GEN_INT (mask))));
1418 }
1419 else
1420 {
1421 mask = 1 << posn;
1422 emit_insn (gen_rtx_SET (SImode, operands[0],
1423 gen_rtx_IOR (SImode, operands[0], GEN_INT (mask))));
1424 }
1425
1426 return 1;
1427 }
1428
1429 /* Look at some bit-field placements that we aren't interested
1430 in handling ourselves, unless specifically directed to do so. */
1431 if (! TARGET_W_FIELD)
1432 return 0; /* Generally, give up about now. */
1433
1434 if (width == 8 && posn % 8 == 0)
1435 /* Byte sized and aligned; let caller break it up. */
1436 return 0;
1437
1438 if (width == 16 && posn % 16 == 0)
1439 /* Short sized and aligned; let caller break it up. */
1440 return 0;
1441
1442 /* The general case - we can do this a little bit better than what the
1443 machine independent part tries. This will get rid of all the subregs
1444 that mess up constant folding in combine when working with relaxed
1445 immediates. */
1446
1447 /* If setting the entire field, do it directly. */
1448 if (GET_CODE (operands[3]) == CONST_INT &&
1449 INTVAL (operands[3]) == ((1 << width) - 1))
1450 {
1451 mreg = force_reg (SImode, GEN_INT (INTVAL (operands[3]) << posn));
1452 emit_insn (gen_rtx_SET (SImode, operands[0],
1453 gen_rtx_IOR (SImode, operands[0], mreg)));
1454 return 1;
1455 }
1456
1457 /* Generate the clear mask. */
1458 mreg = force_reg (SImode, GEN_INT (~(((1 << width) - 1) << posn)));
1459
1460 /* Clear the field, to overlay it later with the source. */
1461 emit_insn (gen_rtx_SET (SImode, operands[0],
1462 gen_rtx_AND (SImode, operands[0], mreg)));
1463
1464 /* If the source is constant 0, we've nothing to add back. */
1465 if (GET_CODE (operands[3]) == CONST_INT && INTVAL (operands[3]) == 0)
1466 return 1;
1467
1468 /* XXX: Should we worry about more games with constant values?
1469 We've covered the high profile: set/clear single-bit and many-bit
1470 fields. How often do we see "arbitrary bit pattern" constants? */
1471 sreg = copy_to_mode_reg (SImode, operands[3]);
1472
1473 /* Extract src as same width as dst (needed for signed values). We
1474 always have to do this since we widen everything to SImode.
1475 We don't have to mask if we're shifting this up against the
1476 MSB of the register (i.e., the shift will push out any hi-order
1477 bits). */
1478 if (width + posn != (int) GET_MODE_BITSIZE (SImode))
1479 {
1480 ereg = force_reg (SImode, GEN_INT ((1 << width) - 1));
1481 emit_insn (gen_rtx_SET (SImode, sreg,
1482 gen_rtx_AND (SImode, sreg, ereg)));
1483 }
1484
1485 /* Insert source value in dest. */
1486 if (posn != 0)
1487 emit_insn (gen_rtx_SET (SImode, sreg,
1488 gen_rtx_ASHIFT (SImode, sreg, GEN_INT (posn))));
1489
1490 emit_insn (gen_rtx_SET (SImode, operands[0],
1491 gen_rtx_IOR (SImode, operands[0], sreg)));
1492
1493 return 1;
1494 }
1495 \f
1496 /* ??? Block move stuff stolen from m88k. This code has not been
1497 verified for correctness. */
1498
1499 /* Emit code to perform a block move. Choose the best method.
1500
1501 OPERANDS[0] is the destination.
1502 OPERANDS[1] is the source.
1503 OPERANDS[2] is the size.
1504 OPERANDS[3] is the alignment safe to use. */
1505
1506 /* Emit code to perform a block move with an interleaved sequence of
1507 loads and stores (..., ldw 0, ldw 1, stw 0, ldw 2, stw 1, ...).  SIZE and
1508 ALIGN are known constants.  DST_MEM and SRC_MEM are the memory references
1509 to copy between; their addresses are forced into registers as needed. */
1510
1511 static const enum machine_mode mode_from_align[] =
1512 {
1513 VOIDmode, QImode, HImode, VOIDmode, SImode,
1514 };
1515
1516 static void
1517 block_move_sequence (rtx dst_mem, rtx src_mem, int size, int align)
1518 {
1519 rtx temp[2];
1520 enum machine_mode mode[2];
1521 int amount[2];
1522 bool active[2];
1523 int phase = 0;
1524 int next;
1525 int offset_ld = 0;
1526 int offset_st = 0;
1527 rtx x;
1528
1529 x = XEXP (dst_mem, 0);
1530 if (!REG_P (x))
1531 {
1532 x = force_reg (Pmode, x);
1533 dst_mem = replace_equiv_address (dst_mem, x);
1534 }
1535
1536 x = XEXP (src_mem, 0);
1537 if (!REG_P (x))
1538 {
1539 x = force_reg (Pmode, x);
1540 src_mem = replace_equiv_address (src_mem, x);
1541 }
1542
1543 active[0] = active[1] = false;
1544
1545 do
1546 {
1547 next = phase;
1548 phase ^= 1;
1549
1550 if (size > 0)
1551 {
1552 int next_amount;
1553
1554 next_amount = (size >= 4 ? 4 : (size >= 2 ? 2 : 1));
1555 next_amount = MIN (next_amount, align);
1556
1557 amount[next] = next_amount;
1558 mode[next] = mode_from_align[next_amount];
1559 temp[next] = gen_reg_rtx (mode[next]);
1560
1561 x = adjust_address (src_mem, mode[next], offset_ld);
1562 emit_insn (gen_rtx_SET (VOIDmode, temp[next], x));
1563
1564 offset_ld += next_amount;
1565 size -= next_amount;
1566 active[next] = true;
1567 }
1568
1569 if (active[phase])
1570 {
1571 active[phase] = false;
1572
1573 x = adjust_address (dst_mem, mode[phase], offset_st);
1574 emit_insn (gen_rtx_SET (VOIDmode, x, temp[phase]));
1575
1576 offset_st += amount[phase];
1577 }
1578 }
1579 while (active[next]);
1580 }
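
/* Illustrative example: a 6-byte copy with 2-byte alignment expands to the
   interleaved sequence  load 0, load 2, store 0, load 4, store 2, store 4,
   using HImode (ld.h/st.h) accesses throughout.  */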
1581
1582 bool
1583 mcore_expand_block_move (rtx *operands)
1584 {
1585 HOST_WIDE_INT align, bytes, max;
1586
1587 if (GET_CODE (operands[2]) != CONST_INT)
1588 return false;
1589
1590 bytes = INTVAL (operands[2]);
1591 align = INTVAL (operands[3]);
1592
1593 if (bytes <= 0)
1594 return false;
1595 if (align > 4)
1596 align = 4;
1597
1598 switch (align)
1599 {
1600 case 4:
1601 if (bytes & 1)
1602 max = 4*4;
1603 else if (bytes & 3)
1604 max = 8*4;
1605 else
1606 max = 16*4;
1607 break;
1608 case 2:
1609 max = 4*2;
1610 break;
1611 case 1:
1612 max = 4*1;
1613 break;
1614 default:
1615 gcc_unreachable ();
1616 }
1617
1618 if (bytes <= max)
1619 {
1620 block_move_sequence (operands[0], operands[1], bytes, align);
1621 return true;
1622 }
1623
1624 return false;
1625 }
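
/* For example, a 12-byte word-aligned copy (bytes == 12, align == 4) is
   within the 16-word limit and is expanded inline by block_move_sequence,
   whereas a 100-byte copy exceeds the limit; we return false and the caller
   falls back to the generic block-move expansion (typically a library call
   to memcpy).  */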
1626 \f
1627
1628 /* Code to generate prologue and epilogue sequences. */
1629 static int number_of_regs_before_varargs;
1630
1631 /* Set by TARGET_SETUP_INCOMING_VARARGS to indicate to prolog that this is
1632 for a varargs function. */
1633 static int current_function_anonymous_args;
1634
1635 #define STACK_BYTES (STACK_BOUNDARY/BITS_PER_UNIT)
1636 #define STORE_REACH (64) /* Maximum displace of word store + 4. */
1637 #define ADDI_REACH (32) /* Maximum addi operand. */
1638
1639 static void
1640 layout_mcore_frame (struct mcore_frame * infp)
1641 {
1642 int n;
1643 unsigned int i;
1644 int nbytes;
1645 int regarg;
1646 int localregarg;
1647 int localreg;
1648 int outbounds;
1649 unsigned int growths;
1650 int step;
1651
1652 /* Might have to spill bytes to re-assemble a big argument that
1653 was passed partially in registers and partially on the stack. */
1654 nbytes = current_function_pretend_args_size;
1655
1656 /* Determine how much space for spilled anonymous args (e.g., stdarg). */
1657 if (current_function_anonymous_args)
1658 nbytes += (NPARM_REGS - number_of_regs_before_varargs) * UNITS_PER_WORD;
1659
1660 infp->arg_size = nbytes;
1661
1662 /* How much space to save non-volatile registers we stomp. */
1663 infp->reg_mask = calc_live_regs (& n);
1664 infp->reg_size = n * 4;
1665
1666 /* And the rest of it... locals and space for overflowed outbounds. */
1667 infp->local_size = get_frame_size ();
1668 infp->outbound_size = current_function_outgoing_args_size;
1669
1670 /* Make sure we have a whole number of words for the locals. */
1671 if (infp->local_size % STACK_BYTES)
1672 infp->local_size = (infp->local_size + STACK_BYTES - 1) & ~ (STACK_BYTES -1);
1673
1674 /* Only thing we know we have to pad is the outbound space, since
1675 we've aligned our locals assuming that base of locals is aligned. */
1676 infp->pad_local = 0;
1677 infp->pad_reg = 0;
1678 infp->pad_outbound = 0;
1679 if (infp->outbound_size % STACK_BYTES)
1680 infp->pad_outbound = STACK_BYTES - (infp->outbound_size % STACK_BYTES);
1681
1682 /* Now we see how we want to stage the prologue so that it does
1683 the most appropriate stack growth and register saves to either:
1684 (1) run fast,
1685 (2) reduce instruction space, or
1686 (3) reduce stack space. */
1687 for (i = 0; i < ARRAY_SIZE (infp->growth); i++)
1688 infp->growth[i] = 0;
1689
1690 regarg = infp->reg_size + infp->arg_size;
1691 localregarg = infp->local_size + regarg;
1692 localreg = infp->local_size + infp->reg_size;
1693 outbounds = infp->outbound_size + infp->pad_outbound;
1694 growths = 0;
1695
1696 /* XXX: Consider one where we consider localregarg + outbound too! */
1697
1698 /* If the frame is <= 32 bytes and an stm would cover at most 2 registers,
1699 use stw's with offsets and buy the frame in one shot. */
1700 if (localregarg <= ADDI_REACH
1701 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1702 {
1703 /* Make sure we'll be aligned. */
1704 if (localregarg % STACK_BYTES)
1705 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1706
1707 step = localregarg + infp->pad_reg;
1708 infp->reg_offset = infp->local_size;
1709
1710 if (outbounds + step <= ADDI_REACH && !frame_pointer_needed)
1711 {
1712 step += outbounds;
1713 infp->reg_offset += outbounds;
1714 outbounds = 0;
1715 }
1716
1717 infp->arg_offset = step - 4;
1718 infp->growth[growths++] = step;
1719 infp->reg_growth = growths;
1720 infp->local_growth = growths;
1721
1722 /* If we haven't already folded it in. */
1723 if (outbounds)
1724 infp->growth[growths++] = outbounds;
1725
1726 goto finish;
1727 }
1728
1729 /* Frame can't be done with a single subi, but can be done with 2
1730 insns. If the 'stm' is getting <= 2 registers, we use stw's and
1731 shift some of the stack purchase into the first subi, so both are
1732 single instructions. */
1733 if (localregarg <= STORE_REACH
1734 && (infp->local_size > ADDI_REACH)
1735 && (infp->reg_size <= 8 || (infp->reg_mask & 0xc000) != 0xc000))
1736 {
1737 int all;
1738
1739 /* Make sure we'll be aligned; use either pad_reg or pad_local. */
1740 if (localregarg % STACK_BYTES)
1741 infp->pad_reg = STACK_BYTES - (localregarg % STACK_BYTES);
1742
1743 all = localregarg + infp->pad_reg + infp->pad_local;
1744 step = ADDI_REACH; /* As much up front as we can. */
1745 if (step > all)
1746 step = all;
1747
1748 /* XXX: Consider whether step will still be aligned; we believe so. */
1749 infp->arg_offset = step - 4;
1750 infp->growth[growths++] = step;
1751 infp->reg_growth = growths;
1752 infp->reg_offset = step - infp->pad_reg - infp->reg_size;
1753 all -= step;
1754
1755 /* Can we fold in any space required for outbounds? */
1756 if (outbounds + all <= ADDI_REACH && !frame_pointer_needed)
1757 {
1758 all += outbounds;
1759 outbounds = 0;
1760 }
1761
1762 /* Get the rest of the locals in place. */
1763 step = all;
1764 infp->growth[growths++] = step;
1765 infp->local_growth = growths;
1766 all -= step;
1767
1768 assert (all == 0);
1769
1770 /* Finish off if we need to do so. */
1771 if (outbounds)
1772 infp->growth[growths++] = outbounds;
1773
1774 goto finish;
1775 }
1776
1777 /* Registers + args is nicely aligned, so we'll buy that in one shot.
1778 Then we buy the rest of the frame in 1 or 2 steps depending on
1779 whether we need a frame pointer. */
1780 if ((regarg % STACK_BYTES) == 0)
1781 {
1782 infp->growth[growths++] = regarg;
1783 infp->reg_growth = growths;
1784 infp->arg_offset = regarg - 4;
1785 infp->reg_offset = 0;
1786
1787 if (infp->local_size % STACK_BYTES)
1788 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1789
1790 step = infp->local_size + infp->pad_local;
1791
1792 if (!frame_pointer_needed)
1793 {
1794 step += outbounds;
1795 outbounds = 0;
1796 }
1797
1798 infp->growth[growths++] = step;
1799 infp->local_growth = growths;
1800
1801 /* If there's any left to be done. */
1802 if (outbounds)
1803 infp->growth[growths++] = outbounds;
1804
1805 goto finish;
1806 }
1807
1808 /* XXX: optimizations that we'll want to play with....
1809 -- regarg is not aligned, but it's a small number of registers;
1810 use some of localsize so that regarg is aligned and then
1811 save the registers. */
1812
1813 /* Simple encoding; plods down the stack buying the pieces as it goes.
1814 -- does not optimize space consumption.
1815 -- does not attempt to optimize instruction counts.
1816 -- but it is safe for all alignments. */
1817 if (regarg % STACK_BYTES != 0)
1818 infp->pad_reg = STACK_BYTES - (regarg % STACK_BYTES);
1819
1820 infp->growth[growths++] = infp->arg_size + infp->reg_size + infp->pad_reg;
1821 infp->reg_growth = growths;
1822 infp->arg_offset = infp->growth[0] - 4;
1823 infp->reg_offset = 0;
1824
1825 if (frame_pointer_needed)
1826 {
1827 if (infp->local_size % STACK_BYTES != 0)
1828 infp->pad_local = STACK_BYTES - (infp->local_size % STACK_BYTES);
1829
1830 infp->growth[growths++] = infp->local_size + infp->pad_local;
1831 infp->local_growth = growths;
1832
1833 infp->growth[growths++] = outbounds;
1834 }
1835 else
1836 {
1837 if ((infp->local_size + outbounds) % STACK_BYTES != 0)
1838 infp->pad_local = STACK_BYTES - ((infp->local_size + outbounds) % STACK_BYTES);
1839
1840 infp->growth[growths++] = infp->local_size + infp->pad_local + outbounds;
1841 infp->local_growth = growths;
1842 }
1843
1844 /* Anything else that we've forgotten?  Plus a few consistency checks. */
1845 finish:
1846 assert (infp->reg_offset >= 0);
1847 assert (growths <= MAX_STACK_GROWS);
1848
1849 for (i = 0; i < growths; i++)
1850 gcc_assert (!(infp->growth[i] % STACK_BYTES));
1851 }
1852
1853 /* Define the offset between two registers, one to be eliminated, and
1854 the other its replacement, at the start of a routine. */
1855
1856 int
1857 mcore_initial_elimination_offset (int from, int to)
1858 {
1859 int above_frame;
1860 int below_frame;
1861 struct mcore_frame fi;
1862
1863 layout_mcore_frame (& fi);
1864
1865 /* fp to ap */
1866 above_frame = fi.local_size + fi.pad_local + fi.reg_size + fi.pad_reg;
1867 /* sp to fp */
1868 below_frame = fi.outbound_size + fi.pad_outbound;
1869
1870 if (from == ARG_POINTER_REGNUM && to == FRAME_POINTER_REGNUM)
1871 return above_frame;
1872
1873 if (from == ARG_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1874 return above_frame + below_frame;
1875
1876 if (from == FRAME_POINTER_REGNUM && to == STACK_POINTER_REGNUM)
1877 return below_frame;
1878
1879 gcc_unreachable ();
1880 }
1881
1882 /* Keep track of some information about varargs for the prolog. */
1883
1884 static void
1885 mcore_setup_incoming_varargs (CUMULATIVE_ARGS *args_so_far,
1886 enum machine_mode mode, tree type,
1887 int * ptr_pretend_size ATTRIBUTE_UNUSED,
1888 int second_time ATTRIBUTE_UNUSED)
1889 {
1890 current_function_anonymous_args = 1;
1891
1892 /* We need to know how many argument registers are used before
1893 the varargs start, so that we can push the remaining argument
1894 registers during the prologue. */
1895 number_of_regs_before_varargs = *args_so_far + mcore_num_arg_regs (mode, type);
1896
1897 /* There is a bug somewhere in the arg handling code.
1898 Until I can find it this workaround always pushes the
1899 last named argument onto the stack. */
1900 number_of_regs_before_varargs = *args_so_far;
1901
1902 /* The last named argument may be split between argument registers
1903 and the stack. Allow for this here. */
1904 if (number_of_regs_before_varargs > NPARM_REGS)
1905 number_of_regs_before_varargs = NPARM_REGS;
1906 }
1907
1908 void
1909 mcore_expand_prolog (void)
1910 {
1911 struct mcore_frame fi;
1912 int space_allocated = 0;
1913 int growth = 0;
1914
1915 /* Find out what we're doing. */
1916 layout_mcore_frame (&fi);
1917
1918 space_allocated = fi.arg_size + fi.reg_size + fi.local_size +
1919 fi.outbound_size + fi.pad_outbound + fi.pad_local + fi.pad_reg;
1920
1921 if (TARGET_CG_DATA)
1922 {
1923 /* Emit a symbol for this routine's frame size. */
1924 rtx x;
1925
1926 x = DECL_RTL (current_function_decl);
1927
1928 gcc_assert (GET_CODE (x) == MEM);
1929
1930 x = XEXP (x, 0);
1931
1932 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1933
1934 if (mcore_current_function_name)
1935 free (mcore_current_function_name);
1936
1937 mcore_current_function_name = xstrdup (XSTR (x, 0));
1938
1939 ASM_OUTPUT_CG_NODE (asm_out_file, mcore_current_function_name, space_allocated);
1940
1941 if (current_function_calls_alloca)
1942 ASM_OUTPUT_CG_EDGE (asm_out_file, mcore_current_function_name, "alloca", 1);
1943
1944 /* 970425: RBE:
1945 We're looking at how the 8-byte alignment affects stack layout
1946 and where we had to pad things. This emits information we can
1947 extract which tells us about frame sizes and the like. */
1948 fprintf (asm_out_file,
1949 "\t.equ\t__$frame$info$_%s_$_%d_%d_x%x_%d_%d_%d,0\n",
1950 mcore_current_function_name,
1951 fi.arg_size, fi.reg_size, fi.reg_mask,
1952 fi.local_size, fi.outbound_size,
1953 frame_pointer_needed);
1954 }
1955
1956 if (mcore_naked_function_p ())
1957 return;
1958
1959 /* Handle stdarg+regsaves in one shot: can't be more than 64 bytes. */
1960 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
1961
1962 /* If we have a parameter passed partially in regs and partially in memory,
1963 the registers will have been stored to memory already in function.c. So
1964 we only need to do something here for varargs functions. */
1965 if (fi.arg_size != 0 && current_function_pretend_args_size == 0)
1966 {
1967 int offset;
1968 int rn = FIRST_PARM_REG + NPARM_REGS - 1;
1969 int remaining = fi.arg_size;
1970
1971 for (offset = fi.arg_offset; remaining >= 4; offset -= 4, rn--, remaining -= 4)
1972 {
1973 emit_insn (gen_movsi
1974 (gen_rtx_MEM (SImode,
1975 plus_constant (stack_pointer_rtx, offset)),
1976 gen_rtx_REG (SImode, rn)));
1977 }
1978 }
1979
1980 /* Do we need another stack adjustment before we do the register saves? */
1981 if (growth < fi.reg_growth)
1982 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
1983
1984 if (fi.reg_size != 0)
1985 {
1986 int i;
1987 int offs = fi.reg_offset;
1988
1989 for (i = 15; i >= 0; i--)
1990 {
1991 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
1992 {
1993 int first_reg = 15;
1994
1995 while (fi.reg_mask & (1 << first_reg))
1996 first_reg--;
1997 first_reg++;
1998
1999 emit_insn (gen_store_multiple (gen_rtx_MEM (SImode, stack_pointer_rtx),
2000 gen_rtx_REG (SImode, first_reg),
2001 GEN_INT (16 - first_reg)));
2002
2003 i -= (15 - first_reg);
2004 offs += (16 - first_reg) * 4;
2005 }
2006 else if (fi.reg_mask & (1 << i))
2007 {
2008 emit_insn (gen_movsi
2009 (gen_rtx_MEM (SImode,
2010 plus_constant (stack_pointer_rtx, offs)),
2011 gen_rtx_REG (SImode, i)));
2012 offs += 4;
2013 }
2014 }
2015 }
2016
2017 /* Figure the locals + outbounds. */
2018 if (frame_pointer_needed)
2019 {
2020 /* If we haven't already purchased to 'fp'. */
2021 if (growth < fi.local_growth)
2022 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2023
2024 emit_insn (gen_movsi (frame_pointer_rtx, stack_pointer_rtx));
2025
2026 /* ... and then go any remaining distance for outbounds, etc. */
2027 if (fi.growth[growth])
2028 output_stack_adjust (-1, fi.growth[growth++]);
2029 }
2030 else
2031 {
2032 if (growth < fi.local_growth)
2033 output_stack_adjust (-1, fi.growth[growth++]); /* Grows it. */
2034 if (fi.growth[growth])
2035 output_stack_adjust (-1, fi.growth[growth++]);
2036 }
2037 }
2038
2039 void
2040 mcore_expand_epilog (void)
2041 {
2042 struct mcore_frame fi;
2043 int i;
2044 int offs;
2045 int growth = MAX_STACK_GROWS - 1;
2046
2047
2048 /* Find out what we're doing. */
2049 layout_mcore_frame(&fi);
2050
2051 if (mcore_naked_function_p ())
2052 return;
2053
2054 /* If we had a frame pointer, restore the sp from that. */
2055 if (frame_pointer_needed)
2056 {
2057 emit_insn (gen_movsi (stack_pointer_rtx, frame_pointer_rtx));
2058 growth = fi.local_growth - 1;
2059 }
2060 else
2061 {
2062 /* XXX: The while loop should accumulate the total and make a single adjustment. */
2063 while (growth >= fi.local_growth)
2064 {
2065 if (fi.growth[growth] != 0)
2066 output_stack_adjust (1, fi.growth[growth]);
2067 growth--;
2068 }
2069 }
2070
2071 /* Make sure we've shrunk the stack back to the point where the registers
2072 were laid down. This is typically 0/1 iterations. Then pull the
2073 register save information back off the stack. */
2074 while (growth >= fi.reg_growth)
2075 output_stack_adjust ( 1, fi.growth[growth--]);
2076
2077 offs = fi.reg_offset;
2078
2079 for (i = 15; i >= 0; i--)
2080 {
2081 if (offs == 0 && i == 15 && ((fi.reg_mask & 0xc000) == 0xc000))
2082 {
2083 int first_reg;
2084
2085 /* Find the starting register. */
2086 first_reg = 15;
2087
2088 while (fi.reg_mask & (1 << first_reg))
2089 first_reg--;
2090
2091 first_reg++;
2092
2093 emit_insn (gen_load_multiple (gen_rtx_REG (SImode, first_reg),
2094 gen_rtx_MEM (SImode, stack_pointer_rtx),
2095 GEN_INT (16 - first_reg)));
2096
2097 i -= (15 - first_reg);
2098 offs += (16 - first_reg) * 4;
2099 }
2100 else if (fi.reg_mask & (1 << i))
2101 {
2102 emit_insn (gen_movsi
2103 (gen_rtx_REG (SImode, i),
2104 gen_rtx_MEM (SImode,
2105 plus_constant (stack_pointer_rtx, offs))));
2106 offs += 4;
2107 }
2108 }
2109
2110 /* Give back anything else. */
2111 /* XXX: Should accumulate total and then give it back. */
2112 while (growth >= 0)
2113 output_stack_adjust ( 1, fi.growth[growth--]);
2114 }
2115 \f
2116 /* This code is borrowed from the SH port. */
2117
2118 /* The MCORE cannot load a large constant into a register, constants have to
2119 come from a pc relative load. The reference of a pc relative load
2120 instruction must be less than 1k in front of the instruction. This
2121 means that we often have to dump a constant inside a function, and
2122 generate code to branch around it.
2123
2124 It is important to minimize this, since the branches will slow things
2125 down and make things bigger.
2126
2127 Worst case code looks like:
2128
2129 lrw L1,r0
2130 br L2
2131 align
2132 L1: .long value
2133 L2:
2134 ..
2135
2136 lrw L3,r0
2137 br L4
2138 align
2139 L3: .long value
2140 L4:
2141 ..
2142
2143 We fix this by performing a scan before scheduling, which notices which
2144 instructions need to have their operands fetched from the constant table
2145 and builds the table.
2146
2147 The algorithm is:
2148
2149 scan, find an instruction which needs a pcrel move. Look forward, find the
2150 last barrier which is within MAX_COUNT bytes of the requirement.
2151 If there isn't one, make one. Process all the instructions between
2152 the find and the barrier.
2153
2154 In the above example, we can tell that L3 is within 1k of L1, so
2155 the first move can be shrunk from the 2 insn+constant sequence into
2156 just 1 insn, and the constant moved to L3 to make:
2157
2158 lrw L1,r0
2159 ..
2160 lrw L3,r0
2161 br L4
2162 align
2163 L3:.long value
2164 L4:.long value
2165
2166 Then the second move becomes the target for the shortening process. */
2167
2168 typedef struct
2169 {
2170 rtx value; /* Value in table. */
2171 rtx label; /* Label of value. */
2172 } pool_node;
2173
2174 /* The maximum number of constants that can fit into one pool, since
2175 the pc relative range is 0...1020 bytes and constants are at least 4
2176 bytes long. We subtract 4 from the range to allow for the case where
2177 we need to add a branch/align before the constant pool. */
2178
2179 #define MAX_COUNT 1016
2180 #define MAX_POOL_SIZE (MAX_COUNT/4)
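/* That is: 1020 bytes of pc-relative range, minus 4 bytes reserved for the
   branch/align that may precede the pool, gives MAX_COUNT == 1016; at four
   bytes per entry that allows at most 1016 / 4 == 254 pool entries.  */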
2181 static pool_node pool_vector[MAX_POOL_SIZE];
2182 static int pool_size;
2183
2184 /* Dump out any constants accumulated in the final pass. These
2185 will only be labels. */
2186
2187 const char *
2188 mcore_output_jump_label_table (void)
2189 {
2190 int i;
2191
2192 if (pool_size)
2193 {
2194 fprintf (asm_out_file, "\t.align 2\n");
2195
2196 for (i = 0; i < pool_size; i++)
2197 {
2198 pool_node * p = pool_vector + i;
2199
2200 (*targetm.asm_out.internal_label) (asm_out_file, "L", CODE_LABEL_NUMBER (p->label));
2201
2202 output_asm_insn (".long %0", &p->value);
2203 }
2204
2205 pool_size = 0;
2206 }
2207
2208 return "";
2209 }
2210
2211 /* Check whether insn is a candidate for a conditional. */
2212
2213 static cond_type
2214 is_cond_candidate (rtx insn)
2215 {
2216 /* The only things we conditionalize are those that can be directly
2217 changed into a conditional. Only bother with SImode items. If
2218 we wanted to be a little more aggressive, we could also do other
2219 modes such as DImode with reg-reg move or load 0. */
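      /* The candidates recognized here are: SImode register-to-register
         moves, loads of constant zero, adds of +1/-1, subtracts of 1, and
         simple unconditional jumps.  emit_new_cond_insn () below rewrites
         them into their conditional forms (e.g. movt/movf, inct/incf,
         dect/decf, bt/bf).  */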
2220 if (GET_CODE (insn) == INSN)
2221 {
2222 rtx pat = PATTERN (insn);
2223 rtx src, dst;
2224
2225 if (GET_CODE (pat) != SET)
2226 return COND_NO;
2227
2228 dst = XEXP (pat, 0);
2229
2230 if ((GET_CODE (dst) != REG &&
2231 GET_CODE (dst) != SUBREG) ||
2232 GET_MODE (dst) != SImode)
2233 return COND_NO;
2234
2235 src = XEXP (pat, 1);
2236
2237 if ((GET_CODE (src) == REG ||
2238 (GET_CODE (src) == SUBREG &&
2239 GET_CODE (SUBREG_REG (src)) == REG)) &&
2240 GET_MODE (src) == SImode)
2241 return COND_MOV_INSN;
2242 else if (GET_CODE (src) == CONST_INT &&
2243 INTVAL (src) == 0)
2244 return COND_CLR_INSN;
2245 else if (GET_CODE (src) == PLUS &&
2246 (GET_CODE (XEXP (src, 0)) == REG ||
2247 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2248 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2249 GET_MODE (XEXP (src, 0)) == SImode &&
2250 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2251 INTVAL (XEXP (src, 1)) == 1)
2252 return COND_INC_INSN;
2253 else if (((GET_CODE (src) == MINUS &&
2254 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2255 INTVAL (XEXP (src, 1)) == 1) ||
2256 (GET_CODE (src) == PLUS &&
2257 GET_CODE (XEXP (src, 1)) == CONST_INT &&
2258 INTVAL (XEXP (src, 1)) == -1)) &&
2259 (GET_CODE (XEXP (src, 0)) == REG ||
2260 (GET_CODE (XEXP (src, 0)) == SUBREG &&
2261 GET_CODE (SUBREG_REG (XEXP (src, 0))) == REG)) &&
2262 GET_MODE (XEXP (src, 0)) == SImode)
2263 return COND_DEC_INSN;
2264
2265 /* Some insns that we don't bother with:
2266 (set (rx:DI) (ry:DI))
2267 (set (rx:DI) (const_int 0))
2268 */
2269
2270 }
2271 else if (GET_CODE (insn) == JUMP_INSN &&
2272 GET_CODE (PATTERN (insn)) == SET &&
2273 GET_CODE (XEXP (PATTERN (insn), 1)) == LABEL_REF)
2274 return COND_BRANCH_INSN;
2275
2276 return COND_NO;
2277 }
2278
2279 /* Emit a conditional version of insn and replace the old insn with the
2280 new one. Return the new insn if emitted. */
2281
2282 static rtx
2283 emit_new_cond_insn (rtx insn, int cond)
2284 {
2285 rtx c_insn = 0;
2286 rtx pat, dst, src;
2287 cond_type num;
2288
2289 if ((num = is_cond_candidate (insn)) == COND_NO)
2290 return NULL;
2291
2292 pat = PATTERN (insn);
2293
2294 if (GET_CODE (insn) == INSN)
2295 {
2296 dst = SET_DEST (pat);
2297 src = SET_SRC (pat);
2298 }
2299 else
2300 {
2301 dst = JUMP_LABEL (insn);
2302 src = NULL_RTX;
2303 }
2304
2305 switch (num)
2306 {
2307 case COND_MOV_INSN:
2308 case COND_CLR_INSN:
2309 if (cond)
2310 c_insn = gen_movt0 (dst, src, dst);
2311 else
2312 c_insn = gen_movt0 (dst, dst, src);
2313 break;
2314
2315 case COND_INC_INSN:
2316 if (cond)
2317 c_insn = gen_incscc (dst, dst);
2318 else
2319 c_insn = gen_incscc_false (dst, dst);
2320 break;
2321
2322 case COND_DEC_INSN:
2323 if (cond)
2324 c_insn = gen_decscc (dst, dst);
2325 else
2326 c_insn = gen_decscc_false (dst, dst);
2327 break;
2328
2329 case COND_BRANCH_INSN:
2330 if (cond)
2331 c_insn = gen_branch_true (dst);
2332 else
2333 c_insn = gen_branch_false (dst);
2334 break;
2335
2336 default:
2337 return NULL;
2338 }
2339
2340 /* Only copy the notes if they exist. */
2341 if (rtx_length [GET_CODE (c_insn)] >= 7 && rtx_length [GET_CODE (insn)] >= 7)
2342 {
2343 /* We really don't need to bother with the notes and links at this
2344 point, but go ahead and save the notes. This will help is_dead()
2345 when applying peepholes (links don't matter since they are not
2346 used any more beyond this point for the mcore). */
2347 REG_NOTES (c_insn) = REG_NOTES (insn);
2348 }
2349
2350 if (num == COND_BRANCH_INSN)
2351 {
2352 /* For jumps, we need to be a little bit careful and emit the new jump
2353 before the old one and to update the use count for the target label.
2354 This way, the barrier following the old (uncond) jump will get
2355 deleted, but the label won't. */
2356 c_insn = emit_jump_insn_before (c_insn, insn);
2357
2358 ++ LABEL_NUSES (dst);
2359
2360 JUMP_LABEL (c_insn) = dst;
2361 }
2362 else
2363 c_insn = emit_insn_after (c_insn, insn);
2364
2365 delete_insn (insn);
2366
2367 return c_insn;
2368 }
2369
2370 /* Attempt to change a basic block into a series of conditional insns. This
2371 works by taking the branch at the end of the 1st block and scanning for the
2372 end of the 2nd block. If all instructions in the 2nd block have cond.
2373 versions and the label at the start of block 3 is the same as the target
2374 from the branch at block 1, then conditionalize all insns in block 2 using
2375 the inverse condition of the branch at block 1. (Note I'm bending the
2376 definition of basic block here.)
2377
2378 e.g., change:
2379
2380 bt L2 <-- end of block 1 (delete)
2381 mov r7,r8
2382 addu r7,1
2383 br L3 <-- end of block 2
2384
2385 L2: ... <-- start of block 3 (NUSES==1)
2386 L3: ...
2387
2388 to:
2389
2390 movf r7,r8
2391 incf r7
2392 bf L3
2393
2394 L3: ...
2395
2396 we can delete the L2 label if NUSES==1 and re-apply the optimization
2397 starting at the last instruction of block 2. This may allow an entire
2398 if-then-else statement to be conditionalized. BRC */
2399 static rtx
2400 conditionalize_block (rtx first)
2401 {
2402 rtx insn;
2403 rtx br_pat;
2404 rtx end_blk_1_br = 0;
2405 rtx end_blk_2_insn = 0;
2406 rtx start_blk_3_lab = 0;
2407 int cond;
2408 int br_lab_num;
2409 int blk_size = 0;
2410
2411
2412 /* Check that the first insn is a candidate conditional jump. This is
2413 the one that we'll eliminate. If not, advance to the next insn to
2414 try. */
2415 if (GET_CODE (first) != JUMP_INSN ||
2416 GET_CODE (PATTERN (first)) != SET ||
2417 GET_CODE (XEXP (PATTERN (first), 1)) != IF_THEN_ELSE)
2418 return NEXT_INSN (first);
2419
2420 /* Extract some information we need. */
2421 end_blk_1_br = first;
2422 br_pat = PATTERN (end_blk_1_br);
2423
2424 /* Complement the condition since we use the reverse cond. for the insns. */
2425 cond = (GET_CODE (XEXP (XEXP (br_pat, 1), 0)) == EQ);
2426
2427 /* Determine what kind of branch we have. */
2428 if (GET_CODE (XEXP (XEXP (br_pat, 1), 1)) == LABEL_REF)
2429 {
2430 /* A normal branch, so extract label out of first arm. */
2431 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 1), 0));
2432 }
2433 else
2434 {
2435 /* An inverse branch, so extract the label out of the 2nd arm
2436 and complement the condition. */
2437 cond = (cond == 0);
2438 br_lab_num = CODE_LABEL_NUMBER (XEXP (XEXP (XEXP (br_pat, 1), 2), 0));
2439 }
2440
2441 /* Scan forward for the start of block 2: it must start with a
2442 label and that label must be the same as the branch target
2443 label from block 1. We don't care about whether block 2 actually
2444 ends with a branch or a label (an uncond. branch is
2445 conditionalizable). */
2446 for (insn = NEXT_INSN (first); insn; insn = NEXT_INSN (insn))
2447 {
2448 enum rtx_code code;
2449
2450 code = GET_CODE (insn);
2451
2452 /* Look for the label at the start of block 3. */
2453 if (code == CODE_LABEL && CODE_LABEL_NUMBER (insn) == br_lab_num)
2454 break;
2455
2456 /* Skip barriers, notes, and conditionalizable insns. If the
2457 insn is not conditionalizable or makes this optimization fail,
2458 just return the next insn so we can start over from that point. */
2459 if (code != BARRIER && code != NOTE && !is_cond_candidate (insn))
2460 return NEXT_INSN (insn);
2461
2462 /* Remember the last real insn before the label (i.e. end of block 2). */
2463 if (code == JUMP_INSN || code == INSN)
2464 {
2465 blk_size ++;
2466 end_blk_2_insn = insn;
2467 }
2468 }
2469
2470 if (!insn)
2471 return insn;
2472
2473 /* It is possible for this optimization to slow performance if the blocks
2474 are long. This really depends upon whether the branch is likely taken
2475 or not. If the branch is taken, we slow performance in many cases. But,
2476 if the branch is not taken, we always help performance for a single
2477 block; for a double block (i.e. when the optimization is re-applied)
2478 this is not necessarily true, since the 'right thing' depends on the
2479 overall length of the collapsed block.  As a compromise, don't apply
2480 this optimization on blocks larger than size 2 (unlikely for the mcore)
2481 when speed is important.  The best threshold depends on the latencies
2482 of the instructions (i.e., the branch penalty). */
2483 if (optimize > 1 && blk_size > 2)
2484 return insn;
2485
2486 /* At this point, we've found the start of block 3 and we know that
2487 it is the destination of the branch from block 1. Also, all
2488 instructions in the block 2 are conditionalizable. So, apply the
2489 conditionalization and delete the branch. */
2490 start_blk_3_lab = insn;
2491
2492 for (insn = NEXT_INSN (end_blk_1_br); insn != start_blk_3_lab;
2493 insn = NEXT_INSN (insn))
2494 {
2495 rtx newinsn;
2496
2497 if (INSN_DELETED_P (insn))
2498 continue;
2499
2500 /* Try to form a conditional variant of the instruction and emit it. */
2501 if ((newinsn = emit_new_cond_insn (insn, cond)))
2502 {
2503 if (end_blk_2_insn == insn)
2504 end_blk_2_insn = newinsn;
2505
2506 insn = newinsn;
2507 }
2508 }
2509
2510 /* Note whether we will delete the label starting blk 3 when the jump
2511 gets deleted. If so, we want to re-apply this optimization at the
2512 last real instruction right before the label. */
2513 if (LABEL_NUSES (start_blk_3_lab) == 1)
2514 {
2515 start_blk_3_lab = 0;
2516 }
2517
2518 /* ??? We probably should redistribute the death notes for this insn, esp.
2519 the death of cc, but it doesn't really matter this late in the game.
2520 The peepholes all use is_dead() which will find the correct death
2521 regardless of whether there is a note. */
2522 delete_insn (end_blk_1_br);
2523
2524 if (! start_blk_3_lab)
2525 return end_blk_2_insn;
2526
2527 /* Return the insn right after the label at the start of block 3. */
2528 return NEXT_INSN (start_blk_3_lab);
2529 }
2530
2531 /* Apply the conditionalization of blocks optimization. This is the
2532 outer loop that traverses through the insns scanning for a branch
2533 that signifies an opportunity to apply the optimization. Note that
2534 this optimization is applied late. If we could apply it earlier,
2535 say before cse 2, it may expose more optimization opportunities.
2536 But the payback probably isn't really worth the effort (we'd have
2537 to update all reg/flow/notes/links/etc to make it work - and stick it
2538 in before cse 2). */
2539
2540 static void
2541 conditionalize_optimization (void)
2542 {
2543 rtx insn;
2544
2545 for (insn = get_insns (); insn; insn = conditionalize_block (insn))
2546 continue;
2547 }
2548
2549 static int saved_warn_return_type = -1;
2550 static int saved_warn_return_type_count = 0;
2551
2552 /* This is to handle loads from the constant pool. */
2553
2554 static void
2555 mcore_reorg (void)
2556 {
2557 /* Reset this variable. */
2558 current_function_anonymous_args = 0;
2559
2560 /* Restore the warn_return_type if it has been altered. */
2561 if (saved_warn_return_type != -1)
2562 {
2563 /* Only restore the value if we have reached another function.
2564 The test of warn_return_type occurs in finish_function () in
2565 c-decl.c a long time after the code for the function is generated,
2566 so we need a counter to tell us when we have finished parsing that
2567 function and can restore the flag. */
2568 if (--saved_warn_return_type_count == 0)
2569 {
2570 warn_return_type = saved_warn_return_type;
2571 saved_warn_return_type = -1;
2572 }
2573 }
2574
2575 if (optimize == 0)
2576 return;
2577
2578 /* Conditionalize blocks where we can. */
2579 conditionalize_optimization ();
2580
2581 /* Literal pool generation is now pushed off until the assembler. */
2582 }
2583
2584 \f
2585 /* Return true if X is something that can be moved directly into r15. */
2586
2587 bool
2588 mcore_r15_operand_p (rtx x)
2589 {
2590 switch (GET_CODE (x))
2591 {
2592 case CONST_INT:
2593 return mcore_const_ok_for_inline (INTVAL (x));
2594
2595 case REG:
2596 case SUBREG:
2597 case MEM:
2598 return 1;
2599
2600 default:
2601 return 0;
2602 }
2603 }
2604
2605 /* Implement SECONDARY_RELOAD_CLASS. If CLASS contains r15, and we can't
2606 directly move X into it, use r1-r14 as a temporary. */
2607
2608 enum reg_class
2609 mcore_secondary_reload_class (enum reg_class class,
2610 enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
2611 {
2612 if (TEST_HARD_REG_BIT (reg_class_contents[class], 15)
2613 && !mcore_r15_operand_p (x))
2614 return LRW_REGS;
2615 return NO_REGS;
2616 }
2617
2618 /* Return the reg_class to use when reloading the rtx X into the class
2619 CLASS. If X is too complex to move directly into r15, prefer to
2620 use LRW_REGS instead. */
2621
2622 enum reg_class
2623 mcore_reload_class (rtx x, enum reg_class class)
2624 {
2625 if (reg_class_subset_p (LRW_REGS, class) && !mcore_r15_operand_p (x))
2626 return LRW_REGS;
2627
2628 return class;
2629 }
2630
2631 /* Tell me if a pair of reg/subreg rtx's actually refer to the same
2632 register. Note that the current version doesn't worry about whether
2633 they are the same mode or not (e.g., a QImode in r2 matches an HImode
2634 in r2, which matches an SImode in r2). We might think in the future about
2635 whether we want to be able to say something about modes. */
2636
2637 int
2638 mcore_is_same_reg (rtx x, rtx y)
2639 {
2640 /* Strip any and all of the subreg wrappers. */
2641 while (GET_CODE (x) == SUBREG)
2642 x = SUBREG_REG (x);
2643
2644 while (GET_CODE (y) == SUBREG)
2645 y = SUBREG_REG (y);
2646
2647 if (GET_CODE (x) == REG && GET_CODE (y) == REG && REGNO (x) == REGNO (y))
2648 return 1;
2649
2650 return 0;
2651 }
2652
2653 void
2654 mcore_override_options (void)
2655 {
2656 /* Only the m340 supports little endian code. */
2657 if (TARGET_LITTLE_END && ! TARGET_M340)
2658 target_flags |= MASK_M340;
2659 }
2660 \f
2661 /* Compute the number of word sized registers needed to
2662 hold a function argument of mode MODE and type TYPE. */
2663
2664 int
2665 mcore_num_arg_regs (enum machine_mode mode, tree type)
2666 {
2667 int size;
2668
2669 if (targetm.calls.must_pass_in_stack (mode, type))
2670 return 0;
2671
2672 if (type && mode == BLKmode)
2673 size = int_size_in_bytes (type);
2674 else
2675 size = GET_MODE_SIZE (mode);
2676
2677 return ROUND_ADVANCE (size);
2678 }
2679
2680 static rtx
2681 handle_structs_in_regs (enum machine_mode mode, tree type, int reg)
2682 {
2683 int size;
2684
2685 /* The MCore ABI defines that a structure whose size is not a whole multiple
2686 of words is passed packed into registers (or spilled onto the stack if
2687 not enough registers are available) with the last few bytes of the
2688 structure being packed, left-justified, into the last register/stack slot.
2689 GCC handles this correctly if the last word is in a stack slot, but we
2690 have to generate a special, PARALLEL RTX if the last word is in an
2691 argument register. */
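  /* For example (hypothetical sizes): a 10 byte structure starting in the
     first argument register occupies three registers; the PARALLEL built
     below pairs each register with its byte offset (0, 4, 8), and the final
     two bytes are packed, left-justified, into the third register.  */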
2692 if (type
2693 && TYPE_MODE (type) == BLKmode
2694 && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST
2695 && (size = int_size_in_bytes (type)) > UNITS_PER_WORD
2696 && (size % UNITS_PER_WORD != 0)
2697 && (reg + mcore_num_arg_regs (mode, type) <= (FIRST_PARM_REG + NPARM_REGS)))
2698 {
2699 rtx arg_regs [NPARM_REGS];
2700 int nregs;
2701 rtx result;
2702 rtvec rtvec;
2703
2704 for (nregs = 0; size > 0; size -= UNITS_PER_WORD)
2705 {
2706 arg_regs [nregs] =
2707 gen_rtx_EXPR_LIST (SImode, gen_rtx_REG (SImode, reg ++),
2708 GEN_INT (nregs * UNITS_PER_WORD));
2709 nregs ++;
2710 }
2711
2712 /* We assume here that NPARM_REGS == 6. The assert checks this. */
2713 assert (ARRAY_SIZE (arg_regs) == 6);
2714 rtvec = gen_rtvec (nregs, arg_regs[0], arg_regs[1], arg_regs[2],
2715 arg_regs[3], arg_regs[4], arg_regs[5]);
2716
2717 result = gen_rtx_PARALLEL (mode, rtvec);
2718 return result;
2719 }
2720
2721 return gen_rtx_REG (mode, reg);
2722 }
2723
2724 rtx
2725 mcore_function_value (tree valtype, tree func ATTRIBUTE_UNUSED)
2726 {
2727 enum machine_mode mode;
2728 int unsigned_p;
2729
2730 mode = TYPE_MODE (valtype);
2731
2732 PROMOTE_MODE (mode, unsigned_p, NULL);
2733
2734 return handle_structs_in_regs (mode, valtype, FIRST_RET_REG);
2735 }
2736
2737 /* Define where to put the arguments to a function.
2738 Value is zero to push the argument on the stack,
2739 or a hard register in which to store the argument.
2740
2741 MODE is the argument's machine mode.
2742 TYPE is the data type of the argument (as a tree).
2743 This is null for libcalls where that information may
2744 not be available.
2745 CUM is a variable of type CUMULATIVE_ARGS which gives info about
2746 the preceding args and about the function being called.
2747 NAMED is nonzero if this argument is a named parameter
2748 (otherwise it is an extra parameter matching an ellipsis).
2749
2750 On MCore the first args are normally in registers
2751 and the rest are pushed. Any arg that starts within the first
2752 NPARM_REGS words is at least partially passed in a register unless
2753 its data type forbids. */
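/* For example (assuming FIRST_PARM_REG == 2 and NPARM_REGS == 6, as noted
   elsewhere in this file): the first named SImode argument is passed in r2,
   the second in r3, and so on; once the six argument registers are used up,
   the remaining arguments go on the stack.  */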
2754
2755 rtx
2756 mcore_function_arg (CUMULATIVE_ARGS cum, enum machine_mode mode,
2757 tree type, int named)
2758 {
2759 int arg_reg;
2760
2761 if (! named || mode == VOIDmode)
2762 return 0;
2763
2764 if (targetm.calls.must_pass_in_stack (mode, type))
2765 return 0;
2766
2767 arg_reg = ROUND_REG (cum, mode);
2768
2769 if (arg_reg < NPARM_REGS)
2770 return handle_structs_in_regs (mode, type, FIRST_PARM_REG + arg_reg);
2771
2772 return 0;
2773 }
2774
2775 /* Returns the number of bytes of argument registers required to hold *part*
2776 of a parameter of machine mode MODE and type TYPE (which may be NULL if
2777 the type is not known). If the argument fits entirely in the argument
2778 registers, or entirely on the stack, then 0 is returned. CUM is the
2779 number of argument registers already used by earlier parameters to
2780 the function. */
2781
2782 static int
2783 mcore_arg_partial_bytes (CUMULATIVE_ARGS *cum, enum machine_mode mode,
2784 tree type, bool named)
2785 {
2786 int reg = ROUND_REG (*cum, mode);
2787
2788 if (named == 0)
2789 return 0;
2790
2791 if (targetm.calls.must_pass_in_stack (mode, type))
2792 return 0;
2793
2794 /* REG is not the *hardware* register number of the register that holds
2795 the argument, it is the *argument* register number. So for example,
2796 the first argument to a function goes in argument register 0, which
2797 translates (for the MCore) into hardware register 2. The second
2798 argument goes into argument register 1, which translates into hardware
2799 register 3, and so on. NPARM_REGS is the number of argument registers
2800 supported by the target, not the maximum hardware register number of
2801 the target. */
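  /* Worked example (hypothetical): with NPARM_REGS == 6, if earlier arguments
     have consumed 4 argument registers and this argument needs 3 words, then
     reg + 3 > 6, so 6 - 4 = 2 registers (8 bytes) hold the first part and
     the final word goes on the stack.  */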
2802 if (reg >= NPARM_REGS)
2803 return 0;
2804
2805 /* If the argument fits entirely in registers, return 0. */
2806 if (reg + mcore_num_arg_regs (mode, type) <= NPARM_REGS)
2807 return 0;
2808
2809 /* The argument overflows the number of available argument registers.
2810 Compute how many argument registers have not yet been assigned to
2811 hold an argument. */
2812 reg = NPARM_REGS - reg;
2813
2814 /* Return partially in registers and partially on the stack. */
2815 return reg * UNITS_PER_WORD;
2816 }
2817 \f
2818 /* Return nonzero if SYMBOL is marked as being dllexport'd. */
2819
2820 int
2821 mcore_dllexport_name_p (const char * symbol)
2822 {
2823 return symbol[0] == '@' && symbol[1] == 'e' && symbol[2] == '.';
2824 }
2825
2826 /* Return nonzero if SYMBOL is marked as being dllimport'd. */
2827
2828 int
2829 mcore_dllimport_name_p (const char * symbol)
2830 {
2831 return symbol[0] == '@' && symbol[1] == 'i' && symbol[2] == '.';
2832 }
2833
2834 /* Mark a DECL as being dllexport'd. */
2835
2836 static void
2837 mcore_mark_dllexport (tree decl)
2838 {
2839 const char * oldname;
2840 char * newname;
2841 rtx rtlname;
2842 tree idp;
2843
2844 rtlname = XEXP (DECL_RTL (decl), 0);
2845
2846 if (GET_CODE (rtlname) == MEM)
2847 rtlname = XEXP (rtlname, 0);
2848 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2849 oldname = XSTR (rtlname, 0);
2850
2851 if (mcore_dllexport_name_p (oldname))
2852 return; /* Already done. */
2853
2854 newname = alloca (strlen (oldname) + 4);
2855 sprintf (newname, "@e.%s", oldname);
2856
2857 /* We pass newname through get_identifier to ensure it has a unique
2858 address. RTL processing can sometimes peek inside the symbol ref
2859 and compare the string's addresses to see if two symbols are
2860 identical. */
2861 /* ??? At least I think that's why we do this. */
2862 idp = get_identifier (newname);
2863
2864 XEXP (DECL_RTL (decl), 0) =
2865 gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
2866 }
2867
2868 /* Mark a DECL as being dllimport'd. */
2869
2870 static void
2871 mcore_mark_dllimport (tree decl)
2872 {
2873 const char * oldname;
2874 char * newname;
2875 tree idp;
2876 rtx rtlname;
2877 rtx newrtl;
2878
2879 rtlname = XEXP (DECL_RTL (decl), 0);
2880
2881 if (GET_CODE (rtlname) == MEM)
2882 rtlname = XEXP (rtlname, 0);
2883 gcc_assert (GET_CODE (rtlname) == SYMBOL_REF);
2884 oldname = XSTR (rtlname, 0);
2885
2886 gcc_assert (!mcore_dllexport_name_p (oldname));
2887 if (mcore_dllimport_name_p (oldname))
2888 return; /* Already done. */
2889
2890 /* ??? One can well ask why we're making these checks here,
2891 and that would be a good question. */
2892
2893 /* Imported variables can't be initialized. */
2894 if (TREE_CODE (decl) == VAR_DECL
2895 && !DECL_VIRTUAL_P (decl)
2896 && DECL_INITIAL (decl))
2897 {
2898 error ("%Jinitialized variable '%D' is marked dllimport", decl, decl);
2899 return;
2900 }
2901
2902 /* `extern' needn't be specified with dllimport.
2903 Specify `extern' now and hope for the best. Sigh. */
2904 if (TREE_CODE (decl) == VAR_DECL
2905 /* ??? Is this test for vtables needed? */
2906 && !DECL_VIRTUAL_P (decl))
2907 {
2908 DECL_EXTERNAL (decl) = 1;
2909 TREE_PUBLIC (decl) = 1;
2910 }
2911
2912 newname = alloca (strlen (oldname) + 11);
2913 sprintf (newname, "@i.__imp_%s", oldname);
2914
2915 /* We pass newname through get_identifier to ensure it has a unique
2916 address. RTL processing can sometimes peek inside the symbol ref
2917 and compare the string's addresses to see if two symbols are
2918 identical. */
2919 /* ??? At least I think that's why we do this. */
2920 idp = get_identifier (newname);
2921
2922 newrtl = gen_rtx_MEM (Pmode,
2923 gen_rtx_SYMBOL_REF (Pmode,
2924 IDENTIFIER_POINTER (idp)));
2925 XEXP (DECL_RTL (decl), 0) = newrtl;
2926 }
2927
2928 static int
2929 mcore_dllexport_p (tree decl)
2930 {
2931 if ( TREE_CODE (decl) != VAR_DECL
2932 && TREE_CODE (decl) != FUNCTION_DECL)
2933 return 0;
2934
2935 return lookup_attribute ("dllexport", DECL_ATTRIBUTES (decl)) != 0;
2936 }
2937
2938 static int
2939 mcore_dllimport_p (tree decl)
2940 {
2941 if ( TREE_CODE (decl) != VAR_DECL
2942 && TREE_CODE (decl) != FUNCTION_DECL)
2943 return 0;
2944
2945 return lookup_attribute ("dllimport", DECL_ATTRIBUTES (decl)) != 0;
2946 }
2947
2948 /* We must mark dll symbols specially. Definitions of dllexport'd objects
2949 install some info in the .drectve (PE) or .exports (ELF) sections. */
2950
2951 static void
2952 mcore_encode_section_info (tree decl, rtx rtl ATTRIBUTE_UNUSED, int first ATTRIBUTE_UNUSED)
2953 {
2954 /* Mark the decl so we can tell from the rtl whether the object is
2955 dllexport'd or dllimport'd. */
2956 if (mcore_dllexport_p (decl))
2957 mcore_mark_dllexport (decl);
2958 else if (mcore_dllimport_p (decl))
2959 mcore_mark_dllimport (decl);
2960
2961 /* It might be that DECL has already been marked as dllimport, but
2962 a subsequent definition nullified that. The attribute is gone
2963 but DECL_RTL still has @i.__imp_foo. We need to remove that. */
2964 else if ((TREE_CODE (decl) == FUNCTION_DECL
2965 || TREE_CODE (decl) == VAR_DECL)
2966 && DECL_RTL (decl) != NULL_RTX
2967 && GET_CODE (DECL_RTL (decl)) == MEM
2968 && GET_CODE (XEXP (DECL_RTL (decl), 0)) == MEM
2969 && GET_CODE (XEXP (XEXP (DECL_RTL (decl), 0), 0)) == SYMBOL_REF
2970 && mcore_dllimport_name_p (XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0)))
2971 {
2972 const char * oldname = XSTR (XEXP (XEXP (DECL_RTL (decl), 0), 0), 0);
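      /* The "@i.__imp_" prefix is 9 characters long, so oldname + 9 is the
         original, unadorned symbol name.  */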
2973 tree idp = get_identifier (oldname + 9);
2974 rtx newrtl = gen_rtx_SYMBOL_REF (Pmode, IDENTIFIER_POINTER (idp));
2975
2976 XEXP (DECL_RTL (decl), 0) = newrtl;
2977
2978 /* We previously set TREE_PUBLIC and DECL_EXTERNAL.
2979 ??? We leave these alone for now. */
2980 }
2981 }
2982
2983 /* Undo the effects of the above. */
2984
2985 static const char *
2986 mcore_strip_name_encoding (const char * str)
2987 {
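  /* i.e. "@e.foo" becomes "foo" and "@i.__imp_foo" becomes "__imp_foo".  */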
2988 return str + (str[0] == '@' ? 3 : 0);
2989 }
2990
2991 /* MCore specific attribute support.
2992 dllexport - for exporting a function/variable that will live in a dll
2993 dllimport - for importing a function/variable from a dll
2994 naked - do not create a function prologue/epilogue. */
2995
2996 const struct attribute_spec mcore_attribute_table[] =
2997 {
2998 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler } */
2999 { "dllexport", 0, 0, true, false, false, NULL },
3000 { "dllimport", 0, 0, true, false, false, NULL },
3001 { "naked", 0, 0, true, false, false, mcore_handle_naked_attribute },
3002 { NULL, 0, 0, false, false, false, NULL }
3003 };
3004
3005 /* Handle a "naked" attribute; arguments as in
3006 struct attribute_spec.handler. */
3007
3008 static tree
3009 mcore_handle_naked_attribute (tree * node, tree name, tree args ATTRIBUTE_UNUSED,
3010 int flags ATTRIBUTE_UNUSED, bool * no_add_attrs)
3011 {
3012 if (TREE_CODE (*node) == FUNCTION_DECL)
3013 {
3014 /* PR14310 - don't complain about lack of return statement
3015 in naked functions. The solution here is a gross hack
3016 but this is the only way to solve the problem without
3017 adding a new feature to GCC. I did try submitting a patch
3018 that would add such a new feature, but it was (rightfully)
3019 rejected on the grounds that it was creeping featurism,
3020 hence this code. */
3021 if (warn_return_type)
3022 {
3023 saved_warn_return_type = warn_return_type;
3024 warn_return_type = 0;
3025 saved_warn_return_type_count = 2;
3026 }
3027 else if (saved_warn_return_type_count)
3028 saved_warn_return_type_count = 2;
3029 }
3030 else
3031 {
3032 warning (OPT_Wattributes, "%qs attribute only applies to functions",
3033 IDENTIFIER_POINTER (name));
3034 *no_add_attrs = true;
3035 }
3036
3037 return NULL_TREE;
3038 }
3039
3040 /* ??? It looks like this is PE specific? Oh well, this is what the
3041 old code did as well. */
3042
3043 static void
3044 mcore_unique_section (tree decl, int reloc ATTRIBUTE_UNUSED)
3045 {
3046 int len;
3047 const char * name;
3048 char * string;
3049 const char * prefix;
3050
3051 name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (decl));
3052
3053 /* Strip off any encoding in name. */
3054 name = (* targetm.strip_name_encoding) (name);
3055
3056 /* The object is put in, for example, section .text$foo.
3057 The linker will then ultimately place it in .text
3058 (everything from the $ on is stripped). */
3059 if (TREE_CODE (decl) == FUNCTION_DECL)
3060 prefix = ".text$";
3061 /* For compatibility with EPOC, we ignore the fact that the
3062 section might have relocs against it. */
3063 else if (decl_readonly_section (decl, 0))
3064 prefix = ".rdata$";
3065 else
3066 prefix = ".data$";
3067
3068 len = strlen (name) + strlen (prefix);
3069 string = alloca (len + 1);
3070
3071 sprintf (string, "%s%s", prefix, name);
3072
3073 DECL_SECTION_NAME (decl) = build_string (len, string);
3074 }
3075
3076 int
3077 mcore_naked_function_p (void)
3078 {
3079 return lookup_attribute ("naked", DECL_ATTRIBUTES (current_function_decl)) != NULL_TREE;
3080 }
3081
3082 #ifdef OBJECT_FORMAT_ELF
3083 static void
3084 mcore_asm_named_section (const char *name,
3085 unsigned int flags ATTRIBUTE_UNUSED,
3086 tree decl ATTRIBUTE_UNUSED)
3087 {
3088 fprintf (asm_out_file, "\t.section %s\n", name);
3089 }
3090 #endif /* OBJECT_FORMAT_ELF */
3091
3092 /* Worker function for TARGET_ASM_EXTERNAL_LIBCALL. */
3093
3094 static void
3095 mcore_external_libcall (rtx fun)
3096 {
3097 fprintf (asm_out_file, "\t.import\t");
3098 assemble_name (asm_out_file, XSTR (fun, 0));
3099 fprintf (asm_out_file, "\n");
3100 }
3101
3102 /* Worker function for TARGET_RETURN_IN_MEMORY. */
3103
3104 static bool
3105 mcore_return_in_memory (tree type, tree fntype ATTRIBUTE_UNUSED)
3106 {
3107 HOST_WIDE_INT size = int_size_in_bytes (type);
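  /* Aggregates of unknown size (-1) or larger than two words -- 8 bytes,
     given UNITS_PER_WORD == 4 on this 32-bit target -- are returned in
     memory; anything smaller comes back in registers.  */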
3108 return (size == -1 || size > 2 * UNITS_PER_WORD);
3109 }