]> git.ipfire.org Git - thirdparty/gcc.git/blob - gcc/config/mips/mips.c
frv.h: Clean up references to GO_IF_LEGITIMATE_ADDRESS.
[thirdparty/gcc.git] / gcc / config / mips / mips.c
1 /* Subroutines used for MIPS code generation.
2 Copyright (C) 1989, 1990, 1991, 1993, 1994, 1995, 1996, 1997, 1998,
3 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009
4 Free Software Foundation, Inc.
5 Contributed by A. Lichnewsky, lich@inria.inria.fr.
6 Changes by Michael Meissner, meissner@osf.org.
7 64-bit r4000 support by Ian Lance Taylor, ian@cygnus.com, and
8 Brendan Eich, brendan@microunity.com.
9
10 This file is part of GCC.
11
12 GCC is free software; you can redistribute it and/or modify
13 it under the terms of the GNU General Public License as published by
14 the Free Software Foundation; either version 3, or (at your option)
15 any later version.
16
17 GCC is distributed in the hope that it will be useful,
18 but WITHOUT ANY WARRANTY; without even the implied warranty of
19 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 GNU General Public License for more details.
21
22 You should have received a copy of the GNU General Public License
23 along with GCC; see the file COPYING3. If not see
24 <http://www.gnu.org/licenses/>. */
25
26 #include "config.h"
27 #include "system.h"
28 #include "coretypes.h"
29 #include "tm.h"
30 #include <signal.h>
31 #include "rtl.h"
32 #include "regs.h"
33 #include "hard-reg-set.h"
34 #include "real.h"
35 #include "insn-config.h"
36 #include "conditions.h"
37 #include "insn-attr.h"
38 #include "recog.h"
39 #include "toplev.h"
40 #include "output.h"
41 #include "tree.h"
42 #include "function.h"
43 #include "expr.h"
44 #include "optabs.h"
45 #include "libfuncs.h"
46 #include "flags.h"
47 #include "reload.h"
48 #include "tm_p.h"
49 #include "ggc.h"
50 #include "gstab.h"
51 #include "hashtab.h"
52 #include "debug.h"
53 #include "target.h"
54 #include "target-def.h"
55 #include "integrate.h"
56 #include "langhooks.h"
57 #include "cfglayout.h"
58 #include "sched-int.h"
59 #include "gimple.h"
60 #include "bitmap.h"
61 #include "diagnostic.h"
62
63 /* True if X is an UNSPEC wrapper around a SYMBOL_REF or LABEL_REF. */
64 #define UNSPEC_ADDRESS_P(X) \
65 (GET_CODE (X) == UNSPEC \
66 && XINT (X, 1) >= UNSPEC_ADDRESS_FIRST \
67 && XINT (X, 1) < UNSPEC_ADDRESS_FIRST + NUM_SYMBOL_TYPES)
68
69 /* Extract the symbol or label from UNSPEC wrapper X. */
70 #define UNSPEC_ADDRESS(X) \
71 XVECEXP (X, 0, 0)
72
73 /* Extract the symbol type from UNSPEC wrapper X. */
74 #define UNSPEC_ADDRESS_TYPE(X) \
75 ((enum mips_symbol_type) (XINT (X, 1) - UNSPEC_ADDRESS_FIRST))
76
77 /* The maximum distance between the top of the stack frame and the
78 value $sp has when we save and restore registers.
79
80 The value for normal-mode code must be a SMALL_OPERAND and must
81 preserve the maximum stack alignment. We therefore use a value
82 of 0x7ff0 in this case.
83
84 MIPS16e SAVE and RESTORE instructions can adjust the stack pointer by
85 up to 0x7f8 bytes and can usually save or restore all the registers
86 that we need to save or restore. (Note that we can only use these
87 instructions for o32, for which the stack alignment is 8 bytes.)
88
89 We use a maximum gap of 0x100 or 0x400 for MIPS16 code when SAVE and
90 RESTORE are not available. We can then use unextended instructions
91 to save and restore registers, and to allocate and deallocate the top
92 part of the frame. */
93 #define MIPS_MAX_FIRST_STACK_STEP \
94 (!TARGET_MIPS16 ? 0x7ff0 \
95 : GENERATE_MIPS16E_SAVE_RESTORE ? 0x7f8 \
96 : TARGET_64BIT ? 0x100 : 0x400)
97
98 /* True if INSN is a mips.md pattern or asm statement. */
99 #define USEFUL_INSN_P(INSN) \
100 (INSN_P (INSN) \
101 && GET_CODE (PATTERN (INSN)) != USE \
102 && GET_CODE (PATTERN (INSN)) != CLOBBER \
103 && GET_CODE (PATTERN (INSN)) != ADDR_VEC \
104 && GET_CODE (PATTERN (INSN)) != ADDR_DIFF_VEC)
105
106 /* If INSN is a delayed branch sequence, return the first instruction
107 in the sequence, otherwise return INSN itself. */
108 #define SEQ_BEGIN(INSN) \
109 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \
110 ? XVECEXP (PATTERN (INSN), 0, 0) \
111 : (INSN))
112
113 /* Likewise for the last instruction in a delayed branch sequence. */
114 #define SEQ_END(INSN) \
115 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \
116 ? XVECEXP (PATTERN (INSN), 0, XVECLEN (PATTERN (INSN), 0) - 1) \
117 : (INSN))
118
119 /* Execute the following loop body with SUBINSN set to each instruction
120 between SEQ_BEGIN (INSN) and SEQ_END (INSN) inclusive. */
121 #define FOR_EACH_SUBINSN(SUBINSN, INSN) \
122 for ((SUBINSN) = SEQ_BEGIN (INSN); \
123 (SUBINSN) != NEXT_INSN (SEQ_END (INSN)); \
124 (SUBINSN) = NEXT_INSN (SUBINSN))
125
126 /* True if bit BIT is set in VALUE. */
127 #define BITSET_P(VALUE, BIT) (((VALUE) & (1 << (BIT))) != 0)
128
129 /* Classifies an address.
130
131 ADDRESS_REG
132 A natural register + offset address. The register satisfies
133 mips_valid_base_register_p and the offset is a const_arith_operand.
134
135 ADDRESS_LO_SUM
136 A LO_SUM rtx. The first operand is a valid base register and
137 the second operand is a symbolic address.
138
139 ADDRESS_CONST_INT
140 A signed 16-bit constant address.
141
142 ADDRESS_SYMBOLIC:
143 A constant symbolic address. */
144 enum mips_address_type {
145 ADDRESS_REG,
146 ADDRESS_LO_SUM,
147 ADDRESS_CONST_INT,
148 ADDRESS_SYMBOLIC
149 };
150
151 /* Enumerates the setting of the -mr10k-cache-barrier option. */
152 enum mips_r10k_cache_barrier_setting {
153 R10K_CACHE_BARRIER_NONE,
154 R10K_CACHE_BARRIER_STORE,
155 R10K_CACHE_BARRIER_LOAD_STORE
156 };
157
158 /* Macros to create an enumeration identifier for a function prototype. */
159 #define MIPS_FTYPE_NAME1(A, B) MIPS_##A##_FTYPE_##B
160 #define MIPS_FTYPE_NAME2(A, B, C) MIPS_##A##_FTYPE_##B##_##C
161 #define MIPS_FTYPE_NAME3(A, B, C, D) MIPS_##A##_FTYPE_##B##_##C##_##D
162 #define MIPS_FTYPE_NAME4(A, B, C, D, E) MIPS_##A##_FTYPE_##B##_##C##_##D##_##E
163
164 /* Classifies the prototype of a built-in function. */
165 enum mips_function_type {
166 #define DEF_MIPS_FTYPE(NARGS, LIST) MIPS_FTYPE_NAME##NARGS LIST,
167 #include "config/mips/mips-ftypes.def"
168 #undef DEF_MIPS_FTYPE
169 MIPS_MAX_FTYPE_MAX
170 };
171
172 /* Specifies how a built-in function should be converted into rtl. */
173 enum mips_builtin_type {
174 /* The function corresponds directly to an .md pattern. The return
175 value is mapped to operand 0 and the arguments are mapped to
176 operands 1 and above. */
177 MIPS_BUILTIN_DIRECT,
178
179 /* The function corresponds directly to an .md pattern. There is no return
180 value and the arguments are mapped to operands 0 and above. */
181 MIPS_BUILTIN_DIRECT_NO_TARGET,
182
183 /* The function corresponds to a comparison instruction followed by
184 a mips_cond_move_tf_ps pattern. The first two arguments are the
185 values to compare and the second two arguments are the vector
186 operands for the movt.ps or movf.ps instruction (in assembly order). */
187 MIPS_BUILTIN_MOVF,
188 MIPS_BUILTIN_MOVT,
189
190 /* The function corresponds to a V2SF comparison instruction. Operand 0
191 of this instruction is the result of the comparison, which has mode
192 CCV2 or CCV4. The function arguments are mapped to operands 1 and
193 above. The function's return value is an SImode boolean that is
194 true under the following conditions:
195
196 MIPS_BUILTIN_CMP_ANY: one of the registers is true
197 MIPS_BUILTIN_CMP_ALL: all of the registers are true
198 MIPS_BUILTIN_CMP_LOWER: the first register is true
199 MIPS_BUILTIN_CMP_UPPER: the second register is true. */
200 MIPS_BUILTIN_CMP_ANY,
201 MIPS_BUILTIN_CMP_ALL,
202 MIPS_BUILTIN_CMP_UPPER,
203 MIPS_BUILTIN_CMP_LOWER,
204
205 /* As above, but the instruction only sets a single $fcc register. */
206 MIPS_BUILTIN_CMP_SINGLE,
207
208 /* For generating bposge32 branch instructions in MIPS32 DSP ASE. */
209 MIPS_BUILTIN_BPOSGE32
210 };
211
212 /* Invoke MACRO (COND) for each C.cond.fmt condition. */
213 #define MIPS_FP_CONDITIONS(MACRO) \
214 MACRO (f), \
215 MACRO (un), \
216 MACRO (eq), \
217 MACRO (ueq), \
218 MACRO (olt), \
219 MACRO (ult), \
220 MACRO (ole), \
221 MACRO (ule), \
222 MACRO (sf), \
223 MACRO (ngle), \
224 MACRO (seq), \
225 MACRO (ngl), \
226 MACRO (lt), \
227 MACRO (nge), \
228 MACRO (le), \
229 MACRO (ngt)
230
231 /* Enumerates the codes above as MIPS_FP_COND_<X>. */
232 #define DECLARE_MIPS_COND(X) MIPS_FP_COND_ ## X
233 enum mips_fp_condition {
234 MIPS_FP_CONDITIONS (DECLARE_MIPS_COND)
235 };
236
237 /* Index X provides the string representation of MIPS_FP_COND_<X>. */
238 #define STRINGIFY(X) #X
239 static const char *const mips_fp_conditions[] = {
240 MIPS_FP_CONDITIONS (STRINGIFY)
241 };
242
243 /* Information about a function's frame layout. */
244 struct GTY(()) mips_frame_info {
245 /* The size of the frame in bytes. */
246 HOST_WIDE_INT total_size;
247
248 /* The number of bytes allocated to variables. */
249 HOST_WIDE_INT var_size;
250
251 /* The number of bytes allocated to outgoing function arguments. */
252 HOST_WIDE_INT args_size;
253
254 /* The number of bytes allocated to the .cprestore slot, or 0 if there
255 is no such slot. */
256 HOST_WIDE_INT cprestore_size;
257
258 /* Bit X is set if the function saves or restores GPR X. */
259 unsigned int mask;
260
261 /* Likewise FPR X. */
262 unsigned int fmask;
263
264 /* Likewise doubleword accumulator X ($acX). */
265 unsigned int acc_mask;
266
267 /* The number of GPRs, FPRs, doubleword accumulators and COP0
268 registers saved. */
269 unsigned int num_gp;
270 unsigned int num_fp;
271 unsigned int num_acc;
272 unsigned int num_cop0_regs;
273
274 /* The offset of the topmost GPR, FPR, accumulator and COP0-register
275 save slots from the top of the frame, or zero if no such slots are
276 needed. */
277 HOST_WIDE_INT gp_save_offset;
278 HOST_WIDE_INT fp_save_offset;
279 HOST_WIDE_INT acc_save_offset;
280 HOST_WIDE_INT cop0_save_offset;
281
282 /* Likewise, but giving offsets from the bottom of the frame. */
283 HOST_WIDE_INT gp_sp_offset;
284 HOST_WIDE_INT fp_sp_offset;
285 HOST_WIDE_INT acc_sp_offset;
286 HOST_WIDE_INT cop0_sp_offset;
287
288 /* The offset of arg_pointer_rtx from the bottom of the frame. */
289 HOST_WIDE_INT arg_pointer_offset;
290
291 /* The offset of hard_frame_pointer_rtx from the bottom of the frame. */
292 HOST_WIDE_INT hard_frame_pointer_offset;
293 };
294
295 struct GTY(()) machine_function {
296 /* The register returned by mips16_gp_pseudo_reg; see there for details. */
297 rtx mips16_gp_pseudo_rtx;
298
299 /* The number of extra stack bytes taken up by register varargs.
300 This area is allocated by the callee at the very top of the frame. */
301 int varargs_size;
302
303 /* The current frame information, calculated by mips_compute_frame_info. */
304 struct mips_frame_info frame;
305
306 /* The register to use as the function's global pointer, or INVALID_REGNUM
307 if the function doesn't need one. */
308 unsigned int global_pointer;
309
310 /* True if mips_adjust_insn_length should ignore an instruction's
311 hazard attribute. */
312 bool ignore_hazard_length_p;
313
314 /* True if the whole function is suitable for .set noreorder and
315 .set nomacro. */
316 bool all_noreorder_p;
317
318 /* True if the function is known to have an instruction that needs $gp. */
319 bool has_gp_insn_p;
320
321 /* True if we have emitted an instruction to initialize
322 mips16_gp_pseudo_rtx. */
323 bool initialized_mips16_gp_pseudo_p;
324
325 /* True if this is an interrupt handler. */
326 bool interrupt_handler_p;
327
328 /* True if this is an interrupt handler that uses shadow registers. */
329 bool use_shadow_register_set_p;
330
331 /* True if this is an interrupt handler that should keep interrupts
332 masked. */
333 bool keep_interrupts_masked_p;
334
335 /* True if this is an interrupt handler that should use DERET
336 instead of ERET. */
337 bool use_debug_exception_return_p;
338 };
339
340 /* Information about a single argument. */
341 struct mips_arg_info {
342 /* True if the argument is passed in a floating-point register, or
343 would have been if we hadn't run out of registers. */
344 bool fpr_p;
345
346 /* The number of words passed in registers, rounded up. */
347 unsigned int reg_words;
348
349 /* For EABI, the offset of the first register from GP_ARG_FIRST or
350 FP_ARG_FIRST. For other ABIs, the offset of the first register from
351 the start of the ABI's argument structure (see the CUMULATIVE_ARGS
352 comment for details).
353
354 The value is MAX_ARGS_IN_REGISTERS if the argument is passed entirely
355 on the stack. */
356 unsigned int reg_offset;
357
358 /* The number of words that must be passed on the stack, rounded up. */
359 unsigned int stack_words;
360
361 /* The offset from the start of the stack overflow area of the argument's
362 first stack word. Only meaningful when STACK_WORDS is nonzero. */
363 unsigned int stack_offset;
364 };
365
366 /* Information about an address described by mips_address_type.
367
368 ADDRESS_CONST_INT
369 No fields are used.
370
371 ADDRESS_REG
372 REG is the base register and OFFSET is the constant offset.
373
374 ADDRESS_LO_SUM
375 REG and OFFSET are the operands to the LO_SUM and SYMBOL_TYPE
376 is the type of symbol it references.
377
378 ADDRESS_SYMBOLIC
379 SYMBOL_TYPE is the type of symbol that the address references. */
380 struct mips_address_info {
381 enum mips_address_type type;
382 rtx reg;
383 rtx offset;
384 enum mips_symbol_type symbol_type;
385 };
386
387 /* One stage in a constant building sequence. These sequences have
388 the form:
389
390 A = VALUE[0]
391 A = A CODE[1] VALUE[1]
392 A = A CODE[2] VALUE[2]
393 ...
394
395 where A is an accumulator, each CODE[i] is a binary rtl operation
396 and each VALUE[i] is a constant integer. CODE[0] is undefined. */
397 struct mips_integer_op {
398 enum rtx_code code;
399 unsigned HOST_WIDE_INT value;
400 };
401
402 /* The largest number of operations needed to load an integer constant.
403 The worst accepted case for 64-bit constants is LUI,ORI,SLL,ORI,SLL,ORI.
404 When the lowest bit is clear, we can try, but reject a sequence with
405 an extra SLL at the end. */
406 #define MIPS_MAX_INTEGER_OPS 7
407
408 /* Information about a MIPS16e SAVE or RESTORE instruction. */
409 struct mips16e_save_restore_info {
410 /* The number of argument registers saved by a SAVE instruction.
411 0 for RESTORE instructions. */
412 unsigned int nargs;
413
414 /* Bit X is set if the instruction saves or restores GPR X. */
415 unsigned int mask;
416
417 /* The total number of bytes to allocate. */
418 HOST_WIDE_INT size;
419 };
420
421 /* Global variables for machine-dependent things. */
422
423 /* The -G setting, or the configuration's default small-data limit if
424 no -G option is given. */
425 static unsigned int mips_small_data_threshold;
426
427 /* The number of file directives written by mips_output_filename. */
428 int num_source_filenames;
429
430 /* The name that appeared in the last .file directive written by
431 mips_output_filename, or "" if mips_output_filename hasn't
432 written anything yet. */
433 const char *current_function_file = "";
434
435 /* A label counter used by PUT_SDB_BLOCK_START and PUT_SDB_BLOCK_END. */
436 int sdb_label_count;
437
438 /* Arrays that map GCC register numbers to debugger register numbers. */
439 int mips_dbx_regno[FIRST_PSEUDO_REGISTER];
440 int mips_dwarf_regno[FIRST_PSEUDO_REGISTER];
441
442 /* The nesting depth of the PRINT_OPERAND '%(', '%<' and '%[' constructs. */
443 int set_noreorder;
444 int set_nomacro;
445 static int set_noat;
446
447 /* True if we're writing out a branch-likely instruction rather than a
448 normal branch. */
449 static bool mips_branch_likely;
450
451 /* The current instruction-set architecture. */
452 enum processor_type mips_arch;
453 const struct mips_cpu_info *mips_arch_info;
454
455 /* The processor that we should tune the code for. */
456 enum processor_type mips_tune;
457 const struct mips_cpu_info *mips_tune_info;
458
459 /* The ISA level associated with mips_arch. */
460 int mips_isa;
461
462 /* The architecture selected by -mipsN, or null if -mipsN wasn't used. */
463 static const struct mips_cpu_info *mips_isa_option_info;
464
465 /* Which ABI to use. */
466 int mips_abi = MIPS_ABI_DEFAULT;
467
468 /* Which cost information to use. */
469 const struct mips_rtx_cost_data *mips_cost;
470
471 /* The ambient target flags, excluding MASK_MIPS16. */
472 static int mips_base_target_flags;
473
474 /* True if MIPS16 is the default mode. */
475 bool mips_base_mips16;
476
477 /* The ambient values of other global variables. */
478 static int mips_base_schedule_insns; /* flag_schedule_insns */
479 static int mips_base_reorder_blocks_and_partition; /* flag_reorder... */
480 static int mips_base_move_loop_invariants; /* flag_move_loop_invariants */
481 static int mips_base_align_loops; /* align_loops */
482 static int mips_base_align_jumps; /* align_jumps */
483 static int mips_base_align_functions; /* align_functions */
484
485 /* The -mcode-readable setting. */
486 enum mips_code_readable_setting mips_code_readable = CODE_READABLE_YES;
487
488 /* The -mr10k-cache-barrier setting. */
489 static enum mips_r10k_cache_barrier_setting mips_r10k_cache_barrier;
490
491 /* Index [M][R] is true if register R is allowed to hold a value of mode M. */
492 bool mips_hard_regno_mode_ok[(int) MAX_MACHINE_MODE][FIRST_PSEUDO_REGISTER];
493
494 /* Index C is true if character C is a valid PRINT_OPERAND punctation
495 character. */
496 bool mips_print_operand_punct[256];
497
498 static GTY (()) int mips_output_filename_first_time = 1;
499
500 /* mips_split_p[X] is true if symbols of type X can be split by
501 mips_split_symbol. */
502 bool mips_split_p[NUM_SYMBOL_TYPES];
503
504 /* mips_split_hi_p[X] is true if the high parts of symbols of type X
505 can be split by mips_split_symbol. */
506 bool mips_split_hi_p[NUM_SYMBOL_TYPES];
507
508 /* mips_lo_relocs[X] is the relocation to use when a symbol of type X
509 appears in a LO_SUM. It can be null if such LO_SUMs aren't valid or
510 if they are matched by a special .md file pattern. */
511 static const char *mips_lo_relocs[NUM_SYMBOL_TYPES];
512
513 /* Likewise for HIGHs. */
514 static const char *mips_hi_relocs[NUM_SYMBOL_TYPES];
515
516 /* Index R is the smallest register class that contains register R. */
517 const enum reg_class mips_regno_to_class[FIRST_PSEUDO_REGISTER] = {
518 LEA_REGS, LEA_REGS, M16_REGS, V1_REG,
519 M16_REGS, M16_REGS, M16_REGS, M16_REGS,
520 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
521 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
522 M16_REGS, M16_REGS, LEA_REGS, LEA_REGS,
523 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
524 T_REG, PIC_FN_ADDR_REG, LEA_REGS, LEA_REGS,
525 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
526 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
527 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
528 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
529 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
530 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
531 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
532 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
533 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
534 MD0_REG, MD1_REG, NO_REGS, ST_REGS,
535 ST_REGS, ST_REGS, ST_REGS, ST_REGS,
536 ST_REGS, ST_REGS, ST_REGS, NO_REGS,
537 NO_REGS, FRAME_REGS, FRAME_REGS, NO_REGS,
538 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
539 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
540 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
541 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
542 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
543 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
544 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
545 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
546 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
547 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
548 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
549 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
550 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
551 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
552 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
553 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
554 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
555 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
556 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
557 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
558 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
559 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
560 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
561 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
562 DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS,
563 DSP_ACC_REGS, DSP_ACC_REGS, ALL_REGS, ALL_REGS,
564 ALL_REGS, ALL_REGS, ALL_REGS, ALL_REGS
565 };
566
567 /* The value of TARGET_ATTRIBUTE_TABLE. */
568 const struct attribute_spec mips_attribute_table[] = {
569 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler } */
570 { "long_call", 0, 0, false, true, true, NULL },
571 { "far", 0, 0, false, true, true, NULL },
572 { "near", 0, 0, false, true, true, NULL },
573 /* We would really like to treat "mips16" and "nomips16" as type
574 attributes, but GCC doesn't provide the hooks we need to support
575 the right conversion rules. As declaration attributes, they affect
576 code generation but don't carry other semantics. */
577 { "mips16", 0, 0, true, false, false, NULL },
578 { "nomips16", 0, 0, true, false, false, NULL },
579 /* Allow functions to be specified as interrupt handlers */
580 { "interrupt", 0, 0, false, true, true, NULL },
581 { "use_shadow_register_set", 0, 0, false, true, true, NULL },
582 { "keep_interrupts_masked", 0, 0, false, true, true, NULL },
583 { "use_debug_exception_return", 0, 0, false, true, true, NULL },
584 { NULL, 0, 0, false, false, false, NULL }
585 };
586 \f
587 /* A table describing all the processors GCC knows about. Names are
588 matched in the order listed. The first mention of an ISA level is
589 taken as the canonical name for that ISA.
590
591 To ease comparison, please keep this table in the same order
592 as GAS's mips_cpu_info_table. Please also make sure that
593 MIPS_ISA_LEVEL_SPEC and MIPS_ARCH_FLOAT_SPEC handle all -march
594 options correctly. */
595 static const struct mips_cpu_info mips_cpu_info_table[] = {
596 /* Entries for generic ISAs. */
597 { "mips1", PROCESSOR_R3000, 1, 0 },
598 { "mips2", PROCESSOR_R6000, 2, 0 },
599 { "mips3", PROCESSOR_R4000, 3, 0 },
600 { "mips4", PROCESSOR_R8000, 4, 0 },
601 /* Prefer not to use branch-likely instructions for generic MIPS32rX
602 and MIPS64rX code. The instructions were officially deprecated
603 in revisions 2 and earlier, but revision 3 is likely to downgrade
604 that to a recommendation to avoid the instructions in code that
605 isn't tuned to a specific processor. */
606 { "mips32", PROCESSOR_4KC, 32, PTF_AVOID_BRANCHLIKELY },
607 { "mips32r2", PROCESSOR_M4K, 33, PTF_AVOID_BRANCHLIKELY },
608 { "mips64", PROCESSOR_5KC, 64, PTF_AVOID_BRANCHLIKELY },
609 /* ??? For now just tune the generic MIPS64r2 for 5KC as well. */
610 { "mips64r2", PROCESSOR_5KC, 65, PTF_AVOID_BRANCHLIKELY },
611
612 /* MIPS I processors. */
613 { "r3000", PROCESSOR_R3000, 1, 0 },
614 { "r2000", PROCESSOR_R3000, 1, 0 },
615 { "r3900", PROCESSOR_R3900, 1, 0 },
616
617 /* MIPS II processors. */
618 { "r6000", PROCESSOR_R6000, 2, 0 },
619
620 /* MIPS III processors. */
621 { "r4000", PROCESSOR_R4000, 3, 0 },
622 { "vr4100", PROCESSOR_R4100, 3, 0 },
623 { "vr4111", PROCESSOR_R4111, 3, 0 },
624 { "vr4120", PROCESSOR_R4120, 3, 0 },
625 { "vr4130", PROCESSOR_R4130, 3, 0 },
626 { "vr4300", PROCESSOR_R4300, 3, 0 },
627 { "r4400", PROCESSOR_R4000, 3, 0 },
628 { "r4600", PROCESSOR_R4600, 3, 0 },
629 { "orion", PROCESSOR_R4600, 3, 0 },
630 { "r4650", PROCESSOR_R4650, 3, 0 },
631 /* ST Loongson 2E/2F processors. */
632 { "loongson2e", PROCESSOR_LOONGSON_2E, 3, PTF_AVOID_BRANCHLIKELY },
633 { "loongson2f", PROCESSOR_LOONGSON_2F, 3, PTF_AVOID_BRANCHLIKELY },
634
635 /* MIPS IV processors. */
636 { "r8000", PROCESSOR_R8000, 4, 0 },
637 { "r10000", PROCESSOR_R10000, 4, 0 },
638 { "r12000", PROCESSOR_R10000, 4, 0 },
639 { "r14000", PROCESSOR_R10000, 4, 0 },
640 { "r16000", PROCESSOR_R10000, 4, 0 },
641 { "vr5000", PROCESSOR_R5000, 4, 0 },
642 { "vr5400", PROCESSOR_R5400, 4, 0 },
643 { "vr5500", PROCESSOR_R5500, 4, PTF_AVOID_BRANCHLIKELY },
644 { "rm7000", PROCESSOR_R7000, 4, 0 },
645 { "rm9000", PROCESSOR_R9000, 4, 0 },
646
647 /* MIPS32 processors. */
648 { "4kc", PROCESSOR_4KC, 32, 0 },
649 { "4km", PROCESSOR_4KC, 32, 0 },
650 { "4kp", PROCESSOR_4KP, 32, 0 },
651 { "4ksc", PROCESSOR_4KC, 32, 0 },
652
653 /* MIPS32 Release 2 processors. */
654 { "m4k", PROCESSOR_M4K, 33, 0 },
655 { "4kec", PROCESSOR_4KC, 33, 0 },
656 { "4kem", PROCESSOR_4KC, 33, 0 },
657 { "4kep", PROCESSOR_4KP, 33, 0 },
658 { "4ksd", PROCESSOR_4KC, 33, 0 },
659
660 { "24kc", PROCESSOR_24KC, 33, 0 },
661 { "24kf2_1", PROCESSOR_24KF2_1, 33, 0 },
662 { "24kf", PROCESSOR_24KF2_1, 33, 0 },
663 { "24kf1_1", PROCESSOR_24KF1_1, 33, 0 },
664 { "24kfx", PROCESSOR_24KF1_1, 33, 0 },
665 { "24kx", PROCESSOR_24KF1_1, 33, 0 },
666
667 { "24kec", PROCESSOR_24KC, 33, 0 }, /* 24K with DSP. */
668 { "24kef2_1", PROCESSOR_24KF2_1, 33, 0 },
669 { "24kef", PROCESSOR_24KF2_1, 33, 0 },
670 { "24kef1_1", PROCESSOR_24KF1_1, 33, 0 },
671 { "24kefx", PROCESSOR_24KF1_1, 33, 0 },
672 { "24kex", PROCESSOR_24KF1_1, 33, 0 },
673
674 { "34kc", PROCESSOR_24KC, 33, 0 }, /* 34K with MT/DSP. */
675 { "34kf2_1", PROCESSOR_24KF2_1, 33, 0 },
676 { "34kf", PROCESSOR_24KF2_1, 33, 0 },
677 { "34kf1_1", PROCESSOR_24KF1_1, 33, 0 },
678 { "34kfx", PROCESSOR_24KF1_1, 33, 0 },
679 { "34kx", PROCESSOR_24KF1_1, 33, 0 },
680
681 { "74kc", PROCESSOR_74KC, 33, 0 }, /* 74K with DSPr2. */
682 { "74kf2_1", PROCESSOR_74KF2_1, 33, 0 },
683 { "74kf", PROCESSOR_74KF2_1, 33, 0 },
684 { "74kf1_1", PROCESSOR_74KF1_1, 33, 0 },
685 { "74kfx", PROCESSOR_74KF1_1, 33, 0 },
686 { "74kx", PROCESSOR_74KF1_1, 33, 0 },
687 { "74kf3_2", PROCESSOR_74KF3_2, 33, 0 },
688
689 /* MIPS64 processors. */
690 { "5kc", PROCESSOR_5KC, 64, 0 },
691 { "5kf", PROCESSOR_5KF, 64, 0 },
692 { "20kc", PROCESSOR_20KC, 64, PTF_AVOID_BRANCHLIKELY },
693 { "sb1", PROCESSOR_SB1, 64, PTF_AVOID_BRANCHLIKELY },
694 { "sb1a", PROCESSOR_SB1A, 64, PTF_AVOID_BRANCHLIKELY },
695 { "sr71000", PROCESSOR_SR71000, 64, PTF_AVOID_BRANCHLIKELY },
696 { "xlr", PROCESSOR_XLR, 64, 0 },
697
698 /* MIPS64 Release 2 processors. */
699 { "octeon", PROCESSOR_OCTEON, 65, PTF_AVOID_BRANCHLIKELY }
700 };
701
702 /* Default costs. If these are used for a processor we should look
703 up the actual costs. */
704 #define DEFAULT_COSTS COSTS_N_INSNS (6), /* fp_add */ \
705 COSTS_N_INSNS (7), /* fp_mult_sf */ \
706 COSTS_N_INSNS (8), /* fp_mult_df */ \
707 COSTS_N_INSNS (23), /* fp_div_sf */ \
708 COSTS_N_INSNS (36), /* fp_div_df */ \
709 COSTS_N_INSNS (10), /* int_mult_si */ \
710 COSTS_N_INSNS (10), /* int_mult_di */ \
711 COSTS_N_INSNS (69), /* int_div_si */ \
712 COSTS_N_INSNS (69), /* int_div_di */ \
713 2, /* branch_cost */ \
714 4 /* memory_latency */
715
716 /* Floating-point costs for processors without an FPU. Just assume that
717 all floating-point libcalls are very expensive. */
718 #define SOFT_FP_COSTS COSTS_N_INSNS (256), /* fp_add */ \
719 COSTS_N_INSNS (256), /* fp_mult_sf */ \
720 COSTS_N_INSNS (256), /* fp_mult_df */ \
721 COSTS_N_INSNS (256), /* fp_div_sf */ \
722 COSTS_N_INSNS (256) /* fp_div_df */
723
724 /* Costs to use when optimizing for size. */
725 static const struct mips_rtx_cost_data mips_rtx_cost_optimize_size = {
726 COSTS_N_INSNS (1), /* fp_add */
727 COSTS_N_INSNS (1), /* fp_mult_sf */
728 COSTS_N_INSNS (1), /* fp_mult_df */
729 COSTS_N_INSNS (1), /* fp_div_sf */
730 COSTS_N_INSNS (1), /* fp_div_df */
731 COSTS_N_INSNS (1), /* int_mult_si */
732 COSTS_N_INSNS (1), /* int_mult_di */
733 COSTS_N_INSNS (1), /* int_div_si */
734 COSTS_N_INSNS (1), /* int_div_di */
735 2, /* branch_cost */
736 4 /* memory_latency */
737 };
738
739 /* Costs to use when optimizing for speed, indexed by processor. */
740 static const struct mips_rtx_cost_data mips_rtx_cost_data[PROCESSOR_MAX] = {
741 { /* R3000 */
742 COSTS_N_INSNS (2), /* fp_add */
743 COSTS_N_INSNS (4), /* fp_mult_sf */
744 COSTS_N_INSNS (5), /* fp_mult_df */
745 COSTS_N_INSNS (12), /* fp_div_sf */
746 COSTS_N_INSNS (19), /* fp_div_df */
747 COSTS_N_INSNS (12), /* int_mult_si */
748 COSTS_N_INSNS (12), /* int_mult_di */
749 COSTS_N_INSNS (35), /* int_div_si */
750 COSTS_N_INSNS (35), /* int_div_di */
751 1, /* branch_cost */
752 4 /* memory_latency */
753 },
754 { /* 4KC */
755 SOFT_FP_COSTS,
756 COSTS_N_INSNS (6), /* int_mult_si */
757 COSTS_N_INSNS (6), /* int_mult_di */
758 COSTS_N_INSNS (36), /* int_div_si */
759 COSTS_N_INSNS (36), /* int_div_di */
760 1, /* branch_cost */
761 4 /* memory_latency */
762 },
763 { /* 4KP */
764 SOFT_FP_COSTS,
765 COSTS_N_INSNS (36), /* int_mult_si */
766 COSTS_N_INSNS (36), /* int_mult_di */
767 COSTS_N_INSNS (37), /* int_div_si */
768 COSTS_N_INSNS (37), /* int_div_di */
769 1, /* branch_cost */
770 4 /* memory_latency */
771 },
772 { /* 5KC */
773 SOFT_FP_COSTS,
774 COSTS_N_INSNS (4), /* int_mult_si */
775 COSTS_N_INSNS (11), /* int_mult_di */
776 COSTS_N_INSNS (36), /* int_div_si */
777 COSTS_N_INSNS (68), /* int_div_di */
778 1, /* branch_cost */
779 4 /* memory_latency */
780 },
781 { /* 5KF */
782 COSTS_N_INSNS (4), /* fp_add */
783 COSTS_N_INSNS (4), /* fp_mult_sf */
784 COSTS_N_INSNS (5), /* fp_mult_df */
785 COSTS_N_INSNS (17), /* fp_div_sf */
786 COSTS_N_INSNS (32), /* fp_div_df */
787 COSTS_N_INSNS (4), /* int_mult_si */
788 COSTS_N_INSNS (11), /* int_mult_di */
789 COSTS_N_INSNS (36), /* int_div_si */
790 COSTS_N_INSNS (68), /* int_div_di */
791 1, /* branch_cost */
792 4 /* memory_latency */
793 },
794 { /* 20KC */
795 COSTS_N_INSNS (4), /* fp_add */
796 COSTS_N_INSNS (4), /* fp_mult_sf */
797 COSTS_N_INSNS (5), /* fp_mult_df */
798 COSTS_N_INSNS (17), /* fp_div_sf */
799 COSTS_N_INSNS (32), /* fp_div_df */
800 COSTS_N_INSNS (4), /* int_mult_si */
801 COSTS_N_INSNS (7), /* int_mult_di */
802 COSTS_N_INSNS (42), /* int_div_si */
803 COSTS_N_INSNS (72), /* int_div_di */
804 1, /* branch_cost */
805 4 /* memory_latency */
806 },
807 { /* 24KC */
808 SOFT_FP_COSTS,
809 COSTS_N_INSNS (5), /* int_mult_si */
810 COSTS_N_INSNS (5), /* int_mult_di */
811 COSTS_N_INSNS (41), /* int_div_si */
812 COSTS_N_INSNS (41), /* int_div_di */
813 1, /* branch_cost */
814 4 /* memory_latency */
815 },
816 { /* 24KF2_1 */
817 COSTS_N_INSNS (8), /* fp_add */
818 COSTS_N_INSNS (8), /* fp_mult_sf */
819 COSTS_N_INSNS (10), /* fp_mult_df */
820 COSTS_N_INSNS (34), /* fp_div_sf */
821 COSTS_N_INSNS (64), /* fp_div_df */
822 COSTS_N_INSNS (5), /* int_mult_si */
823 COSTS_N_INSNS (5), /* int_mult_di */
824 COSTS_N_INSNS (41), /* int_div_si */
825 COSTS_N_INSNS (41), /* int_div_di */
826 1, /* branch_cost */
827 4 /* memory_latency */
828 },
829 { /* 24KF1_1 */
830 COSTS_N_INSNS (4), /* fp_add */
831 COSTS_N_INSNS (4), /* fp_mult_sf */
832 COSTS_N_INSNS (5), /* fp_mult_df */
833 COSTS_N_INSNS (17), /* fp_div_sf */
834 COSTS_N_INSNS (32), /* fp_div_df */
835 COSTS_N_INSNS (5), /* int_mult_si */
836 COSTS_N_INSNS (5), /* int_mult_di */
837 COSTS_N_INSNS (41), /* int_div_si */
838 COSTS_N_INSNS (41), /* int_div_di */
839 1, /* branch_cost */
840 4 /* memory_latency */
841 },
842 { /* 74KC */
843 SOFT_FP_COSTS,
844 COSTS_N_INSNS (5), /* int_mult_si */
845 COSTS_N_INSNS (5), /* int_mult_di */
846 COSTS_N_INSNS (41), /* int_div_si */
847 COSTS_N_INSNS (41), /* int_div_di */
848 1, /* branch_cost */
849 4 /* memory_latency */
850 },
851 { /* 74KF2_1 */
852 COSTS_N_INSNS (8), /* fp_add */
853 COSTS_N_INSNS (8), /* fp_mult_sf */
854 COSTS_N_INSNS (10), /* fp_mult_df */
855 COSTS_N_INSNS (34), /* fp_div_sf */
856 COSTS_N_INSNS (64), /* fp_div_df */
857 COSTS_N_INSNS (5), /* int_mult_si */
858 COSTS_N_INSNS (5), /* int_mult_di */
859 COSTS_N_INSNS (41), /* int_div_si */
860 COSTS_N_INSNS (41), /* int_div_di */
861 1, /* branch_cost */
862 4 /* memory_latency */
863 },
864 { /* 74KF1_1 */
865 COSTS_N_INSNS (4), /* fp_add */
866 COSTS_N_INSNS (4), /* fp_mult_sf */
867 COSTS_N_INSNS (5), /* fp_mult_df */
868 COSTS_N_INSNS (17), /* fp_div_sf */
869 COSTS_N_INSNS (32), /* fp_div_df */
870 COSTS_N_INSNS (5), /* int_mult_si */
871 COSTS_N_INSNS (5), /* int_mult_di */
872 COSTS_N_INSNS (41), /* int_div_si */
873 COSTS_N_INSNS (41), /* int_div_di */
874 1, /* branch_cost */
875 4 /* memory_latency */
876 },
877 { /* 74KF3_2 */
878 COSTS_N_INSNS (6), /* fp_add */
879 COSTS_N_INSNS (6), /* fp_mult_sf */
880 COSTS_N_INSNS (7), /* fp_mult_df */
881 COSTS_N_INSNS (25), /* fp_div_sf */
882 COSTS_N_INSNS (48), /* fp_div_df */
883 COSTS_N_INSNS (5), /* int_mult_si */
884 COSTS_N_INSNS (5), /* int_mult_di */
885 COSTS_N_INSNS (41), /* int_div_si */
886 COSTS_N_INSNS (41), /* int_div_di */
887 1, /* branch_cost */
888 4 /* memory_latency */
889 },
890 { /* Loongson-2E */
891 DEFAULT_COSTS
892 },
893 { /* Loongson-2F */
894 DEFAULT_COSTS
895 },
896 { /* M4k */
897 DEFAULT_COSTS
898 },
899 /* Octeon */
900 {
901 SOFT_FP_COSTS,
902 COSTS_N_INSNS (5), /* int_mult_si */
903 COSTS_N_INSNS (5), /* int_mult_di */
904 COSTS_N_INSNS (72), /* int_div_si */
905 COSTS_N_INSNS (72), /* int_div_di */
906 1, /* branch_cost */
907 4 /* memory_latency */
908 },
909 { /* R3900 */
910 COSTS_N_INSNS (2), /* fp_add */
911 COSTS_N_INSNS (4), /* fp_mult_sf */
912 COSTS_N_INSNS (5), /* fp_mult_df */
913 COSTS_N_INSNS (12), /* fp_div_sf */
914 COSTS_N_INSNS (19), /* fp_div_df */
915 COSTS_N_INSNS (2), /* int_mult_si */
916 COSTS_N_INSNS (2), /* int_mult_di */
917 COSTS_N_INSNS (35), /* int_div_si */
918 COSTS_N_INSNS (35), /* int_div_di */
919 1, /* branch_cost */
920 4 /* memory_latency */
921 },
922 { /* R6000 */
923 COSTS_N_INSNS (3), /* fp_add */
924 COSTS_N_INSNS (5), /* fp_mult_sf */
925 COSTS_N_INSNS (6), /* fp_mult_df */
926 COSTS_N_INSNS (15), /* fp_div_sf */
927 COSTS_N_INSNS (16), /* fp_div_df */
928 COSTS_N_INSNS (17), /* int_mult_si */
929 COSTS_N_INSNS (17), /* int_mult_di */
930 COSTS_N_INSNS (38), /* int_div_si */
931 COSTS_N_INSNS (38), /* int_div_di */
932 2, /* branch_cost */
933 6 /* memory_latency */
934 },
935 { /* R4000 */
936 COSTS_N_INSNS (6), /* fp_add */
937 COSTS_N_INSNS (7), /* fp_mult_sf */
938 COSTS_N_INSNS (8), /* fp_mult_df */
939 COSTS_N_INSNS (23), /* fp_div_sf */
940 COSTS_N_INSNS (36), /* fp_div_df */
941 COSTS_N_INSNS (10), /* int_mult_si */
942 COSTS_N_INSNS (10), /* int_mult_di */
943 COSTS_N_INSNS (69), /* int_div_si */
944 COSTS_N_INSNS (69), /* int_div_di */
945 2, /* branch_cost */
946 6 /* memory_latency */
947 },
948 { /* R4100 */
949 DEFAULT_COSTS
950 },
951 { /* R4111 */
952 DEFAULT_COSTS
953 },
954 { /* R4120 */
955 DEFAULT_COSTS
956 },
957 { /* R4130 */
958 /* The only costs that appear to be updated here are
959 integer multiplication. */
960 SOFT_FP_COSTS,
961 COSTS_N_INSNS (4), /* int_mult_si */
962 COSTS_N_INSNS (6), /* int_mult_di */
963 COSTS_N_INSNS (69), /* int_div_si */
964 COSTS_N_INSNS (69), /* int_div_di */
965 1, /* branch_cost */
966 4 /* memory_latency */
967 },
968 { /* R4300 */
969 DEFAULT_COSTS
970 },
971 { /* R4600 */
972 DEFAULT_COSTS
973 },
974 { /* R4650 */
975 DEFAULT_COSTS
976 },
977 { /* R5000 */
978 COSTS_N_INSNS (6), /* fp_add */
979 COSTS_N_INSNS (4), /* fp_mult_sf */
980 COSTS_N_INSNS (5), /* fp_mult_df */
981 COSTS_N_INSNS (23), /* fp_div_sf */
982 COSTS_N_INSNS (36), /* fp_div_df */
983 COSTS_N_INSNS (5), /* int_mult_si */
984 COSTS_N_INSNS (5), /* int_mult_di */
985 COSTS_N_INSNS (36), /* int_div_si */
986 COSTS_N_INSNS (36), /* int_div_di */
987 1, /* branch_cost */
988 4 /* memory_latency */
989 },
990 { /* R5400 */
991 COSTS_N_INSNS (6), /* fp_add */
992 COSTS_N_INSNS (5), /* fp_mult_sf */
993 COSTS_N_INSNS (6), /* fp_mult_df */
994 COSTS_N_INSNS (30), /* fp_div_sf */
995 COSTS_N_INSNS (59), /* fp_div_df */
996 COSTS_N_INSNS (3), /* int_mult_si */
997 COSTS_N_INSNS (4), /* int_mult_di */
998 COSTS_N_INSNS (42), /* int_div_si */
999 COSTS_N_INSNS (74), /* int_div_di */
1000 1, /* branch_cost */
1001 4 /* memory_latency */
1002 },
1003 { /* R5500 */
1004 COSTS_N_INSNS (6), /* fp_add */
1005 COSTS_N_INSNS (5), /* fp_mult_sf */
1006 COSTS_N_INSNS (6), /* fp_mult_df */
1007 COSTS_N_INSNS (30), /* fp_div_sf */
1008 COSTS_N_INSNS (59), /* fp_div_df */
1009 COSTS_N_INSNS (5), /* int_mult_si */
1010 COSTS_N_INSNS (9), /* int_mult_di */
1011 COSTS_N_INSNS (42), /* int_div_si */
1012 COSTS_N_INSNS (74), /* int_div_di */
1013 1, /* branch_cost */
1014 4 /* memory_latency */
1015 },
1016 { /* R7000 */
1017 /* The only costs that are changed here are
1018 integer multiplication. */
1019 COSTS_N_INSNS (6), /* fp_add */
1020 COSTS_N_INSNS (7), /* fp_mult_sf */
1021 COSTS_N_INSNS (8), /* fp_mult_df */
1022 COSTS_N_INSNS (23), /* fp_div_sf */
1023 COSTS_N_INSNS (36), /* fp_div_df */
1024 COSTS_N_INSNS (5), /* int_mult_si */
1025 COSTS_N_INSNS (9), /* int_mult_di */
1026 COSTS_N_INSNS (69), /* int_div_si */
1027 COSTS_N_INSNS (69), /* int_div_di */
1028 1, /* branch_cost */
1029 4 /* memory_latency */
1030 },
1031 { /* R8000 */
1032 DEFAULT_COSTS
1033 },
1034 { /* R9000 */
1035 /* The only costs that are changed here are
1036 integer multiplication. */
1037 COSTS_N_INSNS (6), /* fp_add */
1038 COSTS_N_INSNS (7), /* fp_mult_sf */
1039 COSTS_N_INSNS (8), /* fp_mult_df */
1040 COSTS_N_INSNS (23), /* fp_div_sf */
1041 COSTS_N_INSNS (36), /* fp_div_df */
1042 COSTS_N_INSNS (3), /* int_mult_si */
1043 COSTS_N_INSNS (8), /* int_mult_di */
1044 COSTS_N_INSNS (69), /* int_div_si */
1045 COSTS_N_INSNS (69), /* int_div_di */
1046 1, /* branch_cost */
1047 4 /* memory_latency */
1048 },
1049 { /* R1x000 */
1050 COSTS_N_INSNS (2), /* fp_add */
1051 COSTS_N_INSNS (2), /* fp_mult_sf */
1052 COSTS_N_INSNS (2), /* fp_mult_df */
1053 COSTS_N_INSNS (12), /* fp_div_sf */
1054 COSTS_N_INSNS (19), /* fp_div_df */
1055 COSTS_N_INSNS (5), /* int_mult_si */
1056 COSTS_N_INSNS (9), /* int_mult_di */
1057 COSTS_N_INSNS (34), /* int_div_si */
1058 COSTS_N_INSNS (66), /* int_div_di */
1059 1, /* branch_cost */
1060 4 /* memory_latency */
1061 },
1062 { /* SB1 */
1063 /* These costs are the same as the SB-1A below. */
1064 COSTS_N_INSNS (4), /* fp_add */
1065 COSTS_N_INSNS (4), /* fp_mult_sf */
1066 COSTS_N_INSNS (4), /* fp_mult_df */
1067 COSTS_N_INSNS (24), /* fp_div_sf */
1068 COSTS_N_INSNS (32), /* fp_div_df */
1069 COSTS_N_INSNS (3), /* int_mult_si */
1070 COSTS_N_INSNS (4), /* int_mult_di */
1071 COSTS_N_INSNS (36), /* int_div_si */
1072 COSTS_N_INSNS (68), /* int_div_di */
1073 1, /* branch_cost */
1074 4 /* memory_latency */
1075 },
1076 { /* SB1-A */
1077 /* These costs are the same as the SB-1 above. */
1078 COSTS_N_INSNS (4), /* fp_add */
1079 COSTS_N_INSNS (4), /* fp_mult_sf */
1080 COSTS_N_INSNS (4), /* fp_mult_df */
1081 COSTS_N_INSNS (24), /* fp_div_sf */
1082 COSTS_N_INSNS (32), /* fp_div_df */
1083 COSTS_N_INSNS (3), /* int_mult_si */
1084 COSTS_N_INSNS (4), /* int_mult_di */
1085 COSTS_N_INSNS (36), /* int_div_si */
1086 COSTS_N_INSNS (68), /* int_div_di */
1087 1, /* branch_cost */
1088 4 /* memory_latency */
1089 },
1090 { /* SR71000 */
1091 DEFAULT_COSTS
1092 },
1093 { /* XLR */
1094 SOFT_FP_COSTS,
1095 COSTS_N_INSNS (8), /* int_mult_si */
1096 COSTS_N_INSNS (8), /* int_mult_di */
1097 COSTS_N_INSNS (72), /* int_div_si */
1098 COSTS_N_INSNS (72), /* int_div_di */
1099 1, /* branch_cost */
1100 4 /* memory_latency */
1101 }
1102 };
1103 \f
1104 /* This hash table keeps track of implicit "mips16" and "nomips16" attributes
1105 for -mflip_mips16. It maps decl names onto a boolean mode setting. */
1106 struct GTY (()) mflip_mips16_entry {
1107 const char *name;
1108 bool mips16_p;
1109 };
1110 static GTY ((param_is (struct mflip_mips16_entry))) htab_t mflip_mips16_htab;
1111
1112 /* Hash table callbacks for mflip_mips16_htab. */
1113
1114 static hashval_t
1115 mflip_mips16_htab_hash (const void *entry)
1116 {
1117 return htab_hash_string (((const struct mflip_mips16_entry *) entry)->name);
1118 }
1119
1120 static int
1121 mflip_mips16_htab_eq (const void *entry, const void *name)
1122 {
1123 return strcmp (((const struct mflip_mips16_entry *) entry)->name,
1124 (const char *) name) == 0;
1125 }
1126
1127 /* True if -mflip-mips16 should next add an attribute for the default MIPS16
1128 mode, false if it should next add an attribute for the opposite mode. */
1129 static GTY(()) bool mips16_flipper;
1130
1131 /* DECL is a function that needs a default "mips16" or "nomips16" attribute
1132 for -mflip-mips16. Return true if it should use "mips16" and false if
1133 it should use "nomips16". */
1134
1135 static bool
1136 mflip_mips16_use_mips16_p (tree decl)
1137 {
1138 struct mflip_mips16_entry *entry;
1139 const char *name;
1140 hashval_t hash;
1141 void **slot;
1142
1143 /* Use the opposite of the command-line setting for anonymous decls. */
1144 if (!DECL_NAME (decl))
1145 return !mips_base_mips16;
1146
1147 if (!mflip_mips16_htab)
1148 mflip_mips16_htab = htab_create_ggc (37, mflip_mips16_htab_hash,
1149 mflip_mips16_htab_eq, NULL);
1150
1151 name = IDENTIFIER_POINTER (DECL_NAME (decl));
1152 hash = htab_hash_string (name);
1153 slot = htab_find_slot_with_hash (mflip_mips16_htab, name, hash, INSERT);
1154 entry = (struct mflip_mips16_entry *) *slot;
1155 if (!entry)
1156 {
1157 mips16_flipper = !mips16_flipper;
1158 entry = GGC_NEW (struct mflip_mips16_entry);
1159 entry->name = name;
1160 entry->mips16_p = mips16_flipper ? !mips_base_mips16 : mips_base_mips16;
1161 *slot = entry;
1162 }
1163 return entry->mips16_p;
1164 }
1165 \f
1166 /* Predicates to test for presence of "near" and "far"/"long_call"
1167 attributes on the given TYPE. */
1168
1169 static bool
1170 mips_near_type_p (const_tree type)
1171 {
1172 return lookup_attribute ("near", TYPE_ATTRIBUTES (type)) != NULL;
1173 }
1174
1175 static bool
1176 mips_far_type_p (const_tree type)
1177 {
1178 return (lookup_attribute ("long_call", TYPE_ATTRIBUTES (type)) != NULL
1179 || lookup_attribute ("far", TYPE_ATTRIBUTES (type)) != NULL);
1180 }
1181
1182 /* Similar predicates for "mips16"/"nomips16" function attributes. */
1183
1184 static bool
1185 mips_mips16_decl_p (const_tree decl)
1186 {
1187 return lookup_attribute ("mips16", DECL_ATTRIBUTES (decl)) != NULL;
1188 }
1189
1190 static bool
1191 mips_nomips16_decl_p (const_tree decl)
1192 {
1193 return lookup_attribute ("nomips16", DECL_ATTRIBUTES (decl)) != NULL;
1194 }
1195
1196 /* Check if the interrupt attribute is set for a function. */
1197
1198 static bool
1199 mips_interrupt_type_p (tree type)
1200 {
1201 return lookup_attribute ("interrupt", TYPE_ATTRIBUTES (type)) != NULL;
1202 }
1203
1204 /* Check if the attribute to use shadow register set is set for a function. */
1205
1206 static bool
1207 mips_use_shadow_register_set_p (tree type)
1208 {
1209 return lookup_attribute ("use_shadow_register_set",
1210 TYPE_ATTRIBUTES (type)) != NULL;
1211 }
1212
1213 /* Check if the attribute to keep interrupts masked is set for a function. */
1214
1215 static bool
1216 mips_keep_interrupts_masked_p (tree type)
1217 {
1218 return lookup_attribute ("keep_interrupts_masked",
1219 TYPE_ATTRIBUTES (type)) != NULL;
1220 }
1221
1222 /* Check if the attribute to use debug exception return is set for
1223 a function. */
1224
1225 static bool
1226 mips_use_debug_exception_return_p (tree type)
1227 {
1228 return lookup_attribute ("use_debug_exception_return",
1229 TYPE_ATTRIBUTES (type)) != NULL;
1230 }
1231
1232 /* Return true if function DECL is a MIPS16 function. Return the ambient
1233 setting if DECL is null. */
1234
1235 static bool
1236 mips_use_mips16_mode_p (tree decl)
1237 {
1238 if (decl)
1239 {
1240 /* Nested functions must use the same frame pointer as their
1241 parent and must therefore use the same ISA mode. */
1242 tree parent = decl_function_context (decl);
1243 if (parent)
1244 decl = parent;
1245 if (mips_mips16_decl_p (decl))
1246 return true;
1247 if (mips_nomips16_decl_p (decl))
1248 return false;
1249 }
1250 return mips_base_mips16;
1251 }
1252
1253 /* Implement TARGET_COMP_TYPE_ATTRIBUTES. */
1254
1255 static int
1256 mips_comp_type_attributes (const_tree type1, const_tree type2)
1257 {
1258 /* Disallow mixed near/far attributes. */
1259 if (mips_far_type_p (type1) && mips_near_type_p (type2))
1260 return 0;
1261 if (mips_near_type_p (type1) && mips_far_type_p (type2))
1262 return 0;
1263 return 1;
1264 }
1265
1266 /* Implement TARGET_INSERT_ATTRIBUTES. */
1267
1268 static void
1269 mips_insert_attributes (tree decl, tree *attributes)
1270 {
1271 const char *name;
1272 bool mips16_p, nomips16_p;
1273
1274 /* Check for "mips16" and "nomips16" attributes. */
1275 mips16_p = lookup_attribute ("mips16", *attributes) != NULL;
1276 nomips16_p = lookup_attribute ("nomips16", *attributes) != NULL;
1277 if (TREE_CODE (decl) != FUNCTION_DECL)
1278 {
1279 if (mips16_p)
1280 error ("%qs attribute only applies to functions", "mips16");
1281 if (nomips16_p)
1282 error ("%qs attribute only applies to functions", "nomips16");
1283 }
1284 else
1285 {
1286 mips16_p |= mips_mips16_decl_p (decl);
1287 nomips16_p |= mips_nomips16_decl_p (decl);
1288 if (mips16_p || nomips16_p)
1289 {
1290 /* DECL cannot be simultaneously "mips16" and "nomips16". */
1291 if (mips16_p && nomips16_p)
1292 error ("%qE cannot have both %<mips16%> and "
1293 "%<nomips16%> attributes",
1294 DECL_NAME (decl));
1295 }
1296 else if (TARGET_FLIP_MIPS16 && !DECL_ARTIFICIAL (decl))
1297 {
1298 /* Implement -mflip-mips16. If DECL has neither a "nomips16" nor a
1299 "mips16" attribute, arbitrarily pick one. We must pick the same
1300 setting for duplicate declarations of a function. */
1301 name = mflip_mips16_use_mips16_p (decl) ? "mips16" : "nomips16";
1302 *attributes = tree_cons (get_identifier (name), NULL, *attributes);
1303 }
1304 }
1305 }
1306
1307 /* Implement TARGET_MERGE_DECL_ATTRIBUTES. */
1308
1309 static tree
1310 mips_merge_decl_attributes (tree olddecl, tree newdecl)
1311 {
1312 /* The decls' "mips16" and "nomips16" attributes must match exactly. */
1313 if (mips_mips16_decl_p (olddecl) != mips_mips16_decl_p (newdecl))
1314 error ("%qE redeclared with conflicting %qs attributes",
1315 DECL_NAME (newdecl), "mips16");
1316 if (mips_nomips16_decl_p (olddecl) != mips_nomips16_decl_p (newdecl))
1317 error ("%qE redeclared with conflicting %qs attributes",
1318 DECL_NAME (newdecl), "nomips16");
1319
1320 return merge_attributes (DECL_ATTRIBUTES (olddecl),
1321 DECL_ATTRIBUTES (newdecl));
1322 }
1323 \f
1324 /* If X is a PLUS of a CONST_INT, return the two terms in *BASE_PTR
1325 and *OFFSET_PTR. Return X in *BASE_PTR and 0 in *OFFSET_PTR otherwise. */
1326
1327 static void
1328 mips_split_plus (rtx x, rtx *base_ptr, HOST_WIDE_INT *offset_ptr)
1329 {
1330 if (GET_CODE (x) == PLUS && GET_CODE (XEXP (x, 1)) == CONST_INT)
1331 {
1332 *base_ptr = XEXP (x, 0);
1333 *offset_ptr = INTVAL (XEXP (x, 1));
1334 }
1335 else
1336 {
1337 *base_ptr = x;
1338 *offset_ptr = 0;
1339 }
1340 }
1341 \f
1342 static unsigned int mips_build_integer (struct mips_integer_op *,
1343 unsigned HOST_WIDE_INT);
1344
1345 /* A subroutine of mips_build_integer, with the same interface.
1346 Assume that the final action in the sequence should be a left shift. */
1347
1348 static unsigned int
1349 mips_build_shift (struct mips_integer_op *codes, HOST_WIDE_INT value)
1350 {
1351 unsigned int i, shift;
1352
1353 /* Shift VALUE right until its lowest bit is set. Shift arithmetically
1354 since signed numbers are easier to load than unsigned ones. */
1355 shift = 0;
1356 while ((value & 1) == 0)
1357 value /= 2, shift++;
1358
1359 i = mips_build_integer (codes, value);
1360 codes[i].code = ASHIFT;
1361 codes[i].value = shift;
1362 return i + 1;
1363 }
1364
1365 /* As for mips_build_shift, but assume that the final action will be
1366 an IOR or PLUS operation. */
1367
1368 static unsigned int
1369 mips_build_lower (struct mips_integer_op *codes, unsigned HOST_WIDE_INT value)
1370 {
1371 unsigned HOST_WIDE_INT high;
1372 unsigned int i;
1373
1374 high = value & ~(unsigned HOST_WIDE_INT) 0xffff;
1375 if (!LUI_OPERAND (high) && (value & 0x18000) == 0x18000)
1376 {
1377 /* The constant is too complex to load with a simple LUI/ORI pair,
1378 so we want to give the recursive call as many trailing zeros as
1379 possible. In this case, we know bit 16 is set and that the
1380 low 16 bits form a negative number. If we subtract that number
1381 from VALUE, we will clear at least the lowest 17 bits, maybe more. */
1382 i = mips_build_integer (codes, CONST_HIGH_PART (value));
1383 codes[i].code = PLUS;
1384 codes[i].value = CONST_LOW_PART (value);
1385 }
1386 else
1387 {
1388 /* Either this is a simple LUI/ORI pair, or clearing the lowest 16
1389 bits gives a value with at least 17 trailing zeros. */
1390 i = mips_build_integer (codes, high);
1391 codes[i].code = IOR;
1392 codes[i].value = value & 0xffff;
1393 }
1394 return i + 1;
1395 }
1396
1397 /* Fill CODES with a sequence of rtl operations to load VALUE.
1398 Return the number of operations needed. */
1399
1400 static unsigned int
1401 mips_build_integer (struct mips_integer_op *codes,
1402 unsigned HOST_WIDE_INT value)
1403 {
1404 if (SMALL_OPERAND (value)
1405 || SMALL_OPERAND_UNSIGNED (value)
1406 || LUI_OPERAND (value))
1407 {
1408 /* The value can be loaded with a single instruction. */
1409 codes[0].code = UNKNOWN;
1410 codes[0].value = value;
1411 return 1;
1412 }
1413 else if ((value & 1) != 0 || LUI_OPERAND (CONST_HIGH_PART (value)))
1414 {
1415 /* Either the constant is a simple LUI/ORI combination or its
1416 lowest bit is set. We don't want to shift in this case. */
1417 return mips_build_lower (codes, value);
1418 }
1419 else if ((value & 0xffff) == 0)
1420 {
1421 /* The constant will need at least three actions. The lowest
1422 16 bits are clear, so the final action will be a shift. */
1423 return mips_build_shift (codes, value);
1424 }
1425 else
1426 {
1427 /* The final action could be a shift, add or inclusive OR.
1428 Rather than use a complex condition to select the best
1429 approach, try both mips_build_shift and mips_build_lower
1430 and pick the one that gives the shortest sequence.
1431 Note that this case is only used once per constant. */
1432 struct mips_integer_op alt_codes[MIPS_MAX_INTEGER_OPS];
1433 unsigned int cost, alt_cost;
1434
1435 cost = mips_build_shift (codes, value);
1436 alt_cost = mips_build_lower (alt_codes, value);
1437 if (alt_cost < cost)
1438 {
1439 memcpy (codes, alt_codes, alt_cost * sizeof (codes[0]));
1440 cost = alt_cost;
1441 }
1442 return cost;
1443 }
1444 }
1445 \f
1446 /* Return true if symbols of type TYPE require a GOT access. */
1447
1448 static bool
1449 mips_got_symbol_type_p (enum mips_symbol_type type)
1450 {
1451 switch (type)
1452 {
1453 case SYMBOL_GOT_PAGE_OFST:
1454 case SYMBOL_GOT_DISP:
1455 return true;
1456
1457 default:
1458 return false;
1459 }
1460 }
1461
1462 /* Return true if X is a thread-local symbol. */
1463
1464 static bool
1465 mips_tls_symbol_p (rtx x)
1466 {
1467 return GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_TLS_MODEL (x) != 0;
1468 }
1469
1470 /* Return true if SYMBOL_REF X is associated with a global symbol
1471 (in the STB_GLOBAL sense). */
1472
1473 static bool
1474 mips_global_symbol_p (const_rtx x)
1475 {
1476 const_tree decl = SYMBOL_REF_DECL (x);
1477
1478 if (!decl)
1479 return !SYMBOL_REF_LOCAL_P (x) || SYMBOL_REF_EXTERNAL_P (x);
1480
1481 /* Weakref symbols are not TREE_PUBLIC, but their targets are global
1482 or weak symbols. Relocations in the object file will be against
1483 the target symbol, so it's that symbol's binding that matters here. */
1484 return DECL_P (decl) && (TREE_PUBLIC (decl) || DECL_WEAK (decl));
1485 }
1486
1487 /* Return true if function X is a libgcc MIPS16 stub function. */
1488
1489 static bool
1490 mips16_stub_function_p (const_rtx x)
1491 {
1492 return (GET_CODE (x) == SYMBOL_REF
1493 && strncmp (XSTR (x, 0), "__mips16_", 9) == 0);
1494 }
1495
1496 /* Return true if function X is a locally-defined and locally-binding
1497 MIPS16 function. */
1498
1499 static bool
1500 mips16_local_function_p (const_rtx x)
1501 {
1502 return (GET_CODE (x) == SYMBOL_REF
1503 && SYMBOL_REF_LOCAL_P (x)
1504 && !SYMBOL_REF_EXTERNAL_P (x)
1505 && mips_use_mips16_mode_p (SYMBOL_REF_DECL (x)));
1506 }
1507
1508 /* Return true if SYMBOL_REF X binds locally. */
1509
1510 static bool
1511 mips_symbol_binds_local_p (const_rtx x)
1512 {
1513 return (SYMBOL_REF_DECL (x)
1514 ? targetm.binds_local_p (SYMBOL_REF_DECL (x))
1515 : SYMBOL_REF_LOCAL_P (x));
1516 }
1517
1518 /* Return true if rtx constants of mode MODE should be put into a small
1519 data section. */
1520
1521 static bool
1522 mips_rtx_constant_in_small_data_p (enum machine_mode mode)
1523 {
1524 return (!TARGET_EMBEDDED_DATA
1525 && TARGET_LOCAL_SDATA
1526 && GET_MODE_SIZE (mode) <= mips_small_data_threshold);
1527 }
1528
1529 /* Return true if X should not be moved directly into register $25.
1530 We need this because many versions of GAS will treat "la $25,foo" as
1531 part of a call sequence and so allow a global "foo" to be lazily bound. */
1532
1533 bool
1534 mips_dangerous_for_la25_p (rtx x)
1535 {
1536 return (!TARGET_EXPLICIT_RELOCS
1537 && TARGET_USE_GOT
1538 && GET_CODE (x) == SYMBOL_REF
1539 && mips_global_symbol_p (x));
1540 }
1541
1542 /* Return true if calls to X might need $25 to be valid on entry. */
1543
1544 bool
1545 mips_use_pic_fn_addr_reg_p (const_rtx x)
1546 {
1547 if (!TARGET_USE_PIC_FN_ADDR_REG)
1548 return false;
1549
1550 /* MIPS16 stub functions are guaranteed not to use $25. */
1551 if (mips16_stub_function_p (x))
1552 return false;
1553
1554 if (GET_CODE (x) == SYMBOL_REF)
1555 {
1556 /* If PLTs and copy relocations are available, the static linker
1557 will make sure that $25 is valid on entry to the target function. */
1558 if (TARGET_ABICALLS_PIC0)
1559 return false;
1560
1561 /* Locally-defined functions use absolute accesses to set up
1562 the global pointer. */
1563 if (TARGET_ABSOLUTE_ABICALLS
1564 && mips_symbol_binds_local_p (x)
1565 && !SYMBOL_REF_EXTERNAL_P (x))
1566 return false;
1567 }
1568
1569 return true;
1570 }
1571
1572 /* Return the method that should be used to access SYMBOL_REF or
1573 LABEL_REF X in context CONTEXT. */
1574
1575 static enum mips_symbol_type
1576 mips_classify_symbol (const_rtx x, enum mips_symbol_context context)
1577 {
1578 if (TARGET_RTP_PIC)
1579 return SYMBOL_GOT_DISP;
1580
1581 if (GET_CODE (x) == LABEL_REF)
1582 {
1583 /* LABEL_REFs are used for jump tables as well as text labels.
1584 Only return SYMBOL_PC_RELATIVE if we know the label is in
1585 the text section. */
1586 if (TARGET_MIPS16_SHORT_JUMP_TABLES)
1587 return SYMBOL_PC_RELATIVE;
1588
1589 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS)
1590 return SYMBOL_GOT_PAGE_OFST;
1591
1592 return SYMBOL_ABSOLUTE;
1593 }
1594
1595 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1596
1597 if (SYMBOL_REF_TLS_MODEL (x))
1598 return SYMBOL_TLS;
1599
1600 if (CONSTANT_POOL_ADDRESS_P (x))
1601 {
1602 if (TARGET_MIPS16_TEXT_LOADS)
1603 return SYMBOL_PC_RELATIVE;
1604
1605 if (TARGET_MIPS16_PCREL_LOADS && context == SYMBOL_CONTEXT_MEM)
1606 return SYMBOL_PC_RELATIVE;
1607
1608 if (mips_rtx_constant_in_small_data_p (get_pool_mode (x)))
1609 return SYMBOL_GP_RELATIVE;
1610 }
1611
1612 /* Do not use small-data accesses for weak symbols; they may end up
1613 being zero. */
1614 if (TARGET_GPOPT && SYMBOL_REF_SMALL_P (x) && !SYMBOL_REF_WEAK (x))
1615 return SYMBOL_GP_RELATIVE;
1616
1617 /* Don't use GOT accesses for locally-binding symbols when -mno-shared
1618 is in effect. */
1619 if (TARGET_ABICALLS_PIC2
1620 && !(TARGET_ABSOLUTE_ABICALLS && mips_symbol_binds_local_p (x)))
1621 {
1622 /* There are three cases to consider:
1623
1624 - o32 PIC (either with or without explicit relocs)
1625 - n32/n64 PIC without explicit relocs
1626 - n32/n64 PIC with explicit relocs
1627
1628 In the first case, both local and global accesses will use an
1629 R_MIPS_GOT16 relocation. We must correctly predict which of
1630 the two semantics (local or global) the assembler and linker
1631 will apply. The choice depends on the symbol's binding rather
1632 than its visibility.
1633
1634 In the second case, the assembler will not use R_MIPS_GOT16
1635 relocations, but it chooses between local and global accesses
1636 in the same way as for o32 PIC.
1637
1638 In the third case we have more freedom since both forms of
1639 access will work for any kind of symbol. However, there seems
1640 little point in doing things differently. */
1641 if (mips_global_symbol_p (x))
1642 return SYMBOL_GOT_DISP;
1643
1644 return SYMBOL_GOT_PAGE_OFST;
1645 }
1646
1647 if (TARGET_MIPS16_PCREL_LOADS && context != SYMBOL_CONTEXT_CALL)
1648 return SYMBOL_FORCE_TO_MEM;
1649
1650 return SYMBOL_ABSOLUTE;
1651 }
1652
1653 /* Classify the base of symbolic expression X, given that X appears in
1654 context CONTEXT. */
1655
1656 static enum mips_symbol_type
1657 mips_classify_symbolic_expression (rtx x, enum mips_symbol_context context)
1658 {
1659 rtx offset;
1660
1661 split_const (x, &x, &offset);
1662 if (UNSPEC_ADDRESS_P (x))
1663 return UNSPEC_ADDRESS_TYPE (x);
1664
1665 return mips_classify_symbol (x, context);
1666 }
1667
1668 /* Return true if OFFSET is within the range [0, ALIGN), where ALIGN
1669 is the alignment in bytes of SYMBOL_REF X. */
1670
1671 static bool
1672 mips_offset_within_alignment_p (rtx x, HOST_WIDE_INT offset)
1673 {
1674 HOST_WIDE_INT align;
1675
1676 align = SYMBOL_REF_DECL (x) ? DECL_ALIGN_UNIT (SYMBOL_REF_DECL (x)) : 1;
1677 return IN_RANGE (offset, 0, align - 1);
1678 }
1679
1680 /* Return true if X is a symbolic constant that can be used in context
1681 CONTEXT. If it is, store the type of the symbol in *SYMBOL_TYPE. */
1682
1683 bool
1684 mips_symbolic_constant_p (rtx x, enum mips_symbol_context context,
1685 enum mips_symbol_type *symbol_type)
1686 {
1687 rtx offset;
1688
1689 split_const (x, &x, &offset);
1690 if (UNSPEC_ADDRESS_P (x))
1691 {
1692 *symbol_type = UNSPEC_ADDRESS_TYPE (x);
1693 x = UNSPEC_ADDRESS (x);
1694 }
1695 else if (GET_CODE (x) == SYMBOL_REF || GET_CODE (x) == LABEL_REF)
1696 {
1697 *symbol_type = mips_classify_symbol (x, context);
1698 if (*symbol_type == SYMBOL_TLS)
1699 return false;
1700 }
1701 else
1702 return false;
1703
1704 if (offset == const0_rtx)
1705 return true;
1706
1707 /* Check whether a nonzero offset is valid for the underlying
1708 relocations. */
1709 switch (*symbol_type)
1710 {
1711 case SYMBOL_ABSOLUTE:
1712 case SYMBOL_FORCE_TO_MEM:
1713 case SYMBOL_32_HIGH:
1714 case SYMBOL_64_HIGH:
1715 case SYMBOL_64_MID:
1716 case SYMBOL_64_LOW:
1717 /* If the target has 64-bit pointers and the object file only
1718 supports 32-bit symbols, the values of those symbols will be
1719 sign-extended. In this case we can't allow an arbitrary offset
1720 in case the 32-bit value X + OFFSET has a different sign from X. */
1721 if (Pmode == DImode && !ABI_HAS_64BIT_SYMBOLS)
1722 return offset_within_block_p (x, INTVAL (offset));
1723
1724 /* In other cases the relocations can handle any offset. */
1725 return true;
1726
1727 case SYMBOL_PC_RELATIVE:
1728 /* Allow constant pool references to be converted to LABEL+CONSTANT.
1729 In this case, we no longer have access to the underlying constant,
1730 but the original symbol-based access was known to be valid. */
1731 if (GET_CODE (x) == LABEL_REF)
1732 return true;
1733
1734 /* Fall through. */
1735
1736 case SYMBOL_GP_RELATIVE:
1737 /* Make sure that the offset refers to something within the
1738 same object block. This should guarantee that the final
1739 PC- or GP-relative offset is within the 16-bit limit. */
1740 return offset_within_block_p (x, INTVAL (offset));
1741
1742 case SYMBOL_GOT_PAGE_OFST:
1743 case SYMBOL_GOTOFF_PAGE:
1744 /* If the symbol is global, the GOT entry will contain the symbol's
1745 address, and we will apply a 16-bit offset after loading it.
1746 If the symbol is local, the linker should provide enough local
1747 GOT entries for a 16-bit offset, but larger offsets may lead
1748 to GOT overflow. */
1749 return SMALL_INT (offset);
1750
1751 case SYMBOL_TPREL:
1752 case SYMBOL_DTPREL:
1753 /* There is no carry between the HI and LO REL relocations, so the
1754 offset is only valid if we know it won't lead to such a carry. */
1755 return mips_offset_within_alignment_p (x, INTVAL (offset));
1756
1757 case SYMBOL_GOT_DISP:
1758 case SYMBOL_GOTOFF_DISP:
1759 case SYMBOL_GOTOFF_CALL:
1760 case SYMBOL_GOTOFF_LOADGP:
1761 case SYMBOL_TLSGD:
1762 case SYMBOL_TLSLDM:
1763 case SYMBOL_GOTTPREL:
1764 case SYMBOL_TLS:
1765 case SYMBOL_HALF:
1766 return false;
1767 }
1768 gcc_unreachable ();
1769 }
1770 \f
1771 /* Like mips_symbol_insns, but treat extended MIPS16 instructions as a
1772 single instruction. We rely on the fact that, in the worst case,
1773 all instructions involved in a MIPS16 address calculation are usually
1774 extended ones. */
1775
1776 static int
1777 mips_symbol_insns_1 (enum mips_symbol_type type, enum machine_mode mode)
1778 {
1779 switch (type)
1780 {
1781 case SYMBOL_ABSOLUTE:
1782 /* When using 64-bit symbols, we need 5 preparatory instructions,
1783 such as:
1784
1785 lui $at,%highest(symbol)
1786 daddiu $at,$at,%higher(symbol)
1787 dsll $at,$at,16
1788 daddiu $at,$at,%hi(symbol)
1789 dsll $at,$at,16
1790
1791 The final address is then $at + %lo(symbol). With 32-bit
1792 symbols we just need a preparatory LUI for normal mode and
1793 a preparatory LI and SLL for MIPS16. */
1794 return ABI_HAS_64BIT_SYMBOLS ? 6 : TARGET_MIPS16 ? 3 : 2;
1795
1796 case SYMBOL_GP_RELATIVE:
1797 /* Treat GP-relative accesses as taking a single instruction on
1798 MIPS16 too; the copy of $gp can often be shared. */
1799 return 1;
1800
1801 case SYMBOL_PC_RELATIVE:
1802 /* PC-relative constants can be only be used with ADDIUPC,
1803 DADDIUPC, LWPC and LDPC. */
1804 if (mode == MAX_MACHINE_MODE
1805 || GET_MODE_SIZE (mode) == 4
1806 || GET_MODE_SIZE (mode) == 8)
1807 return 1;
1808
1809 /* The constant must be loaded using ADDIUPC or DADDIUPC first. */
1810 return 0;
1811
1812 case SYMBOL_FORCE_TO_MEM:
1813 /* LEAs will be converted into constant-pool references by
1814 mips_reorg. */
1815 if (mode == MAX_MACHINE_MODE)
1816 return 1;
1817
1818 /* The constant must be loaded and then dereferenced. */
1819 return 0;
1820
1821 case SYMBOL_GOT_DISP:
1822 /* The constant will have to be loaded from the GOT before it
1823 is used in an address. */
1824 if (mode != MAX_MACHINE_MODE)
1825 return 0;
1826
1827 /* Fall through. */
1828
1829 case SYMBOL_GOT_PAGE_OFST:
1830 /* Unless -funit-at-a-time is in effect, we can't be sure whether the
1831 local/global classification is accurate. The worst cases are:
1832
1833 (1) For local symbols when generating o32 or o64 code. The assembler
1834 will use:
1835
1836 lw $at,%got(symbol)
1837 nop
1838
1839 ...and the final address will be $at + %lo(symbol).
1840
1841 (2) For global symbols when -mxgot. The assembler will use:
1842
1843 lui $at,%got_hi(symbol)
1844 (d)addu $at,$at,$gp
1845
1846 ...and the final address will be $at + %got_lo(symbol). */
1847 return 3;
1848
1849 case SYMBOL_GOTOFF_PAGE:
1850 case SYMBOL_GOTOFF_DISP:
1851 case SYMBOL_GOTOFF_CALL:
1852 case SYMBOL_GOTOFF_LOADGP:
1853 case SYMBOL_32_HIGH:
1854 case SYMBOL_64_HIGH:
1855 case SYMBOL_64_MID:
1856 case SYMBOL_64_LOW:
1857 case SYMBOL_TLSGD:
1858 case SYMBOL_TLSLDM:
1859 case SYMBOL_DTPREL:
1860 case SYMBOL_GOTTPREL:
1861 case SYMBOL_TPREL:
1862 case SYMBOL_HALF:
1863 /* A 16-bit constant formed by a single relocation, or a 32-bit
1864 constant formed from a high 16-bit relocation and a low 16-bit
1865 relocation. Use mips_split_p to determine which. 32-bit
1866 constants need an "lui; addiu" sequence for normal mode and
1867 an "li; sll; addiu" sequence for MIPS16 mode. */
1868 return !mips_split_p[type] ? 1 : TARGET_MIPS16 ? 3 : 2;
1869
1870 case SYMBOL_TLS:
1871 /* We don't treat a bare TLS symbol as a constant. */
1872 return 0;
1873 }
1874 gcc_unreachable ();
1875 }
1876
1877 /* If MODE is MAX_MACHINE_MODE, return the number of instructions needed
1878 to load symbols of type TYPE into a register. Return 0 if the given
1879 type of symbol cannot be used as an immediate operand.
1880
1881 Otherwise, return the number of instructions needed to load or store
1882 values of mode MODE to or from addresses of type TYPE. Return 0 if
1883 the given type of symbol is not valid in addresses.
1884
1885 In both cases, treat extended MIPS16 instructions as two instructions. */
1886
1887 static int
1888 mips_symbol_insns (enum mips_symbol_type type, enum machine_mode mode)
1889 {
1890 return mips_symbol_insns_1 (type, mode) * (TARGET_MIPS16 ? 2 : 1);
1891 }
1892 \f
1893 /* A for_each_rtx callback. Stop the search if *X references a
1894 thread-local symbol. */
1895
1896 static int
1897 mips_tls_symbol_ref_1 (rtx *x, void *data ATTRIBUTE_UNUSED)
1898 {
1899 return mips_tls_symbol_p (*x);
1900 }
1901
1902 /* Implement TARGET_CANNOT_FORCE_CONST_MEM. */
1903
1904 static bool
1905 mips_cannot_force_const_mem (rtx x)
1906 {
1907 enum mips_symbol_type type;
1908 rtx base, offset;
1909
1910 /* There is no assembler syntax for expressing an address-sized
1911 high part. */
1912 if (GET_CODE (x) == HIGH)
1913 return true;
1914
1915 /* As an optimization, reject constants that mips_legitimize_move
1916 can expand inline.
1917
1918 Suppose we have a multi-instruction sequence that loads constant C
1919 into register R. If R does not get allocated a hard register, and
1920 R is used in an operand that allows both registers and memory
1921 references, reload will consider forcing C into memory and using
1922 one of the instruction's memory alternatives. Returning false
1923 here will force it to use an input reload instead. */
1924 if (GET_CODE (x) == CONST_INT && LEGITIMATE_CONSTANT_P (x))
1925 return true;
1926
1927 split_const (x, &base, &offset);
1928 if (mips_symbolic_constant_p (base, SYMBOL_CONTEXT_LEA, &type)
1929 && type != SYMBOL_FORCE_TO_MEM)
1930 {
1931 /* The same optimization as for CONST_INT. */
1932 if (SMALL_INT (offset) && mips_symbol_insns (type, MAX_MACHINE_MODE) > 0)
1933 return true;
1934
1935 /* If MIPS16 constant pools live in the text section, they should
1936 not refer to anything that might need run-time relocation. */
1937 if (TARGET_MIPS16_PCREL_LOADS && mips_got_symbol_type_p (type))
1938 return true;
1939 }
1940
1941 /* TLS symbols must be computed by mips_legitimize_move. */
1942 if (for_each_rtx (&x, &mips_tls_symbol_ref_1, NULL))
1943 return true;
1944
1945 return false;
1946 }
1947
1948 /* Implement TARGET_USE_BLOCKS_FOR_CONSTANT_P. We can't use blocks for
1949 constants when we're using a per-function constant pool. */
1950
1951 static bool
1952 mips_use_blocks_for_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED,
1953 const_rtx x ATTRIBUTE_UNUSED)
1954 {
1955 return !TARGET_MIPS16_PCREL_LOADS;
1956 }
1957 \f
1958 /* Return true if register REGNO is a valid base register for mode MODE.
1959 STRICT_P is true if REG_OK_STRICT is in effect. */
1960
1961 int
1962 mips_regno_mode_ok_for_base_p (int regno, enum machine_mode mode,
1963 bool strict_p)
1964 {
1965 if (!HARD_REGISTER_NUM_P (regno))
1966 {
1967 if (!strict_p)
1968 return true;
1969 regno = reg_renumber[regno];
1970 }
1971
1972 /* These fake registers will be eliminated to either the stack or
1973 hard frame pointer, both of which are usually valid base registers.
1974 Reload deals with the cases where the eliminated form isn't valid. */
1975 if (regno == ARG_POINTER_REGNUM || regno == FRAME_POINTER_REGNUM)
1976 return true;
1977
1978 /* In MIPS16 mode, the stack pointer can only address word and doubleword
1979 values, nothing smaller. There are two problems here:
1980
1981 (a) Instantiating virtual registers can introduce new uses of the
1982 stack pointer. If these virtual registers are valid addresses,
1983 the stack pointer should be too.
1984
1985 (b) Most uses of the stack pointer are not made explicit until
1986 FRAME_POINTER_REGNUM and ARG_POINTER_REGNUM have been eliminated.
1987 We don't know until that stage whether we'll be eliminating to the
1988 stack pointer (which needs the restriction) or the hard frame
1989 pointer (which doesn't).
1990
1991 All in all, it seems more consistent to only enforce this restriction
1992 during and after reload. */
1993 if (TARGET_MIPS16 && regno == STACK_POINTER_REGNUM)
1994 return !strict_p || GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8;
1995
1996 return TARGET_MIPS16 ? M16_REG_P (regno) : GP_REG_P (regno);
1997 }
1998
1999 /* Return true if X is a valid base register for mode MODE.
2000 STRICT_P is true if REG_OK_STRICT is in effect. */
2001
2002 static bool
2003 mips_valid_base_register_p (rtx x, enum machine_mode mode, bool strict_p)
2004 {
2005 if (!strict_p && GET_CODE (x) == SUBREG)
2006 x = SUBREG_REG (x);
2007
2008 return (REG_P (x)
2009 && mips_regno_mode_ok_for_base_p (REGNO (x), mode, strict_p));
2010 }
2011
2012 /* Return true if, for every base register BASE_REG, (plus BASE_REG X)
2013 can address a value of mode MODE. */
2014
2015 static bool
2016 mips_valid_offset_p (rtx x, enum machine_mode mode)
2017 {
2018 /* Check that X is a signed 16-bit number. */
2019 if (!const_arith_operand (x, Pmode))
2020 return false;
2021
2022 /* We may need to split multiword moves, so make sure that every word
2023 is accessible. */
2024 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2025 && !SMALL_OPERAND (INTVAL (x) + GET_MODE_SIZE (mode) - UNITS_PER_WORD))
2026 return false;
2027
2028 return true;
2029 }
2030
2031 /* Return true if a LO_SUM can address a value of mode MODE when the
2032 LO_SUM symbol has type SYMBOL_TYPE. */
2033
2034 static bool
2035 mips_valid_lo_sum_p (enum mips_symbol_type symbol_type, enum machine_mode mode)
2036 {
2037 /* Check that symbols of type SYMBOL_TYPE can be used to access values
2038 of mode MODE. */
2039 if (mips_symbol_insns (symbol_type, mode) == 0)
2040 return false;
2041
2042 /* Check that there is a known low-part relocation. */
2043 if (mips_lo_relocs[symbol_type] == NULL)
2044 return false;
2045
2046 /* We may need to split multiword moves, so make sure that each word
2047 can be accessed without inducing a carry. This is mainly needed
2048 for o64, which has historically only guaranteed 64-bit alignment
2049 for 128-bit types. */
2050 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2051 && GET_MODE_BITSIZE (mode) > GET_MODE_ALIGNMENT (mode))
2052 return false;
2053
2054 return true;
2055 }
2056
2057 /* Return true if X is a valid address for machine mode MODE. If it is,
2058 fill in INFO appropriately. STRICT_P is true if REG_OK_STRICT is in
2059 effect. */
2060
2061 static bool
2062 mips_classify_address (struct mips_address_info *info, rtx x,
2063 enum machine_mode mode, bool strict_p)
2064 {
2065 switch (GET_CODE (x))
2066 {
2067 case REG:
2068 case SUBREG:
2069 info->type = ADDRESS_REG;
2070 info->reg = x;
2071 info->offset = const0_rtx;
2072 return mips_valid_base_register_p (info->reg, mode, strict_p);
2073
2074 case PLUS:
2075 info->type = ADDRESS_REG;
2076 info->reg = XEXP (x, 0);
2077 info->offset = XEXP (x, 1);
2078 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2079 && mips_valid_offset_p (info->offset, mode));
2080
2081 case LO_SUM:
2082 info->type = ADDRESS_LO_SUM;
2083 info->reg = XEXP (x, 0);
2084 info->offset = XEXP (x, 1);
2085 /* We have to trust the creator of the LO_SUM to do something vaguely
2086 sane. Target-independent code that creates a LO_SUM should also
2087 create and verify the matching HIGH. Target-independent code that
2088 adds an offset to a LO_SUM must prove that the offset will not
2089 induce a carry. Failure to do either of these things would be
2090 a bug, and we are not required to check for it here. The MIPS
2091 backend itself should only create LO_SUMs for valid symbolic
2092 constants, with the high part being either a HIGH or a copy
2093 of _gp. */
2094 info->symbol_type
2095 = mips_classify_symbolic_expression (info->offset, SYMBOL_CONTEXT_MEM);
2096 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2097 && mips_valid_lo_sum_p (info->symbol_type, mode));
2098
2099 case CONST_INT:
2100 /* Small-integer addresses don't occur very often, but they
2101 are legitimate if $0 is a valid base register. */
2102 info->type = ADDRESS_CONST_INT;
2103 return !TARGET_MIPS16 && SMALL_INT (x);
2104
2105 case CONST:
2106 case LABEL_REF:
2107 case SYMBOL_REF:
2108 info->type = ADDRESS_SYMBOLIC;
2109 return (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_MEM,
2110 &info->symbol_type)
2111 && mips_symbol_insns (info->symbol_type, mode) > 0
2112 && !mips_split_p[info->symbol_type]);
2113
2114 default:
2115 return false;
2116 }
2117 }
2118
2119 /* Implement TARGET_LEGITIMATE_ADDRESS_P. */
2120
2121 static bool
2122 mips_legitimate_address_p (enum machine_mode mode, rtx x, bool strict_p)
2123 {
2124 struct mips_address_info addr;
2125
2126 return mips_classify_address (&addr, x, mode, strict_p);
2127 }
2128
2129 /* Return true if X is a legitimate $sp-based address for mode MDOE. */
2130
2131 bool
2132 mips_stack_address_p (rtx x, enum machine_mode mode)
2133 {
2134 struct mips_address_info addr;
2135
2136 return (mips_classify_address (&addr, x, mode, false)
2137 && addr.type == ADDRESS_REG
2138 && addr.reg == stack_pointer_rtx);
2139 }
2140
2141 /* Return true if ADDR matches the pattern for the LWXS load scaled indexed
2142 address instruction. Note that such addresses are not considered
2143 legitimate in the TARGET_LEGITIMATE_ADDRESS_P sense, because their use
2144 is so restricted. */
2145
2146 static bool
2147 mips_lwxs_address_p (rtx addr)
2148 {
2149 if (ISA_HAS_LWXS
2150 && GET_CODE (addr) == PLUS
2151 && REG_P (XEXP (addr, 1)))
2152 {
2153 rtx offset = XEXP (addr, 0);
2154 if (GET_CODE (offset) == MULT
2155 && REG_P (XEXP (offset, 0))
2156 && GET_CODE (XEXP (offset, 1)) == CONST_INT
2157 && INTVAL (XEXP (offset, 1)) == 4)
2158 return true;
2159 }
2160 return false;
2161 }
2162 \f
2163 /* Return true if a value at OFFSET bytes from base register BASE can be
2164 accessed using an unextended MIPS16 instruction. MODE is the mode of
2165 the value.
2166
2167 Usually the offset in an unextended instruction is a 5-bit field.
2168 The offset is unsigned and shifted left once for LH and SH, twice
2169 for LW and SW, and so on. An exception is LWSP and SWSP, which have
2170 an 8-bit immediate field that's shifted left twice. */
2171
2172 static bool
2173 mips16_unextended_reference_p (enum machine_mode mode, rtx base,
2174 unsigned HOST_WIDE_INT offset)
2175 {
2176 if (offset % GET_MODE_SIZE (mode) == 0)
2177 {
2178 if (GET_MODE_SIZE (mode) == 4 && base == stack_pointer_rtx)
2179 return offset < 256U * GET_MODE_SIZE (mode);
2180 return offset < 32U * GET_MODE_SIZE (mode);
2181 }
2182 return false;
2183 }
2184
2185 /* Return the number of instructions needed to load or store a value
2186 of mode MODE at address X. Return 0 if X isn't valid for MODE.
2187 Assume that multiword moves may need to be split into word moves
2188 if MIGHT_SPLIT_P, otherwise assume that a single load or store is
2189 enough.
2190
2191 For MIPS16 code, count extended instructions as two instructions. */
2192
2193 int
2194 mips_address_insns (rtx x, enum machine_mode mode, bool might_split_p)
2195 {
2196 struct mips_address_info addr;
2197 int factor;
2198
2199 /* BLKmode is used for single unaligned loads and stores and should
2200 not count as a multiword mode. (GET_MODE_SIZE (BLKmode) is pretty
2201 meaningless, so we have to single it out as a special case one way
2202 or the other.) */
2203 if (mode != BLKmode && might_split_p)
2204 factor = (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
2205 else
2206 factor = 1;
2207
2208 if (mips_classify_address (&addr, x, mode, false))
2209 switch (addr.type)
2210 {
2211 case ADDRESS_REG:
2212 if (TARGET_MIPS16
2213 && !mips16_unextended_reference_p (mode, addr.reg,
2214 UINTVAL (addr.offset)))
2215 return factor * 2;
2216 return factor;
2217
2218 case ADDRESS_LO_SUM:
2219 return TARGET_MIPS16 ? factor * 2 : factor;
2220
2221 case ADDRESS_CONST_INT:
2222 return factor;
2223
2224 case ADDRESS_SYMBOLIC:
2225 return factor * mips_symbol_insns (addr.symbol_type, mode);
2226 }
2227 return 0;
2228 }
2229
2230 /* Return the number of instructions needed to load constant X.
2231 Return 0 if X isn't a valid constant. */
2232
2233 int
2234 mips_const_insns (rtx x)
2235 {
2236 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
2237 enum mips_symbol_type symbol_type;
2238 rtx offset;
2239
2240 switch (GET_CODE (x))
2241 {
2242 case HIGH:
2243 if (!mips_symbolic_constant_p (XEXP (x, 0), SYMBOL_CONTEXT_LEA,
2244 &symbol_type)
2245 || !mips_split_p[symbol_type])
2246 return 0;
2247
2248 /* This is simply an LUI for normal mode. It is an extended
2249 LI followed by an extended SLL for MIPS16. */
2250 return TARGET_MIPS16 ? 4 : 1;
2251
2252 case CONST_INT:
2253 if (TARGET_MIPS16)
2254 /* Unsigned 8-bit constants can be loaded using an unextended
2255 LI instruction. Unsigned 16-bit constants can be loaded
2256 using an extended LI. Negative constants must be loaded
2257 using LI and then negated. */
2258 return (IN_RANGE (INTVAL (x), 0, 255) ? 1
2259 : SMALL_OPERAND_UNSIGNED (INTVAL (x)) ? 2
2260 : IN_RANGE (-INTVAL (x), 0, 255) ? 2
2261 : SMALL_OPERAND_UNSIGNED (-INTVAL (x)) ? 3
2262 : 0);
2263
2264 return mips_build_integer (codes, INTVAL (x));
2265
2266 case CONST_DOUBLE:
2267 case CONST_VECTOR:
2268 /* Allow zeros for normal mode, where we can use $0. */
2269 return !TARGET_MIPS16 && x == CONST0_RTX (GET_MODE (x)) ? 1 : 0;
2270
2271 case CONST:
2272 if (CONST_GP_P (x))
2273 return 1;
2274
2275 /* See if we can refer to X directly. */
2276 if (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_LEA, &symbol_type))
2277 return mips_symbol_insns (symbol_type, MAX_MACHINE_MODE);
2278
2279 /* Otherwise try splitting the constant into a base and offset.
2280 If the offset is a 16-bit value, we can load the base address
2281 into a register and then use (D)ADDIU to add in the offset.
2282 If the offset is larger, we can load the base and offset
2283 into separate registers and add them together with (D)ADDU.
2284 However, the latter is only possible before reload; during
2285 and after reload, we must have the option of forcing the
2286 constant into the pool instead. */
2287 split_const (x, &x, &offset);
2288 if (offset != 0)
2289 {
2290 int n = mips_const_insns (x);
2291 if (n != 0)
2292 {
2293 if (SMALL_INT (offset))
2294 return n + 1;
2295 else if (!targetm.cannot_force_const_mem (x))
2296 return n + 1 + mips_build_integer (codes, INTVAL (offset));
2297 }
2298 }
2299 return 0;
2300
2301 case SYMBOL_REF:
2302 case LABEL_REF:
2303 return mips_symbol_insns (mips_classify_symbol (x, SYMBOL_CONTEXT_LEA),
2304 MAX_MACHINE_MODE);
2305
2306 default:
2307 return 0;
2308 }
2309 }
2310
2311 /* X is a doubleword constant that can be handled by splitting it into
2312 two words and loading each word separately. Return the number of
2313 instructions required to do this. */
2314
2315 int
2316 mips_split_const_insns (rtx x)
2317 {
2318 unsigned int low, high;
2319
2320 low = mips_const_insns (mips_subword (x, false));
2321 high = mips_const_insns (mips_subword (x, true));
2322 gcc_assert (low > 0 && high > 0);
2323 return low + high;
2324 }
2325
2326 /* Return the number of instructions needed to implement INSN,
2327 given that it loads from or stores to MEM. Count extended
2328 MIPS16 instructions as two instructions. */
2329
2330 int
2331 mips_load_store_insns (rtx mem, rtx insn)
2332 {
2333 enum machine_mode mode;
2334 bool might_split_p;
2335 rtx set;
2336
2337 gcc_assert (MEM_P (mem));
2338 mode = GET_MODE (mem);
2339
2340 /* Try to prove that INSN does not need to be split. */
2341 might_split_p = true;
2342 if (GET_MODE_BITSIZE (mode) == 64)
2343 {
2344 set = single_set (insn);
2345 if (set && !mips_split_64bit_move_p (SET_DEST (set), SET_SRC (set)))
2346 might_split_p = false;
2347 }
2348
2349 return mips_address_insns (XEXP (mem, 0), mode, might_split_p);
2350 }
2351
2352 /* Return the number of instructions needed for an integer division. */
2353
2354 int
2355 mips_idiv_insns (void)
2356 {
2357 int count;
2358
2359 count = 1;
2360 if (TARGET_CHECK_ZERO_DIV)
2361 {
2362 if (GENERATE_DIVIDE_TRAPS)
2363 count++;
2364 else
2365 count += 2;
2366 }
2367
2368 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
2369 count++;
2370 return count;
2371 }
2372 \f
2373 /* Emit a move from SRC to DEST. Assume that the move expanders can
2374 handle all moves if !can_create_pseudo_p (). The distinction is
2375 important because, unlike emit_move_insn, the move expanders know
2376 how to force Pmode objects into the constant pool even when the
2377 constant pool address is not itself legitimate. */
2378
2379 rtx
2380 mips_emit_move (rtx dest, rtx src)
2381 {
2382 return (can_create_pseudo_p ()
2383 ? emit_move_insn (dest, src)
2384 : emit_move_insn_1 (dest, src));
2385 }
2386
2387 /* Emit an instruction of the form (set TARGET (CODE OP0 OP1)). */
2388
2389 static void
2390 mips_emit_binary (enum rtx_code code, rtx target, rtx op0, rtx op1)
2391 {
2392 emit_insn (gen_rtx_SET (VOIDmode, target,
2393 gen_rtx_fmt_ee (code, GET_MODE (target), op0, op1)));
2394 }
2395
2396 /* Compute (CODE OP0 OP1) and store the result in a new register
2397 of mode MODE. Return that new register. */
2398
2399 static rtx
2400 mips_force_binary (enum machine_mode mode, enum rtx_code code, rtx op0, rtx op1)
2401 {
2402 rtx reg;
2403
2404 reg = gen_reg_rtx (mode);
2405 mips_emit_binary (code, reg, op0, op1);
2406 return reg;
2407 }
2408
2409 /* Copy VALUE to a register and return that register. If new pseudos
2410 are allowed, copy it into a new register, otherwise use DEST. */
2411
2412 static rtx
2413 mips_force_temporary (rtx dest, rtx value)
2414 {
2415 if (can_create_pseudo_p ())
2416 return force_reg (Pmode, value);
2417 else
2418 {
2419 mips_emit_move (dest, value);
2420 return dest;
2421 }
2422 }
2423
2424 /* Emit a call sequence with call pattern PATTERN and return the call
2425 instruction itself (which is not necessarily the last instruction
2426 emitted). ORIG_ADDR is the original, unlegitimized address,
2427 ADDR is the legitimized form, and LAZY_P is true if the call
2428 address is lazily-bound. */
2429
2430 static rtx
2431 mips_emit_call_insn (rtx pattern, rtx orig_addr, rtx addr, bool lazy_p)
2432 {
2433 rtx insn, reg;
2434
2435 insn = emit_call_insn (pattern);
2436
2437 if (TARGET_MIPS16 && mips_use_pic_fn_addr_reg_p (orig_addr))
2438 {
2439 /* MIPS16 JALRs only take MIPS16 registers. If the target
2440 function requires $25 to be valid on entry, we must copy it
2441 there separately. The move instruction can be put in the
2442 call's delay slot. */
2443 reg = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
2444 emit_insn_before (gen_move_insn (reg, addr), insn);
2445 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), reg);
2446 }
2447
2448 if (lazy_p)
2449 /* Lazy-binding stubs require $gp to be valid on entry. */
2450 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), pic_offset_table_rtx);
2451
2452 if (TARGET_USE_GOT)
2453 {
2454 /* See the comment above load_call<mode> for details. */
2455 use_reg (&CALL_INSN_FUNCTION_USAGE (insn),
2456 gen_rtx_REG (Pmode, GOT_VERSION_REGNUM));
2457 emit_insn (gen_update_got_version ());
2458 }
2459 return insn;
2460 }
2461 \f
2462 /* Wrap symbol or label BASE in an UNSPEC address of type SYMBOL_TYPE,
2463 then add CONST_INT OFFSET to the result. */
2464
2465 static rtx
2466 mips_unspec_address_offset (rtx base, rtx offset,
2467 enum mips_symbol_type symbol_type)
2468 {
2469 base = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, base),
2470 UNSPEC_ADDRESS_FIRST + symbol_type);
2471 if (offset != const0_rtx)
2472 base = gen_rtx_PLUS (Pmode, base, offset);
2473 return gen_rtx_CONST (Pmode, base);
2474 }
2475
2476 /* Return an UNSPEC address with underlying address ADDRESS and symbol
2477 type SYMBOL_TYPE. */
2478
2479 rtx
2480 mips_unspec_address (rtx address, enum mips_symbol_type symbol_type)
2481 {
2482 rtx base, offset;
2483
2484 split_const (address, &base, &offset);
2485 return mips_unspec_address_offset (base, offset, symbol_type);
2486 }
2487
2488 /* If mips_unspec_address (ADDR, SYMBOL_TYPE) is a 32-bit value, add the
2489 high part to BASE and return the result. Just return BASE otherwise.
2490 TEMP is as for mips_force_temporary.
2491
2492 The returned expression can be used as the first operand to a LO_SUM. */
2493
2494 static rtx
2495 mips_unspec_offset_high (rtx temp, rtx base, rtx addr,
2496 enum mips_symbol_type symbol_type)
2497 {
2498 if (mips_split_p[symbol_type])
2499 {
2500 addr = gen_rtx_HIGH (Pmode, mips_unspec_address (addr, symbol_type));
2501 addr = mips_force_temporary (temp, addr);
2502 base = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, addr, base));
2503 }
2504 return base;
2505 }
2506 \f
2507 /* Return an instruction that copies $gp into register REG. We want
2508 GCC to treat the register's value as constant, so that its value
2509 can be rematerialized on demand. */
2510
2511 static rtx
2512 gen_load_const_gp (rtx reg)
2513 {
2514 return (Pmode == SImode
2515 ? gen_load_const_gp_si (reg)
2516 : gen_load_const_gp_di (reg));
2517 }
2518
2519 /* Return a pseudo register that contains the value of $gp throughout
2520 the current function. Such registers are needed by MIPS16 functions,
2521 for which $gp itself is not a valid base register or addition operand. */
2522
2523 static rtx
2524 mips16_gp_pseudo_reg (void)
2525 {
2526 if (cfun->machine->mips16_gp_pseudo_rtx == NULL_RTX)
2527 cfun->machine->mips16_gp_pseudo_rtx = gen_reg_rtx (Pmode);
2528
2529 /* Don't emit an instruction to initialize the pseudo register if
2530 we are being called from the tree optimizers' cost-calculation
2531 routines. */
2532 if (!cfun->machine->initialized_mips16_gp_pseudo_p
2533 && (current_ir_type () != IR_GIMPLE || currently_expanding_to_rtl))
2534 {
2535 rtx insn, scan;
2536
2537 push_topmost_sequence ();
2538
2539 scan = get_insns ();
2540 while (NEXT_INSN (scan) && !INSN_P (NEXT_INSN (scan)))
2541 scan = NEXT_INSN (scan);
2542
2543 insn = gen_load_const_gp (cfun->machine->mips16_gp_pseudo_rtx);
2544 emit_insn_after (insn, scan);
2545
2546 pop_topmost_sequence ();
2547
2548 cfun->machine->initialized_mips16_gp_pseudo_p = true;
2549 }
2550
2551 return cfun->machine->mips16_gp_pseudo_rtx;
2552 }
2553
2554 /* Return a base register that holds pic_offset_table_rtx.
2555 TEMP, if nonnull, is a scratch Pmode base register. */
2556
2557 rtx
2558 mips_pic_base_register (rtx temp)
2559 {
2560 if (!TARGET_MIPS16)
2561 return pic_offset_table_rtx;
2562
2563 if (can_create_pseudo_p ())
2564 return mips16_gp_pseudo_reg ();
2565
2566 if (TARGET_USE_GOT)
2567 /* The first post-reload split exposes all references to $gp
2568 (both uses and definitions). All references must remain
2569 explicit after that point.
2570
2571 It is safe to introduce uses of $gp at any time, so for
2572 simplicity, we do that before the split too. */
2573 mips_emit_move (temp, pic_offset_table_rtx);
2574 else
2575 emit_insn (gen_load_const_gp (temp));
2576 return temp;
2577 }
2578
2579 /* Create and return a GOT reference of type TYPE for address ADDR.
2580 TEMP, if nonnull, is a scratch Pmode base register. */
2581
2582 rtx
2583 mips_got_load (rtx temp, rtx addr, enum mips_symbol_type type)
2584 {
2585 rtx base, high, lo_sum_symbol;
2586
2587 base = mips_pic_base_register (temp);
2588
2589 /* If we used the temporary register to load $gp, we can't use
2590 it for the high part as well. */
2591 if (temp != NULL && reg_overlap_mentioned_p (base, temp))
2592 temp = NULL;
2593
2594 high = mips_unspec_offset_high (temp, base, addr, type);
2595 lo_sum_symbol = mips_unspec_address (addr, type);
2596
2597 if (type == SYMBOL_GOTOFF_CALL)
2598 return (Pmode == SImode
2599 ? gen_unspec_callsi (high, lo_sum_symbol)
2600 : gen_unspec_calldi (high, lo_sum_symbol));
2601 else
2602 return (Pmode == SImode
2603 ? gen_unspec_gotsi (high, lo_sum_symbol)
2604 : gen_unspec_gotdi (high, lo_sum_symbol));
2605 }
2606
2607 /* If MODE is MAX_MACHINE_MODE, ADDR appears as a move operand, otherwise
2608 it appears in a MEM of that mode. Return true if ADDR is a legitimate
2609 constant in that context and can be split into high and low parts.
2610 If so, and if LOW_OUT is nonnull, emit the high part and store the
2611 low part in *LOW_OUT. Leave *LOW_OUT unchanged otherwise.
2612
2613 TEMP is as for mips_force_temporary and is used to load the high
2614 part into a register.
2615
2616 When MODE is MAX_MACHINE_MODE, the low part is guaranteed to be
2617 a legitimize SET_SRC for an .md pattern, otherwise the low part
2618 is guaranteed to be a legitimate address for mode MODE. */
2619
2620 bool
2621 mips_split_symbol (rtx temp, rtx addr, enum machine_mode mode, rtx *low_out)
2622 {
2623 enum mips_symbol_context context;
2624 enum mips_symbol_type symbol_type;
2625 rtx high;
2626
2627 context = (mode == MAX_MACHINE_MODE
2628 ? SYMBOL_CONTEXT_LEA
2629 : SYMBOL_CONTEXT_MEM);
2630 if (GET_CODE (addr) == HIGH && context == SYMBOL_CONTEXT_LEA)
2631 {
2632 addr = XEXP (addr, 0);
2633 if (mips_symbolic_constant_p (addr, context, &symbol_type)
2634 && mips_symbol_insns (symbol_type, mode) > 0
2635 && mips_split_hi_p[symbol_type])
2636 {
2637 if (low_out)
2638 switch (symbol_type)
2639 {
2640 case SYMBOL_GOT_PAGE_OFST:
2641 /* The high part of a page/ofst pair is loaded from the GOT. */
2642 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_PAGE);
2643 break;
2644
2645 default:
2646 gcc_unreachable ();
2647 }
2648 return true;
2649 }
2650 }
2651 else
2652 {
2653 if (mips_symbolic_constant_p (addr, context, &symbol_type)
2654 && mips_symbol_insns (symbol_type, mode) > 0
2655 && mips_split_p[symbol_type])
2656 {
2657 if (low_out)
2658 switch (symbol_type)
2659 {
2660 case SYMBOL_GOT_DISP:
2661 /* SYMBOL_GOT_DISP symbols are loaded from the GOT. */
2662 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_DISP);
2663 break;
2664
2665 case SYMBOL_GP_RELATIVE:
2666 high = mips_pic_base_register (temp);
2667 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
2668 break;
2669
2670 default:
2671 high = gen_rtx_HIGH (Pmode, copy_rtx (addr));
2672 high = mips_force_temporary (temp, high);
2673 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
2674 break;
2675 }
2676 return true;
2677 }
2678 }
2679 return false;
2680 }
2681
2682 /* Return a legitimate address for REG + OFFSET. TEMP is as for
2683 mips_force_temporary; it is only needed when OFFSET is not a
2684 SMALL_OPERAND. */
2685
2686 static rtx
2687 mips_add_offset (rtx temp, rtx reg, HOST_WIDE_INT offset)
2688 {
2689 if (!SMALL_OPERAND (offset))
2690 {
2691 rtx high;
2692
2693 if (TARGET_MIPS16)
2694 {
2695 /* Load the full offset into a register so that we can use
2696 an unextended instruction for the address itself. */
2697 high = GEN_INT (offset);
2698 offset = 0;
2699 }
2700 else
2701 {
2702 /* Leave OFFSET as a 16-bit offset and put the excess in HIGH.
2703 The addition inside the macro CONST_HIGH_PART may cause an
2704 overflow, so we need to force a sign-extension check. */
2705 high = gen_int_mode (CONST_HIGH_PART (offset), Pmode);
2706 offset = CONST_LOW_PART (offset);
2707 }
2708 high = mips_force_temporary (temp, high);
2709 reg = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, high, reg));
2710 }
2711 return plus_constant (reg, offset);
2712 }
2713 \f
2714 /* The __tls_get_attr symbol. */
2715 static GTY(()) rtx mips_tls_symbol;
2716
2717 /* Return an instruction sequence that calls __tls_get_addr. SYM is
2718 the TLS symbol we are referencing and TYPE is the symbol type to use
2719 (either global dynamic or local dynamic). V0 is an RTX for the
2720 return value location. */
2721
2722 static rtx
2723 mips_call_tls_get_addr (rtx sym, enum mips_symbol_type type, rtx v0)
2724 {
2725 rtx insn, loc, a0;
2726
2727 a0 = gen_rtx_REG (Pmode, GP_ARG_FIRST);
2728
2729 if (!mips_tls_symbol)
2730 mips_tls_symbol = init_one_libfunc ("__tls_get_addr");
2731
2732 loc = mips_unspec_address (sym, type);
2733
2734 start_sequence ();
2735
2736 emit_insn (gen_rtx_SET (Pmode, a0,
2737 gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, loc)));
2738 insn = mips_expand_call (MIPS_CALL_NORMAL, v0, mips_tls_symbol,
2739 const0_rtx, NULL_RTX, false);
2740 RTL_CONST_CALL_P (insn) = 1;
2741 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), a0);
2742 insn = get_insns ();
2743
2744 end_sequence ();
2745
2746 return insn;
2747 }
2748
2749 /* Return a pseudo register that contains the current thread pointer. */
2750
2751 static rtx
2752 mips_get_tp (void)
2753 {
2754 rtx tp;
2755
2756 tp = gen_reg_rtx (Pmode);
2757 if (Pmode == DImode)
2758 emit_insn (gen_tls_get_tp_di (tp));
2759 else
2760 emit_insn (gen_tls_get_tp_si (tp));
2761 return tp;
2762 }
2763
2764 /* Generate the code to access LOC, a thread-local SYMBOL_REF, and return
2765 its address. The return value will be both a valid address and a valid
2766 SET_SRC (either a REG or a LO_SUM). */
2767
2768 static rtx
2769 mips_legitimize_tls_address (rtx loc)
2770 {
2771 rtx dest, insn, v0, tp, tmp1, tmp2, eqv;
2772 enum tls_model model;
2773
2774 if (TARGET_MIPS16)
2775 {
2776 sorry ("MIPS16 TLS");
2777 return gen_reg_rtx (Pmode);
2778 }
2779
2780 model = SYMBOL_REF_TLS_MODEL (loc);
2781 /* Only TARGET_ABICALLS code can have more than one module; other
2782 code must be be static and should not use a GOT. All TLS models
2783 reduce to local exec in this situation. */
2784 if (!TARGET_ABICALLS)
2785 model = TLS_MODEL_LOCAL_EXEC;
2786
2787 switch (model)
2788 {
2789 case TLS_MODEL_GLOBAL_DYNAMIC:
2790 v0 = gen_rtx_REG (Pmode, GP_RETURN);
2791 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSGD, v0);
2792 dest = gen_reg_rtx (Pmode);
2793 emit_libcall_block (insn, dest, v0, loc);
2794 break;
2795
2796 case TLS_MODEL_LOCAL_DYNAMIC:
2797 v0 = gen_rtx_REG (Pmode, GP_RETURN);
2798 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSLDM, v0);
2799 tmp1 = gen_reg_rtx (Pmode);
2800
2801 /* Attach a unique REG_EQUIV, to allow the RTL optimizers to
2802 share the LDM result with other LD model accesses. */
2803 eqv = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, const0_rtx),
2804 UNSPEC_TLS_LDM);
2805 emit_libcall_block (insn, tmp1, v0, eqv);
2806
2807 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_DTPREL);
2808 dest = gen_rtx_LO_SUM (Pmode, tmp2,
2809 mips_unspec_address (loc, SYMBOL_DTPREL));
2810 break;
2811
2812 case TLS_MODEL_INITIAL_EXEC:
2813 tp = mips_get_tp ();
2814 tmp1 = gen_reg_rtx (Pmode);
2815 tmp2 = mips_unspec_address (loc, SYMBOL_GOTTPREL);
2816 if (Pmode == DImode)
2817 emit_insn (gen_load_gotdi (tmp1, pic_offset_table_rtx, tmp2));
2818 else
2819 emit_insn (gen_load_gotsi (tmp1, pic_offset_table_rtx, tmp2));
2820 dest = gen_reg_rtx (Pmode);
2821 emit_insn (gen_add3_insn (dest, tmp1, tp));
2822 break;
2823
2824 case TLS_MODEL_LOCAL_EXEC:
2825 tp = mips_get_tp ();
2826 tmp1 = mips_unspec_offset_high (NULL, tp, loc, SYMBOL_TPREL);
2827 dest = gen_rtx_LO_SUM (Pmode, tmp1,
2828 mips_unspec_address (loc, SYMBOL_TPREL));
2829 break;
2830
2831 default:
2832 gcc_unreachable ();
2833 }
2834 return dest;
2835 }
2836 \f
2837 /* If X is not a valid address for mode MODE, force it into a register. */
2838
2839 static rtx
2840 mips_force_address (rtx x, enum machine_mode mode)
2841 {
2842 if (!mips_legitimate_address_p (mode, x, false))
2843 x = force_reg (Pmode, x);
2844 return x;
2845 }
2846
2847 /* This function is used to implement LEGITIMIZE_ADDRESS. If X can
2848 be legitimized in a way that the generic machinery might not expect,
2849 return a new address, otherwise return NULL. MODE is the mode of
2850 the memory being accessed. */
2851
2852 static rtx
2853 mips_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED,
2854 enum machine_mode mode)
2855 {
2856 rtx base, addr;
2857 HOST_WIDE_INT offset;
2858
2859 if (mips_tls_symbol_p (x))
2860 return mips_legitimize_tls_address (x);
2861
2862 /* See if the address can split into a high part and a LO_SUM. */
2863 if (mips_split_symbol (NULL, x, mode, &addr))
2864 return mips_force_address (addr, mode);
2865
2866 /* Handle BASE + OFFSET using mips_add_offset. */
2867 mips_split_plus (x, &base, &offset);
2868 if (offset != 0)
2869 {
2870 if (!mips_valid_base_register_p (base, mode, false))
2871 base = copy_to_mode_reg (Pmode, base);
2872 addr = mips_add_offset (NULL, base, offset);
2873 return mips_force_address (addr, mode);
2874 }
2875
2876 return x;
2877 }
2878
2879 /* Load VALUE into DEST. TEMP is as for mips_force_temporary. */
2880
2881 void
2882 mips_move_integer (rtx temp, rtx dest, unsigned HOST_WIDE_INT value)
2883 {
2884 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
2885 enum machine_mode mode;
2886 unsigned int i, num_ops;
2887 rtx x;
2888
2889 mode = GET_MODE (dest);
2890 num_ops = mips_build_integer (codes, value);
2891
2892 /* Apply each binary operation to X. Invariant: X is a legitimate
2893 source operand for a SET pattern. */
2894 x = GEN_INT (codes[0].value);
2895 for (i = 1; i < num_ops; i++)
2896 {
2897 if (!can_create_pseudo_p ())
2898 {
2899 emit_insn (gen_rtx_SET (VOIDmode, temp, x));
2900 x = temp;
2901 }
2902 else
2903 x = force_reg (mode, x);
2904 x = gen_rtx_fmt_ee (codes[i].code, mode, x, GEN_INT (codes[i].value));
2905 }
2906
2907 emit_insn (gen_rtx_SET (VOIDmode, dest, x));
2908 }
2909
2910 /* Subroutine of mips_legitimize_move. Move constant SRC into register
2911 DEST given that SRC satisfies immediate_operand but doesn't satisfy
2912 move_operand. */
2913
2914 static void
2915 mips_legitimize_const_move (enum machine_mode mode, rtx dest, rtx src)
2916 {
2917 rtx base, offset;
2918
2919 /* Split moves of big integers into smaller pieces. */
2920 if (splittable_const_int_operand (src, mode))
2921 {
2922 mips_move_integer (dest, dest, INTVAL (src));
2923 return;
2924 }
2925
2926 /* Split moves of symbolic constants into high/low pairs. */
2927 if (mips_split_symbol (dest, src, MAX_MACHINE_MODE, &src))
2928 {
2929 emit_insn (gen_rtx_SET (VOIDmode, dest, src));
2930 return;
2931 }
2932
2933 /* Generate the appropriate access sequences for TLS symbols. */
2934 if (mips_tls_symbol_p (src))
2935 {
2936 mips_emit_move (dest, mips_legitimize_tls_address (src));
2937 return;
2938 }
2939
2940 /* If we have (const (plus symbol offset)), and that expression cannot
2941 be forced into memory, load the symbol first and add in the offset.
2942 In non-MIPS16 mode, prefer to do this even if the constant _can_ be
2943 forced into memory, as it usually produces better code. */
2944 split_const (src, &base, &offset);
2945 if (offset != const0_rtx
2946 && (targetm.cannot_force_const_mem (src)
2947 || (!TARGET_MIPS16 && can_create_pseudo_p ())))
2948 {
2949 base = mips_force_temporary (dest, base);
2950 mips_emit_move (dest, mips_add_offset (NULL, base, INTVAL (offset)));
2951 return;
2952 }
2953
2954 src = force_const_mem (mode, src);
2955
2956 /* When using explicit relocs, constant pool references are sometimes
2957 not legitimate addresses. */
2958 mips_split_symbol (dest, XEXP (src, 0), mode, &XEXP (src, 0));
2959 mips_emit_move (dest, src);
2960 }
2961
2962 /* If (set DEST SRC) is not a valid move instruction, emit an equivalent
2963 sequence that is valid. */
2964
2965 bool
2966 mips_legitimize_move (enum machine_mode mode, rtx dest, rtx src)
2967 {
2968 if (!register_operand (dest, mode) && !reg_or_0_operand (src, mode))
2969 {
2970 mips_emit_move (dest, force_reg (mode, src));
2971 return true;
2972 }
2973
2974 /* We need to deal with constants that would be legitimate
2975 immediate_operands but aren't legitimate move_operands. */
2976 if (CONSTANT_P (src) && !move_operand (src, mode))
2977 {
2978 mips_legitimize_const_move (mode, dest, src);
2979 set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (src));
2980 return true;
2981 }
2982 return false;
2983 }
2984 \f
2985 /* Return true if value X in context CONTEXT is a small-data address
2986 that can be rewritten as a LO_SUM. */
2987
2988 static bool
2989 mips_rewrite_small_data_p (rtx x, enum mips_symbol_context context)
2990 {
2991 enum mips_symbol_type symbol_type;
2992
2993 return (mips_lo_relocs[SYMBOL_GP_RELATIVE]
2994 && !mips_split_p[SYMBOL_GP_RELATIVE]
2995 && mips_symbolic_constant_p (x, context, &symbol_type)
2996 && symbol_type == SYMBOL_GP_RELATIVE);
2997 }
2998
2999 /* A for_each_rtx callback for mips_small_data_pattern_p. DATA is the
3000 containing MEM, or null if none. */
3001
3002 static int
3003 mips_small_data_pattern_1 (rtx *loc, void *data)
3004 {
3005 enum mips_symbol_context context;
3006
3007 if (GET_CODE (*loc) == LO_SUM)
3008 return -1;
3009
3010 if (MEM_P (*loc))
3011 {
3012 if (for_each_rtx (&XEXP (*loc, 0), mips_small_data_pattern_1, *loc))
3013 return 1;
3014 return -1;
3015 }
3016
3017 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3018 return mips_rewrite_small_data_p (*loc, context);
3019 }
3020
3021 /* Return true if OP refers to small data symbols directly, not through
3022 a LO_SUM. */
3023
3024 bool
3025 mips_small_data_pattern_p (rtx op)
3026 {
3027 return for_each_rtx (&op, mips_small_data_pattern_1, NULL);
3028 }
3029
3030 /* A for_each_rtx callback, used by mips_rewrite_small_data.
3031 DATA is the containing MEM, or null if none. */
3032
3033 static int
3034 mips_rewrite_small_data_1 (rtx *loc, void *data)
3035 {
3036 enum mips_symbol_context context;
3037
3038 if (MEM_P (*loc))
3039 {
3040 for_each_rtx (&XEXP (*loc, 0), mips_rewrite_small_data_1, *loc);
3041 return -1;
3042 }
3043
3044 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3045 if (mips_rewrite_small_data_p (*loc, context))
3046 *loc = gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, *loc);
3047
3048 if (GET_CODE (*loc) == LO_SUM)
3049 return -1;
3050
3051 return 0;
3052 }
3053
3054 /* Rewrite instruction pattern PATTERN so that it refers to small data
3055 using explicit relocations. */
3056
3057 rtx
3058 mips_rewrite_small_data (rtx pattern)
3059 {
3060 pattern = copy_insn (pattern);
3061 for_each_rtx (&pattern, mips_rewrite_small_data_1, NULL);
3062 return pattern;
3063 }
3064 \f
3065 /* We need a lot of little routines to check the range of MIPS16 immediate
3066 operands. */
3067
3068 static int
3069 m16_check_op (rtx op, int low, int high, int mask)
3070 {
3071 return (GET_CODE (op) == CONST_INT
3072 && IN_RANGE (INTVAL (op), low, high)
3073 && (INTVAL (op) & mask) == 0);
3074 }
3075
3076 int
3077 m16_uimm3_b (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3078 {
3079 return m16_check_op (op, 0x1, 0x8, 0);
3080 }
3081
3082 int
3083 m16_simm4_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3084 {
3085 return m16_check_op (op, -0x8, 0x7, 0);
3086 }
3087
3088 int
3089 m16_nsimm4_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3090 {
3091 return m16_check_op (op, -0x7, 0x8, 0);
3092 }
3093
3094 int
3095 m16_simm5_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3096 {
3097 return m16_check_op (op, -0x10, 0xf, 0);
3098 }
3099
3100 int
3101 m16_nsimm5_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3102 {
3103 return m16_check_op (op, -0xf, 0x10, 0);
3104 }
3105
3106 int
3107 m16_uimm5_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3108 {
3109 return m16_check_op (op, -0x10 << 2, 0xf << 2, 3);
3110 }
3111
3112 int
3113 m16_nuimm5_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3114 {
3115 return m16_check_op (op, -0xf << 2, 0x10 << 2, 3);
3116 }
3117
3118 int
3119 m16_simm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3120 {
3121 return m16_check_op (op, -0x80, 0x7f, 0);
3122 }
3123
3124 int
3125 m16_nsimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3126 {
3127 return m16_check_op (op, -0x7f, 0x80, 0);
3128 }
3129
3130 int
3131 m16_uimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3132 {
3133 return m16_check_op (op, 0x0, 0xff, 0);
3134 }
3135
3136 int
3137 m16_nuimm8_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3138 {
3139 return m16_check_op (op, -0xff, 0x0, 0);
3140 }
3141
3142 int
3143 m16_uimm8_m1_1 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3144 {
3145 return m16_check_op (op, -0x1, 0xfe, 0);
3146 }
3147
3148 int
3149 m16_uimm8_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3150 {
3151 return m16_check_op (op, 0x0, 0xff << 2, 3);
3152 }
3153
3154 int
3155 m16_nuimm8_4 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3156 {
3157 return m16_check_op (op, -0xff << 2, 0x0, 3);
3158 }
3159
3160 int
3161 m16_simm8_8 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3162 {
3163 return m16_check_op (op, -0x80 << 3, 0x7f << 3, 7);
3164 }
3165
3166 int
3167 m16_nsimm8_8 (rtx op, enum machine_mode mode ATTRIBUTE_UNUSED)
3168 {
3169 return m16_check_op (op, -0x7f << 3, 0x80 << 3, 7);
3170 }
3171 \f
3172 /* The cost of loading values from the constant pool. It should be
3173 larger than the cost of any constant we want to synthesize inline. */
3174 #define CONSTANT_POOL_COST COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 8)
3175
3176 /* Return the cost of X when used as an operand to the MIPS16 instruction
3177 that implements CODE. Return -1 if there is no such instruction, or if
3178 X is not a valid immediate operand for it. */
3179
3180 static int
3181 mips16_constant_cost (int code, HOST_WIDE_INT x)
3182 {
3183 switch (code)
3184 {
3185 case ASHIFT:
3186 case ASHIFTRT:
3187 case LSHIFTRT:
3188 /* Shifts by between 1 and 8 bits (inclusive) are unextended,
3189 other shifts are extended. The shift patterns truncate the shift
3190 count to the right size, so there are no out-of-range values. */
3191 if (IN_RANGE (x, 1, 8))
3192 return 0;
3193 return COSTS_N_INSNS (1);
3194
3195 case PLUS:
3196 if (IN_RANGE (x, -128, 127))
3197 return 0;
3198 if (SMALL_OPERAND (x))
3199 return COSTS_N_INSNS (1);
3200 return -1;
3201
3202 case LEU:
3203 /* Like LE, but reject the always-true case. */
3204 if (x == -1)
3205 return -1;
3206 case LE:
3207 /* We add 1 to the immediate and use SLT. */
3208 x += 1;
3209 case XOR:
3210 /* We can use CMPI for an xor with an unsigned 16-bit X. */
3211 case LT:
3212 case LTU:
3213 if (IN_RANGE (x, 0, 255))
3214 return 0;
3215 if (SMALL_OPERAND_UNSIGNED (x))
3216 return COSTS_N_INSNS (1);
3217 return -1;
3218
3219 case EQ:
3220 case NE:
3221 /* Equality comparisons with 0 are cheap. */
3222 if (x == 0)
3223 return 0;
3224 return -1;
3225
3226 default:
3227 return -1;
3228 }
3229 }
3230
3231 /* Return true if there is a non-MIPS16 instruction that implements CODE
3232 and if that instruction accepts X as an immediate operand. */
3233
3234 static int
3235 mips_immediate_operand_p (int code, HOST_WIDE_INT x)
3236 {
3237 switch (code)
3238 {
3239 case ASHIFT:
3240 case ASHIFTRT:
3241 case LSHIFTRT:
3242 /* All shift counts are truncated to a valid constant. */
3243 return true;
3244
3245 case ROTATE:
3246 case ROTATERT:
3247 /* Likewise rotates, if the target supports rotates at all. */
3248 return ISA_HAS_ROR;
3249
3250 case AND:
3251 case IOR:
3252 case XOR:
3253 /* These instructions take 16-bit unsigned immediates. */
3254 return SMALL_OPERAND_UNSIGNED (x);
3255
3256 case PLUS:
3257 case LT:
3258 case LTU:
3259 /* These instructions take 16-bit signed immediates. */
3260 return SMALL_OPERAND (x);
3261
3262 case EQ:
3263 case NE:
3264 case GT:
3265 case GTU:
3266 /* The "immediate" forms of these instructions are really
3267 implemented as comparisons with register 0. */
3268 return x == 0;
3269
3270 case GE:
3271 case GEU:
3272 /* Likewise, meaning that the only valid immediate operand is 1. */
3273 return x == 1;
3274
3275 case LE:
3276 /* We add 1 to the immediate and use SLT. */
3277 return SMALL_OPERAND (x + 1);
3278
3279 case LEU:
3280 /* Likewise SLTU, but reject the always-true case. */
3281 return SMALL_OPERAND (x + 1) && x + 1 != 0;
3282
3283 case SIGN_EXTRACT:
3284 case ZERO_EXTRACT:
3285 /* The bit position and size are immediate operands. */
3286 return ISA_HAS_EXT_INS;
3287
3288 default:
3289 /* By default assume that $0 can be used for 0. */
3290 return x == 0;
3291 }
3292 }
3293
3294 /* Return the cost of binary operation X, given that the instruction
3295 sequence for a word-sized or smaller operation has cost SINGLE_COST
3296 and that the sequence of a double-word operation has cost DOUBLE_COST. */
3297
3298 static int
3299 mips_binary_cost (rtx x, int single_cost, int double_cost)
3300 {
3301 int cost;
3302
3303 if (GET_MODE_SIZE (GET_MODE (x)) == UNITS_PER_WORD * 2)
3304 cost = double_cost;
3305 else
3306 cost = single_cost;
3307 return (cost
3308 + rtx_cost (XEXP (x, 0), SET, !optimize_size)
3309 + rtx_cost (XEXP (x, 1), GET_CODE (x), !optimize_size));
3310 }
3311
3312 /* Return the cost of floating-point multiplications of mode MODE. */
3313
3314 static int
3315 mips_fp_mult_cost (enum machine_mode mode)
3316 {
3317 return mode == DFmode ? mips_cost->fp_mult_df : mips_cost->fp_mult_sf;
3318 }
3319
3320 /* Return the cost of floating-point divisions of mode MODE. */
3321
3322 static int
3323 mips_fp_div_cost (enum machine_mode mode)
3324 {
3325 return mode == DFmode ? mips_cost->fp_div_df : mips_cost->fp_div_sf;
3326 }
3327
3328 /* Return the cost of sign-extending OP to mode MODE, not including the
3329 cost of OP itself. */
3330
3331 static int
3332 mips_sign_extend_cost (enum machine_mode mode, rtx op)
3333 {
3334 if (MEM_P (op))
3335 /* Extended loads are as cheap as unextended ones. */
3336 return 0;
3337
3338 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3339 /* A sign extension from SImode to DImode in 64-bit mode is free. */
3340 return 0;
3341
3342 if (ISA_HAS_SEB_SEH || GENERATE_MIPS16E)
3343 /* We can use SEB or SEH. */
3344 return COSTS_N_INSNS (1);
3345
3346 /* We need to use a shift left and a shift right. */
3347 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3348 }
3349
3350 /* Return the cost of zero-extending OP to mode MODE, not including the
3351 cost of OP itself. */
3352
3353 static int
3354 mips_zero_extend_cost (enum machine_mode mode, rtx op)
3355 {
3356 if (MEM_P (op))
3357 /* Extended loads are as cheap as unextended ones. */
3358 return 0;
3359
3360 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3361 /* We need a shift left by 32 bits and a shift right by 32 bits. */
3362 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3363
3364 if (GENERATE_MIPS16E)
3365 /* We can use ZEB or ZEH. */
3366 return COSTS_N_INSNS (1);
3367
3368 if (TARGET_MIPS16)
3369 /* We need to load 0xff or 0xffff into a register and use AND. */
3370 return COSTS_N_INSNS (GET_MODE (op) == QImode ? 2 : 3);
3371
3372 /* We can use ANDI. */
3373 return COSTS_N_INSNS (1);
3374 }
3375
3376 /* Implement TARGET_RTX_COSTS. */
3377
3378 static bool
3379 mips_rtx_costs (rtx x, int code, int outer_code, int *total,
3380 bool speed)
3381 {
3382 enum machine_mode mode = GET_MODE (x);
3383 bool float_mode_p = FLOAT_MODE_P (mode);
3384 int cost;
3385 rtx addr;
3386
3387 /* The cost of a COMPARE is hard to define for MIPS. COMPAREs don't
3388 appear in the instruction stream, and the cost of a comparison is
3389 really the cost of the branch or scc condition. At the time of
3390 writing, GCC only uses an explicit outer COMPARE code when optabs
3391 is testing whether a constant is expensive enough to force into a
3392 register. We want optabs to pass such constants through the MIPS
3393 expanders instead, so make all constants very cheap here. */
3394 if (outer_code == COMPARE)
3395 {
3396 gcc_assert (CONSTANT_P (x));
3397 *total = 0;
3398 return true;
3399 }
3400
3401 switch (code)
3402 {
3403 case CONST_INT:
3404 /* Treat *clear_upper32-style ANDs as having zero cost in the
3405 second operand. The cost is entirely in the first operand.
3406
3407 ??? This is needed because we would otherwise try to CSE
3408 the constant operand. Although that's the right thing for
3409 instructions that continue to be a register operation throughout
3410 compilation, it is disastrous for instructions that could
3411 later be converted into a memory operation. */
3412 if (TARGET_64BIT
3413 && outer_code == AND
3414 && UINTVAL (x) == 0xffffffff)
3415 {
3416 *total = 0;
3417 return true;
3418 }
3419
3420 if (TARGET_MIPS16)
3421 {
3422 cost = mips16_constant_cost (outer_code, INTVAL (x));
3423 if (cost >= 0)
3424 {
3425 *total = cost;
3426 return true;
3427 }
3428 }
3429 else
3430 {
3431 /* When not optimizing for size, we care more about the cost
3432 of hot code, and hot code is often in a loop. If a constant
3433 operand needs to be forced into a register, we will often be
3434 able to hoist the constant load out of the loop, so the load
3435 should not contribute to the cost. */
3436 if (!optimize_size
3437 || mips_immediate_operand_p (outer_code, INTVAL (x)))
3438 {
3439 *total = 0;
3440 return true;
3441 }
3442 }
3443 /* Fall through. */
3444
3445 case CONST:
3446 case SYMBOL_REF:
3447 case LABEL_REF:
3448 case CONST_DOUBLE:
3449 if (force_to_mem_operand (x, VOIDmode))
3450 {
3451 *total = COSTS_N_INSNS (1);
3452 return true;
3453 }
3454 cost = mips_const_insns (x);
3455 if (cost > 0)
3456 {
3457 /* If the constant is likely to be stored in a GPR, SETs of
3458 single-insn constants are as cheap as register sets; we
3459 never want to CSE them.
3460
3461 Don't reduce the cost of storing a floating-point zero in
3462 FPRs. If we have a zero in an FPR for other reasons, we
3463 can get better cfg-cleanup and delayed-branch results by
3464 using it consistently, rather than using $0 sometimes and
3465 an FPR at other times. Also, moves between floating-point
3466 registers are sometimes cheaper than (D)MTC1 $0. */
3467 if (cost == 1
3468 && outer_code == SET
3469 && !(float_mode_p && TARGET_HARD_FLOAT))
3470 cost = 0;
3471 /* When non-MIPS16 code loads a constant N>1 times, we rarely
3472 want to CSE the constant itself. It is usually better to
3473 have N copies of the last operation in the sequence and one
3474 shared copy of the other operations. (Note that this is
3475 not true for MIPS16 code, where the final operation in the
3476 sequence is often an extended instruction.)
3477
3478 Also, if we have a CONST_INT, we don't know whether it is
3479 for a word or doubleword operation, so we cannot rely on
3480 the result of mips_build_integer. */
3481 else if (!TARGET_MIPS16
3482 && (outer_code == SET || mode == VOIDmode))
3483 cost = 1;
3484 *total = COSTS_N_INSNS (cost);
3485 return true;
3486 }
3487 /* The value will need to be fetched from the constant pool. */
3488 *total = CONSTANT_POOL_COST;
3489 return true;
3490
3491 case MEM:
3492 /* If the address is legitimate, return the number of
3493 instructions it needs. */
3494 addr = XEXP (x, 0);
3495 cost = mips_address_insns (addr, mode, true);
3496 if (cost > 0)
3497 {
3498 *total = COSTS_N_INSNS (cost + 1);
3499 return true;
3500 }
3501 /* Check for a scaled indexed address. */
3502 if (mips_lwxs_address_p (addr))
3503 {
3504 *total = COSTS_N_INSNS (2);
3505 return true;
3506 }
3507 /* Otherwise use the default handling. */
3508 return false;
3509
3510 case FFS:
3511 *total = COSTS_N_INSNS (6);
3512 return false;
3513
3514 case NOT:
3515 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 2 : 1);
3516 return false;
3517
3518 case AND:
3519 /* Check for a *clear_upper32 pattern and treat it like a zero
3520 extension. See the pattern's comment for details. */
3521 if (TARGET_64BIT
3522 && mode == DImode
3523 && CONST_INT_P (XEXP (x, 1))
3524 && UINTVAL (XEXP (x, 1)) == 0xffffffff)
3525 {
3526 *total = (mips_zero_extend_cost (mode, XEXP (x, 0))
3527 + rtx_cost (XEXP (x, 0), SET, speed));
3528 return true;
3529 }
3530 /* Fall through. */
3531
3532 case IOR:
3533 case XOR:
3534 /* Double-word operations use two single-word operations. */
3535 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (2));
3536 return true;
3537
3538 case ASHIFT:
3539 case ASHIFTRT:
3540 case LSHIFTRT:
3541 case ROTATE:
3542 case ROTATERT:
3543 if (CONSTANT_P (XEXP (x, 1)))
3544 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4));
3545 else
3546 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (12));
3547 return true;
3548
3549 case ABS:
3550 if (float_mode_p)
3551 *total = mips_cost->fp_add;
3552 else
3553 *total = COSTS_N_INSNS (4);
3554 return false;
3555
3556 case LO_SUM:
3557 /* Low-part immediates need an extended MIPS16 instruction. */
3558 *total = (COSTS_N_INSNS (TARGET_MIPS16 ? 2 : 1)
3559 + rtx_cost (XEXP (x, 0), SET, speed));
3560 return true;
3561
3562 case LT:
3563 case LTU:
3564 case LE:
3565 case LEU:
3566 case GT:
3567 case GTU:
3568 case GE:
3569 case GEU:
3570 case EQ:
3571 case NE:
3572 case UNORDERED:
3573 case LTGT:
3574 /* Branch comparisons have VOIDmode, so use the first operand's
3575 mode instead. */
3576 mode = GET_MODE (XEXP (x, 0));
3577 if (FLOAT_MODE_P (mode))
3578 {
3579 *total = mips_cost->fp_add;
3580 return false;
3581 }
3582 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4));
3583 return true;
3584
3585 case MINUS:
3586 if (float_mode_p
3587 && (ISA_HAS_NMADD4_NMSUB4 (mode) || ISA_HAS_NMADD3_NMSUB3 (mode))
3588 && TARGET_FUSED_MADD
3589 && !HONOR_NANS (mode)
3590 && !HONOR_SIGNED_ZEROS (mode))
3591 {
3592 /* See if we can use NMADD or NMSUB. See mips.md for the
3593 associated patterns. */
3594 rtx op0 = XEXP (x, 0);
3595 rtx op1 = XEXP (x, 1);
3596 if (GET_CODE (op0) == MULT && GET_CODE (XEXP (op0, 0)) == NEG)
3597 {
3598 *total = (mips_fp_mult_cost (mode)
3599 + rtx_cost (XEXP (XEXP (op0, 0), 0), SET, speed)
3600 + rtx_cost (XEXP (op0, 1), SET, speed)
3601 + rtx_cost (op1, SET, speed));
3602 return true;
3603 }
3604 if (GET_CODE (op1) == MULT)
3605 {
3606 *total = (mips_fp_mult_cost (mode)
3607 + rtx_cost (op0, SET, speed)
3608 + rtx_cost (XEXP (op1, 0), SET, speed)
3609 + rtx_cost (XEXP (op1, 1), SET, speed));
3610 return true;
3611 }
3612 }
3613 /* Fall through. */
3614
3615 case PLUS:
3616 if (float_mode_p)
3617 {
3618 /* If this is part of a MADD or MSUB, treat the PLUS as
3619 being free. */
3620 if (ISA_HAS_FP4
3621 && TARGET_FUSED_MADD
3622 && GET_CODE (XEXP (x, 0)) == MULT)
3623 *total = 0;
3624 else
3625 *total = mips_cost->fp_add;
3626 return false;
3627 }
3628
3629 /* Double-word operations require three single-word operations and
3630 an SLTU. The MIPS16 version then needs to move the result of
3631 the SLTU from $24 to a MIPS16 register. */
3632 *total = mips_binary_cost (x, COSTS_N_INSNS (1),
3633 COSTS_N_INSNS (TARGET_MIPS16 ? 5 : 4));
3634 return true;
3635
3636 case NEG:
3637 if (float_mode_p
3638 && (ISA_HAS_NMADD4_NMSUB4 (mode) || ISA_HAS_NMADD3_NMSUB3 (mode))
3639 && TARGET_FUSED_MADD
3640 && !HONOR_NANS (mode)
3641 && HONOR_SIGNED_ZEROS (mode))
3642 {
3643 /* See if we can use NMADD or NMSUB. See mips.md for the
3644 associated patterns. */
3645 rtx op = XEXP (x, 0);
3646 if ((GET_CODE (op) == PLUS || GET_CODE (op) == MINUS)
3647 && GET_CODE (XEXP (op, 0)) == MULT)
3648 {
3649 *total = (mips_fp_mult_cost (mode)
3650 + rtx_cost (XEXP (XEXP (op, 0), 0), SET, speed)
3651 + rtx_cost (XEXP (XEXP (op, 0), 1), SET, speed)
3652 + rtx_cost (XEXP (op, 1), SET, speed));
3653 return true;
3654 }
3655 }
3656
3657 if (float_mode_p)
3658 *total = mips_cost->fp_add;
3659 else
3660 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 4 : 1);
3661 return false;
3662
3663 case MULT:
3664 if (float_mode_p)
3665 *total = mips_fp_mult_cost (mode);
3666 else if (mode == DImode && !TARGET_64BIT)
3667 /* Synthesized from 2 mulsi3s, 1 mulsidi3 and two additions,
3668 where the mulsidi3 always includes an MFHI and an MFLO. */
3669 *total = (optimize_size
3670 ? COSTS_N_INSNS (ISA_HAS_MUL3 ? 7 : 9)
3671 : mips_cost->int_mult_si * 3 + 6);
3672 else if (optimize_size)
3673 *total = (ISA_HAS_MUL3 ? 1 : 2);
3674 else if (mode == DImode)
3675 *total = mips_cost->int_mult_di;
3676 else
3677 *total = mips_cost->int_mult_si;
3678 return false;
3679
3680 case DIV:
3681 /* Check for a reciprocal. */
3682 if (float_mode_p
3683 && ISA_HAS_FP4
3684 && flag_unsafe_math_optimizations
3685 && XEXP (x, 0) == CONST1_RTX (mode))
3686 {
3687 if (outer_code == SQRT || GET_CODE (XEXP (x, 1)) == SQRT)
3688 /* An rsqrt<mode>a or rsqrt<mode>b pattern. Count the
3689 division as being free. */
3690 *total = rtx_cost (XEXP (x, 1), SET, speed);
3691 else
3692 *total = (mips_fp_div_cost (mode)
3693 + rtx_cost (XEXP (x, 1), SET, speed));
3694 return true;
3695 }
3696 /* Fall through. */
3697
3698 case SQRT:
3699 case MOD:
3700 if (float_mode_p)
3701 {
3702 *total = mips_fp_div_cost (mode);
3703 return false;
3704 }
3705 /* Fall through. */
3706
3707 case UDIV:
3708 case UMOD:
3709 if (optimize_size)
3710 {
3711 /* It is our responsibility to make division by a power of 2
3712 as cheap as 2 register additions if we want the division
3713 expanders to be used for such operations; see the setting
3714 of sdiv_pow2_cheap in optabs.c. Using (D)DIV for MIPS16
3715 should always produce shorter code than using
3716 expand_sdiv2_pow2. */
3717 if (TARGET_MIPS16
3718 && CONST_INT_P (XEXP (x, 1))
3719 && exact_log2 (INTVAL (XEXP (x, 1))) >= 0)
3720 {
3721 *total = COSTS_N_INSNS (2) + rtx_cost (XEXP (x, 0), SET, speed);
3722 return true;
3723 }
3724 *total = COSTS_N_INSNS (mips_idiv_insns ());
3725 }
3726 else if (mode == DImode)
3727 *total = mips_cost->int_div_di;
3728 else
3729 *total = mips_cost->int_div_si;
3730 return false;
3731
3732 case SIGN_EXTEND:
3733 *total = mips_sign_extend_cost (mode, XEXP (x, 0));
3734 return false;
3735
3736 case ZERO_EXTEND:
3737 *total = mips_zero_extend_cost (mode, XEXP (x, 0));
3738 return false;
3739
3740 case FLOAT:
3741 case UNSIGNED_FLOAT:
3742 case FIX:
3743 case FLOAT_EXTEND:
3744 case FLOAT_TRUNCATE:
3745 *total = mips_cost->fp_add;
3746 return false;
3747
3748 default:
3749 return false;
3750 }
3751 }
3752
3753 /* Implement TARGET_ADDRESS_COST. */
3754
3755 static int
3756 mips_address_cost (rtx addr, bool speed ATTRIBUTE_UNUSED)
3757 {
3758 return mips_address_insns (addr, SImode, false);
3759 }
3760 \f
3761 /* Return one word of double-word value OP, taking into account the fixed
3762 endianness of certain registers. HIGH_P is true to select the high part,
3763 false to select the low part. */
3764
3765 rtx
3766 mips_subword (rtx op, bool high_p)
3767 {
3768 unsigned int byte, offset;
3769 enum machine_mode mode;
3770
3771 mode = GET_MODE (op);
3772 if (mode == VOIDmode)
3773 mode = TARGET_64BIT ? TImode : DImode;
3774
3775 if (TARGET_BIG_ENDIAN ? !high_p : high_p)
3776 byte = UNITS_PER_WORD;
3777 else
3778 byte = 0;
3779
3780 if (FP_REG_RTX_P (op))
3781 {
3782 /* Paired FPRs are always ordered little-endian. */
3783 offset = (UNITS_PER_WORD < UNITS_PER_HWFPVALUE ? high_p : byte != 0);
3784 return gen_rtx_REG (word_mode, REGNO (op) + offset);
3785 }
3786
3787 if (MEM_P (op))
3788 return mips_rewrite_small_data (adjust_address (op, word_mode, byte));
3789
3790 return simplify_gen_subreg (word_mode, op, mode, byte);
3791 }
3792
3793 /* Return true if a 64-bit move from SRC to DEST should be split into two. */
3794
3795 bool
3796 mips_split_64bit_move_p (rtx dest, rtx src)
3797 {
3798 if (TARGET_64BIT)
3799 return false;
3800
3801 /* FPR-to-FPR moves can be done in a single instruction, if they're
3802 allowed at all. */
3803 if (FP_REG_RTX_P (src) && FP_REG_RTX_P (dest))
3804 return false;
3805
3806 /* Check for floating-point loads and stores. */
3807 if (ISA_HAS_LDC1_SDC1)
3808 {
3809 if (FP_REG_RTX_P (dest) && MEM_P (src))
3810 return false;
3811 if (FP_REG_RTX_P (src) && MEM_P (dest))
3812 return false;
3813 }
3814 return true;
3815 }
3816
3817 /* Split a doubleword move from SRC to DEST. On 32-bit targets,
3818 this function handles 64-bit moves for which mips_split_64bit_move_p
3819 holds. For 64-bit targets, this function handles 128-bit moves. */
3820
3821 void
3822 mips_split_doubleword_move (rtx dest, rtx src)
3823 {
3824 rtx low_dest;
3825
3826 if (FP_REG_RTX_P (dest) || FP_REG_RTX_P (src))
3827 {
3828 if (!TARGET_64BIT && GET_MODE (dest) == DImode)
3829 emit_insn (gen_move_doubleword_fprdi (dest, src));
3830 else if (!TARGET_64BIT && GET_MODE (dest) == DFmode)
3831 emit_insn (gen_move_doubleword_fprdf (dest, src));
3832 else if (!TARGET_64BIT && GET_MODE (dest) == V2SFmode)
3833 emit_insn (gen_move_doubleword_fprv2sf (dest, src));
3834 else if (!TARGET_64BIT && GET_MODE (dest) == V2SImode)
3835 emit_insn (gen_move_doubleword_fprv2si (dest, src));
3836 else if (!TARGET_64BIT && GET_MODE (dest) == V4HImode)
3837 emit_insn (gen_move_doubleword_fprv4hi (dest, src));
3838 else if (!TARGET_64BIT && GET_MODE (dest) == V8QImode)
3839 emit_insn (gen_move_doubleword_fprv8qi (dest, src));
3840 else if (TARGET_64BIT && GET_MODE (dest) == TFmode)
3841 emit_insn (gen_move_doubleword_fprtf (dest, src));
3842 else
3843 gcc_unreachable ();
3844 }
3845 else if (REG_P (dest) && REGNO (dest) == MD_REG_FIRST)
3846 {
3847 low_dest = mips_subword (dest, false);
3848 mips_emit_move (low_dest, mips_subword (src, false));
3849 if (TARGET_64BIT)
3850 emit_insn (gen_mthidi_ti (dest, mips_subword (src, true), low_dest));
3851 else
3852 emit_insn (gen_mthisi_di (dest, mips_subword (src, true), low_dest));
3853 }
3854 else if (REG_P (src) && REGNO (src) == MD_REG_FIRST)
3855 {
3856 mips_emit_move (mips_subword (dest, false), mips_subword (src, false));
3857 if (TARGET_64BIT)
3858 emit_insn (gen_mfhidi_ti (mips_subword (dest, true), src));
3859 else
3860 emit_insn (gen_mfhisi_di (mips_subword (dest, true), src));
3861 }
3862 else
3863 {
3864 /* The operation can be split into two normal moves. Decide in
3865 which order to do them. */
3866 low_dest = mips_subword (dest, false);
3867 if (REG_P (low_dest)
3868 && reg_overlap_mentioned_p (low_dest, src))
3869 {
3870 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
3871 mips_emit_move (low_dest, mips_subword (src, false));
3872 }
3873 else
3874 {
3875 mips_emit_move (low_dest, mips_subword (src, false));
3876 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
3877 }
3878 }
3879 }
3880 \f
3881 /* Return the appropriate instructions to move SRC into DEST. Assume
3882 that SRC is operand 1 and DEST is operand 0. */
3883
3884 const char *
3885 mips_output_move (rtx dest, rtx src)
3886 {
3887 enum rtx_code dest_code, src_code;
3888 enum machine_mode mode;
3889 enum mips_symbol_type symbol_type;
3890 bool dbl_p;
3891
3892 dest_code = GET_CODE (dest);
3893 src_code = GET_CODE (src);
3894 mode = GET_MODE (dest);
3895 dbl_p = (GET_MODE_SIZE (mode) == 8);
3896
3897 if (dbl_p && mips_split_64bit_move_p (dest, src))
3898 return "#";
3899
3900 if ((src_code == REG && GP_REG_P (REGNO (src)))
3901 || (!TARGET_MIPS16 && src == CONST0_RTX (mode)))
3902 {
3903 if (dest_code == REG)
3904 {
3905 if (GP_REG_P (REGNO (dest)))
3906 return "move\t%0,%z1";
3907
3908 /* Moves to HI are handled by special .md insns. */
3909 if (REGNO (dest) == LO_REGNUM)
3910 return "mtlo\t%z1";
3911
3912 if (DSP_ACC_REG_P (REGNO (dest)))
3913 {
3914 static char retval[] = "mt__\t%z1,%q0";
3915
3916 retval[2] = reg_names[REGNO (dest)][4];
3917 retval[3] = reg_names[REGNO (dest)][5];
3918 return retval;
3919 }
3920
3921 if (FP_REG_P (REGNO (dest)))
3922 return dbl_p ? "dmtc1\t%z1,%0" : "mtc1\t%z1,%0";
3923
3924 if (ALL_COP_REG_P (REGNO (dest)))
3925 {
3926 static char retval[] = "dmtc_\t%z1,%0";
3927
3928 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
3929 return dbl_p ? retval : retval + 1;
3930 }
3931 }
3932 if (dest_code == MEM)
3933 switch (GET_MODE_SIZE (mode))
3934 {
3935 case 1: return "sb\t%z1,%0";
3936 case 2: return "sh\t%z1,%0";
3937 case 4: return "sw\t%z1,%0";
3938 case 8: return "sd\t%z1,%0";
3939 }
3940 }
3941 if (dest_code == REG && GP_REG_P (REGNO (dest)))
3942 {
3943 if (src_code == REG)
3944 {
3945 /* Moves from HI are handled by special .md insns. */
3946 if (REGNO (src) == LO_REGNUM)
3947 {
3948 /* When generating VR4120 or VR4130 code, we use MACC and
3949 DMACC instead of MFLO. This avoids both the normal
3950 MIPS III HI/LO hazards and the errata related to
3951 -mfix-vr4130. */
3952 if (ISA_HAS_MACCHI)
3953 return dbl_p ? "dmacc\t%0,%.,%." : "macc\t%0,%.,%.";
3954 return "mflo\t%0";
3955 }
3956
3957 if (DSP_ACC_REG_P (REGNO (src)))
3958 {
3959 static char retval[] = "mf__\t%0,%q1";
3960
3961 retval[2] = reg_names[REGNO (src)][4];
3962 retval[3] = reg_names[REGNO (src)][5];
3963 return retval;
3964 }
3965
3966 if (FP_REG_P (REGNO (src)))
3967 return dbl_p ? "dmfc1\t%0,%1" : "mfc1\t%0,%1";
3968
3969 if (ALL_COP_REG_P (REGNO (src)))
3970 {
3971 static char retval[] = "dmfc_\t%0,%1";
3972
3973 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
3974 return dbl_p ? retval : retval + 1;
3975 }
3976
3977 if (ST_REG_P (REGNO (src)) && ISA_HAS_8CC)
3978 return "lui\t%0,0x3f80\n\tmovf\t%0,%.,%1";
3979 }
3980
3981 if (src_code == MEM)
3982 switch (GET_MODE_SIZE (mode))
3983 {
3984 case 1: return "lbu\t%0,%1";
3985 case 2: return "lhu\t%0,%1";
3986 case 4: return "lw\t%0,%1";
3987 case 8: return "ld\t%0,%1";
3988 }
3989
3990 if (src_code == CONST_INT)
3991 {
3992 /* Don't use the X format for the operand itself, because that
3993 will give out-of-range numbers for 64-bit hosts and 32-bit
3994 targets. */
3995 if (!TARGET_MIPS16)
3996 return "li\t%0,%1\t\t\t# %X1";
3997
3998 if (SMALL_OPERAND_UNSIGNED (INTVAL (src)))
3999 return "li\t%0,%1";
4000
4001 if (SMALL_OPERAND_UNSIGNED (-INTVAL (src)))
4002 return "#";
4003 }
4004
4005 if (src_code == HIGH)
4006 return TARGET_MIPS16 ? "#" : "lui\t%0,%h1";
4007
4008 if (CONST_GP_P (src))
4009 return "move\t%0,%1";
4010
4011 if (mips_symbolic_constant_p (src, SYMBOL_CONTEXT_LEA, &symbol_type)
4012 && mips_lo_relocs[symbol_type] != 0)
4013 {
4014 /* A signed 16-bit constant formed by applying a relocation
4015 operator to a symbolic address. */
4016 gcc_assert (!mips_split_p[symbol_type]);
4017 return "li\t%0,%R1";
4018 }
4019
4020 if (symbolic_operand (src, VOIDmode))
4021 {
4022 gcc_assert (TARGET_MIPS16
4023 ? TARGET_MIPS16_TEXT_LOADS
4024 : !TARGET_EXPLICIT_RELOCS);
4025 return dbl_p ? "dla\t%0,%1" : "la\t%0,%1";
4026 }
4027 }
4028 if (src_code == REG && FP_REG_P (REGNO (src)))
4029 {
4030 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4031 {
4032 if (GET_MODE (dest) == V2SFmode)
4033 return "mov.ps\t%0,%1";
4034 else
4035 return dbl_p ? "mov.d\t%0,%1" : "mov.s\t%0,%1";
4036 }
4037
4038 if (dest_code == MEM)
4039 return dbl_p ? "sdc1\t%1,%0" : "swc1\t%1,%0";
4040 }
4041 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4042 {
4043 if (src_code == MEM)
4044 return dbl_p ? "ldc1\t%0,%1" : "lwc1\t%0,%1";
4045 }
4046 if (dest_code == REG && ALL_COP_REG_P (REGNO (dest)) && src_code == MEM)
4047 {
4048 static char retval[] = "l_c_\t%0,%1";
4049
4050 retval[1] = (dbl_p ? 'd' : 'w');
4051 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
4052 return retval;
4053 }
4054 if (dest_code == MEM && src_code == REG && ALL_COP_REG_P (REGNO (src)))
4055 {
4056 static char retval[] = "s_c_\t%1,%0";
4057
4058 retval[1] = (dbl_p ? 'd' : 'w');
4059 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
4060 return retval;
4061 }
4062 gcc_unreachable ();
4063 }
4064 \f
4065 /* Return true if CMP1 is a suitable second operand for integer ordering
4066 test CODE. See also the *sCC patterns in mips.md. */
4067
4068 static bool
4069 mips_int_order_operand_ok_p (enum rtx_code code, rtx cmp1)
4070 {
4071 switch (code)
4072 {
4073 case GT:
4074 case GTU:
4075 return reg_or_0_operand (cmp1, VOIDmode);
4076
4077 case GE:
4078 case GEU:
4079 return !TARGET_MIPS16 && cmp1 == const1_rtx;
4080
4081 case LT:
4082 case LTU:
4083 return arith_operand (cmp1, VOIDmode);
4084
4085 case LE:
4086 return sle_operand (cmp1, VOIDmode);
4087
4088 case LEU:
4089 return sleu_operand (cmp1, VOIDmode);
4090
4091 default:
4092 gcc_unreachable ();
4093 }
4094 }
4095
4096 /* Return true if *CMP1 (of mode MODE) is a valid second operand for
4097 integer ordering test *CODE, or if an equivalent combination can
4098 be formed by adjusting *CODE and *CMP1. When returning true, update
4099 *CODE and *CMP1 with the chosen code and operand, otherwise leave
4100 them alone. */
4101
4102 static bool
4103 mips_canonicalize_int_order_test (enum rtx_code *code, rtx *cmp1,
4104 enum machine_mode mode)
4105 {
4106 HOST_WIDE_INT plus_one;
4107
4108 if (mips_int_order_operand_ok_p (*code, *cmp1))
4109 return true;
4110
4111 if (GET_CODE (*cmp1) == CONST_INT)
4112 switch (*code)
4113 {
4114 case LE:
4115 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4116 if (INTVAL (*cmp1) < plus_one)
4117 {
4118 *code = LT;
4119 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4120 return true;
4121 }
4122 break;
4123
4124 case LEU:
4125 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4126 if (plus_one != 0)
4127 {
4128 *code = LTU;
4129 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4130 return true;
4131 }
4132 break;
4133
4134 default:
4135 break;
4136 }
4137 return false;
4138 }
4139
4140 /* Compare CMP0 and CMP1 using ordering test CODE and store the result
4141 in TARGET. CMP0 and TARGET are register_operands. If INVERT_PTR
4142 is nonnull, it's OK to set TARGET to the inverse of the result and
4143 flip *INVERT_PTR instead. */
4144
4145 static void
4146 mips_emit_int_order_test (enum rtx_code code, bool *invert_ptr,
4147 rtx target, rtx cmp0, rtx cmp1)
4148 {
4149 enum machine_mode mode;
4150
4151 /* First see if there is a MIPS instruction that can do this operation.
4152 If not, try doing the same for the inverse operation. If that also
4153 fails, force CMP1 into a register and try again. */
4154 mode = GET_MODE (cmp0);
4155 if (mips_canonicalize_int_order_test (&code, &cmp1, mode))
4156 mips_emit_binary (code, target, cmp0, cmp1);
4157 else
4158 {
4159 enum rtx_code inv_code = reverse_condition (code);
4160 if (!mips_canonicalize_int_order_test (&inv_code, &cmp1, mode))
4161 {
4162 cmp1 = force_reg (mode, cmp1);
4163 mips_emit_int_order_test (code, invert_ptr, target, cmp0, cmp1);
4164 }
4165 else if (invert_ptr == 0)
4166 {
4167 rtx inv_target;
4168
4169 inv_target = mips_force_binary (GET_MODE (target),
4170 inv_code, cmp0, cmp1);
4171 mips_emit_binary (XOR, target, inv_target, const1_rtx);
4172 }
4173 else
4174 {
4175 *invert_ptr = !*invert_ptr;
4176 mips_emit_binary (inv_code, target, cmp0, cmp1);
4177 }
4178 }
4179 }
4180
4181 /* Return a register that is zero iff CMP0 and CMP1 are equal.
4182 The register will have the same mode as CMP0. */
4183
4184 static rtx
4185 mips_zero_if_equal (rtx cmp0, rtx cmp1)
4186 {
4187 if (cmp1 == const0_rtx)
4188 return cmp0;
4189
4190 if (uns_arith_operand (cmp1, VOIDmode))
4191 return expand_binop (GET_MODE (cmp0), xor_optab,
4192 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4193
4194 return expand_binop (GET_MODE (cmp0), sub_optab,
4195 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4196 }
4197
4198 /* Convert *CODE into a code that can be used in a floating-point
4199 scc instruction (C.cond.fmt). Return true if the values of
4200 the condition code registers will be inverted, with 0 indicating
4201 that the condition holds. */
4202
4203 static bool
4204 mips_reversed_fp_cond (enum rtx_code *code)
4205 {
4206 switch (*code)
4207 {
4208 case NE:
4209 case LTGT:
4210 case ORDERED:
4211 *code = reverse_condition_maybe_unordered (*code);
4212 return true;
4213
4214 default:
4215 return false;
4216 }
4217 }
4218
4219 /* Convert a comparison into something that can be used in a branch or
4220 conditional move. On entry, *OP0 and *OP1 are the values being
4221 compared and *CODE is the code used to compare them.
4222
4223 Update *CODE, *OP0 and *OP1 so that they describe the final comparison.
4224 If NEED_EQ_NE_P, then only EQ or NE comparisons against zero are possible,
4225 otherwise any standard branch condition can be used. The standard branch
4226 conditions are:
4227
4228 - EQ or NE between two registers.
4229 - any comparison between a register and zero. */
4230
4231 static void
4232 mips_emit_compare (enum rtx_code *code, rtx *op0, rtx *op1, bool need_eq_ne_p)
4233 {
4234 rtx cmp_op0 = *op0;
4235 rtx cmp_op1 = *op1;
4236
4237 if (GET_MODE_CLASS (GET_MODE (*op0)) == MODE_INT)
4238 {
4239 if (!need_eq_ne_p && *op1 == const0_rtx)
4240 ;
4241 else if (*code == EQ || *code == NE)
4242 {
4243 if (need_eq_ne_p)
4244 {
4245 *op0 = mips_zero_if_equal (cmp_op0, cmp_op1);
4246 *op1 = const0_rtx;
4247 }
4248 else
4249 *op1 = force_reg (GET_MODE (cmp_op0), cmp_op1);
4250 }
4251 else
4252 {
4253 /* The comparison needs a separate scc instruction. Store the
4254 result of the scc in *OP0 and compare it against zero. */
4255 bool invert = false;
4256 *op0 = gen_reg_rtx (GET_MODE (cmp_op0));
4257 mips_emit_int_order_test (*code, &invert, *op0, cmp_op0, cmp_op1);
4258 *code = (invert ? EQ : NE);
4259 *op1 = const0_rtx;
4260 }
4261 }
4262 else if (ALL_FIXED_POINT_MODE_P (GET_MODE (cmp_op0)))
4263 {
4264 *op0 = gen_rtx_REG (CCDSPmode, CCDSP_CC_REGNUM);
4265 mips_emit_binary (*code, *op0, cmp_op0, cmp_op1);
4266 *code = NE;
4267 *op1 = const0_rtx;
4268 }
4269 else
4270 {
4271 enum rtx_code cmp_code;
4272
4273 /* Floating-point tests use a separate C.cond.fmt comparison to
4274 set a condition code register. The branch or conditional move
4275 will then compare that register against zero.
4276
4277 Set CMP_CODE to the code of the comparison instruction and
4278 *CODE to the code that the branch or move should use. */
4279 cmp_code = *code;
4280 *code = mips_reversed_fp_cond (&cmp_code) ? EQ : NE;
4281 *op0 = (ISA_HAS_8CC
4282 ? gen_reg_rtx (CCmode)
4283 : gen_rtx_REG (CCmode, FPSW_REGNUM));
4284 *op1 = const0_rtx;
4285 mips_emit_binary (cmp_code, *op0, cmp_op0, cmp_op1);
4286 }
4287 }
4288 \f
4289 /* Try performing the comparison in OPERANDS[1], whose arms are OPERANDS[2]
4290 and OPERAND[3]. Store the result in OPERANDS[0].
4291
4292 On 64-bit targets, the mode of the comparison and target will always be
4293 SImode, thus possibly narrower than that of the comparison's operands. */
4294
4295 void
4296 mips_expand_scc (rtx operands[])
4297 {
4298 rtx target = operands[0];
4299 enum rtx_code code = GET_CODE (operands[1]);
4300 rtx op0 = operands[2];
4301 rtx op1 = operands[3];
4302
4303 gcc_assert (GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT);
4304
4305 if (code == EQ || code == NE)
4306 {
4307 if (ISA_HAS_SEQ_SNE
4308 && reg_imm10_operand (op1, GET_MODE (op1)))
4309 mips_emit_binary (code, target, op0, op1);
4310 else
4311 {
4312 rtx zie = mips_zero_if_equal (op0, op1);
4313 mips_emit_binary (code, target, zie, const0_rtx);
4314 }
4315 }
4316 else
4317 mips_emit_int_order_test (code, 0, target, op0, op1);
4318 }
4319
4320 /* Compare OPERANDS[1] with OPERANDS[2] using comparison code
4321 CODE and jump to OPERANDS[3] if the condition holds. */
4322
4323 void
4324 mips_expand_conditional_branch (rtx *operands)
4325 {
4326 enum rtx_code code = GET_CODE (operands[0]);
4327 rtx op0 = operands[1];
4328 rtx op1 = operands[2];
4329 rtx condition;
4330
4331 mips_emit_compare (&code, &op0, &op1, TARGET_MIPS16);
4332 condition = gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
4333 emit_jump_insn (gen_condjump (condition, operands[3]));
4334 }
4335
4336 /* Implement:
4337
4338 (set temp (COND:CCV2 CMP_OP0 CMP_OP1))
4339 (set DEST (unspec [TRUE_SRC FALSE_SRC temp] UNSPEC_MOVE_TF_PS)) */
4340
4341 void
4342 mips_expand_vcondv2sf (rtx dest, rtx true_src, rtx false_src,
4343 enum rtx_code cond, rtx cmp_op0, rtx cmp_op1)
4344 {
4345 rtx cmp_result;
4346 bool reversed_p;
4347
4348 reversed_p = mips_reversed_fp_cond (&cond);
4349 cmp_result = gen_reg_rtx (CCV2mode);
4350 emit_insn (gen_scc_ps (cmp_result,
4351 gen_rtx_fmt_ee (cond, VOIDmode, cmp_op0, cmp_op1)));
4352 if (reversed_p)
4353 emit_insn (gen_mips_cond_move_tf_ps (dest, false_src, true_src,
4354 cmp_result));
4355 else
4356 emit_insn (gen_mips_cond_move_tf_ps (dest, true_src, false_src,
4357 cmp_result));
4358 }
4359
4360 /* Perform the comparison in OPERANDS[1]. Move OPERANDS[2] into OPERANDS[0]
4361 if the condition holds, otherwise move OPERANDS[3] into OPERANDS[0]. */
4362
4363 void
4364 mips_expand_conditional_move (rtx *operands)
4365 {
4366 rtx cond;
4367 enum rtx_code code = GET_CODE (operands[1]);
4368 rtx op0 = XEXP (operands[1], 0);
4369 rtx op1 = XEXP (operands[1], 1);
4370
4371 mips_emit_compare (&code, &op0, &op1, true);
4372 cond = gen_rtx_fmt_ee (code, GET_MODE (op0), op0, op1);
4373 emit_insn (gen_rtx_SET (VOIDmode, operands[0],
4374 gen_rtx_IF_THEN_ELSE (GET_MODE (operands[0]), cond,
4375 operands[2], operands[3])));
4376 }
4377
4378 /* Perform the comparison in COMPARISON, then trap if the condition holds. */
4379
4380 void
4381 mips_expand_conditional_trap (rtx comparison)
4382 {
4383 rtx op0, op1;
4384 enum machine_mode mode;
4385 enum rtx_code code;
4386
4387 /* MIPS conditional trap instructions don't have GT or LE flavors,
4388 so we must swap the operands and convert to LT and GE respectively. */
4389 code = GET_CODE (comparison);
4390 switch (code)
4391 {
4392 case GT:
4393 case LE:
4394 case GTU:
4395 case LEU:
4396 code = swap_condition (code);
4397 op0 = XEXP (comparison, 1);
4398 op1 = XEXP (comparison, 0);
4399 break;
4400
4401 default:
4402 op0 = XEXP (comparison, 0);
4403 op1 = XEXP (comparison, 1);
4404 break;
4405 }
4406
4407 mode = GET_MODE (XEXP (comparison, 0));
4408 op0 = force_reg (mode, op0);
4409 if (!arith_operand (op1, mode))
4410 op1 = force_reg (mode, op1);
4411
4412 emit_insn (gen_rtx_TRAP_IF (VOIDmode,
4413 gen_rtx_fmt_ee (code, mode, op0, op1),
4414 const0_rtx));
4415 }
4416 \f
4417 /* Initialize *CUM for a call to a function of type FNTYPE. */
4418
4419 void
4420 mips_init_cumulative_args (CUMULATIVE_ARGS *cum, tree fntype)
4421 {
4422 memset (cum, 0, sizeof (*cum));
4423 cum->prototype = (fntype && prototype_p (fntype));
4424 cum->gp_reg_found = (cum->prototype && stdarg_p (fntype));
4425 }
4426
4427 /* Fill INFO with information about a single argument. CUM is the
4428 cumulative state for earlier arguments. MODE is the mode of this
4429 argument and TYPE is its type (if known). NAMED is true if this
4430 is a named (fixed) argument rather than a variable one. */
4431
4432 static void
4433 mips_get_arg_info (struct mips_arg_info *info, const CUMULATIVE_ARGS *cum,
4434 enum machine_mode mode, tree type, int named)
4435 {
4436 bool doubleword_aligned_p;
4437 unsigned int num_bytes, num_words, max_regs;
4438
4439 /* Work out the size of the argument. */
4440 num_bytes = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
4441 num_words = (num_bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
4442
4443 /* Decide whether it should go in a floating-point register, assuming
4444 one is free. Later code checks for availability.
4445
4446 The checks against UNITS_PER_FPVALUE handle the soft-float and
4447 single-float cases. */
4448 switch (mips_abi)
4449 {
4450 case ABI_EABI:
4451 /* The EABI conventions have traditionally been defined in terms
4452 of TYPE_MODE, regardless of the actual type. */
4453 info->fpr_p = ((GET_MODE_CLASS (mode) == MODE_FLOAT
4454 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT)
4455 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
4456 break;
4457
4458 case ABI_32:
4459 case ABI_O64:
4460 /* Only leading floating-point scalars are passed in
4461 floating-point registers. We also handle vector floats the same
4462 say, which is OK because they are not covered by the standard ABI. */
4463 info->fpr_p = (!cum->gp_reg_found
4464 && cum->arg_number < 2
4465 && (type == 0
4466 || SCALAR_FLOAT_TYPE_P (type)
4467 || VECTOR_FLOAT_TYPE_P (type))
4468 && (GET_MODE_CLASS (mode) == MODE_FLOAT
4469 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT)
4470 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
4471 break;
4472
4473 case ABI_N32:
4474 case ABI_64:
4475 /* Scalar, complex and vector floating-point types are passed in
4476 floating-point registers, as long as this is a named rather
4477 than a variable argument. */
4478 info->fpr_p = (named
4479 && (type == 0 || FLOAT_TYPE_P (type))
4480 && (GET_MODE_CLASS (mode) == MODE_FLOAT
4481 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
4482 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT)
4483 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_FPVALUE);
4484
4485 /* ??? According to the ABI documentation, the real and imaginary
4486 parts of complex floats should be passed in individual registers.
4487 The real and imaginary parts of stack arguments are supposed
4488 to be contiguous and there should be an extra word of padding
4489 at the end.
4490
4491 This has two problems. First, it makes it impossible to use a
4492 single "void *" va_list type, since register and stack arguments
4493 are passed differently. (At the time of writing, MIPSpro cannot
4494 handle complex float varargs correctly.) Second, it's unclear
4495 what should happen when there is only one register free.
4496
4497 For now, we assume that named complex floats should go into FPRs
4498 if there are two FPRs free, otherwise they should be passed in the
4499 same way as a struct containing two floats. */
4500 if (info->fpr_p
4501 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
4502 && GET_MODE_UNIT_SIZE (mode) < UNITS_PER_FPVALUE)
4503 {
4504 if (cum->num_gprs >= MAX_ARGS_IN_REGISTERS - 1)
4505 info->fpr_p = false;
4506 else
4507 num_words = 2;
4508 }
4509 break;
4510
4511 default:
4512 gcc_unreachable ();
4513 }
4514
4515 /* See whether the argument has doubleword alignment. */
4516 doubleword_aligned_p = FUNCTION_ARG_BOUNDARY (mode, type) > BITS_PER_WORD;
4517
4518 /* Set REG_OFFSET to the register count we're interested in.
4519 The EABI allocates the floating-point registers separately,
4520 but the other ABIs allocate them like integer registers. */
4521 info->reg_offset = (mips_abi == ABI_EABI && info->fpr_p
4522 ? cum->num_fprs
4523 : cum->num_gprs);
4524
4525 /* Advance to an even register if the argument is doubleword-aligned. */
4526 if (doubleword_aligned_p)
4527 info->reg_offset += info->reg_offset & 1;
4528
4529 /* Work out the offset of a stack argument. */
4530 info->stack_offset = cum->stack_words;
4531 if (doubleword_aligned_p)
4532 info->stack_offset += info->stack_offset & 1;
4533
4534 max_regs = MAX_ARGS_IN_REGISTERS - info->reg_offset;
4535
4536 /* Partition the argument between registers and stack. */
4537 info->reg_words = MIN (num_words, max_regs);
4538 info->stack_words = num_words - info->reg_words;
4539 }
4540
4541 /* INFO describes a register argument that has the normal format for the
4542 argument's mode. Return the register it uses, assuming that FPRs are
4543 available if HARD_FLOAT_P. */
4544
4545 static unsigned int
4546 mips_arg_regno (const struct mips_arg_info *info, bool hard_float_p)
4547 {
4548 if (!info->fpr_p || !hard_float_p)
4549 return GP_ARG_FIRST + info->reg_offset;
4550 else if (mips_abi == ABI_32 && TARGET_DOUBLE_FLOAT && info->reg_offset > 0)
4551 /* In o32, the second argument is always passed in $f14
4552 for TARGET_DOUBLE_FLOAT, regardless of whether the
4553 first argument was a word or doubleword. */
4554 return FP_ARG_FIRST + 2;
4555 else
4556 return FP_ARG_FIRST + info->reg_offset;
4557 }
4558
4559 /* Implement TARGET_STRICT_ARGUMENT_NAMING. */
4560
4561 static bool
4562 mips_strict_argument_naming (CUMULATIVE_ARGS *ca ATTRIBUTE_UNUSED)
4563 {
4564 return !TARGET_OLDABI;
4565 }
4566
4567 /* Implement FUNCTION_ARG. */
4568
4569 rtx
4570 mips_function_arg (const CUMULATIVE_ARGS *cum, enum machine_mode mode,
4571 tree type, int named)
4572 {
4573 struct mips_arg_info info;
4574
4575 /* We will be called with a mode of VOIDmode after the last argument
4576 has been seen. Whatever we return will be passed to the call expander.
4577 If we need a MIPS16 fp_code, return a REG with the code stored as
4578 the mode. */
4579 if (mode == VOIDmode)
4580 {
4581 if (TARGET_MIPS16 && cum->fp_code != 0)
4582 return gen_rtx_REG ((enum machine_mode) cum->fp_code, 0);
4583 else
4584 return NULL;
4585 }
4586
4587 mips_get_arg_info (&info, cum, mode, type, named);
4588
4589 /* Return straight away if the whole argument is passed on the stack. */
4590 if (info.reg_offset == MAX_ARGS_IN_REGISTERS)
4591 return NULL;
4592
4593 /* The n32 and n64 ABIs say that if any 64-bit chunk of the structure
4594 contains a double in its entirety, then that 64-bit chunk is passed
4595 in a floating-point register. */
4596 if (TARGET_NEWABI
4597 && TARGET_HARD_FLOAT
4598 && named
4599 && type != 0
4600 && TREE_CODE (type) == RECORD_TYPE
4601 && TYPE_SIZE_UNIT (type)
4602 && host_integerp (TYPE_SIZE_UNIT (type), 1))
4603 {
4604 tree field;
4605
4606 /* First check to see if there is any such field. */
4607 for (field = TYPE_FIELDS (type); field; field = TREE_CHAIN (field))
4608 if (TREE_CODE (field) == FIELD_DECL
4609 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
4610 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD
4611 && host_integerp (bit_position (field), 0)
4612 && int_bit_position (field) % BITS_PER_WORD == 0)
4613 break;
4614
4615 if (field != 0)
4616 {
4617 /* Now handle the special case by returning a PARALLEL
4618 indicating where each 64-bit chunk goes. INFO.REG_WORDS
4619 chunks are passed in registers. */
4620 unsigned int i;
4621 HOST_WIDE_INT bitpos;
4622 rtx ret;
4623
4624 /* assign_parms checks the mode of ENTRY_PARM, so we must
4625 use the actual mode here. */
4626 ret = gen_rtx_PARALLEL (mode, rtvec_alloc (info.reg_words));
4627
4628 bitpos = 0;
4629 field = TYPE_FIELDS (type);
4630 for (i = 0; i < info.reg_words; i++)
4631 {
4632 rtx reg;
4633
4634 for (; field; field = TREE_CHAIN (field))
4635 if (TREE_CODE (field) == FIELD_DECL
4636 && int_bit_position (field) >= bitpos)
4637 break;
4638
4639 if (field
4640 && int_bit_position (field) == bitpos
4641 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
4642 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD)
4643 reg = gen_rtx_REG (DFmode, FP_ARG_FIRST + info.reg_offset + i);
4644 else
4645 reg = gen_rtx_REG (DImode, GP_ARG_FIRST + info.reg_offset + i);
4646
4647 XVECEXP (ret, 0, i)
4648 = gen_rtx_EXPR_LIST (VOIDmode, reg,
4649 GEN_INT (bitpos / BITS_PER_UNIT));
4650
4651 bitpos += BITS_PER_WORD;
4652 }
4653 return ret;
4654 }
4655 }
4656
4657 /* Handle the n32/n64 conventions for passing complex floating-point
4658 arguments in FPR pairs. The real part goes in the lower register
4659 and the imaginary part goes in the upper register. */
4660 if (TARGET_NEWABI
4661 && info.fpr_p
4662 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
4663 {
4664 rtx real, imag;
4665 enum machine_mode inner;
4666 unsigned int regno;
4667
4668 inner = GET_MODE_INNER (mode);
4669 regno = FP_ARG_FIRST + info.reg_offset;
4670 if (info.reg_words * UNITS_PER_WORD == GET_MODE_SIZE (inner))
4671 {
4672 /* Real part in registers, imaginary part on stack. */
4673 gcc_assert (info.stack_words == info.reg_words);
4674 return gen_rtx_REG (inner, regno);
4675 }
4676 else
4677 {
4678 gcc_assert (info.stack_words == 0);
4679 real = gen_rtx_EXPR_LIST (VOIDmode,
4680 gen_rtx_REG (inner, regno),
4681 const0_rtx);
4682 imag = gen_rtx_EXPR_LIST (VOIDmode,
4683 gen_rtx_REG (inner,
4684 regno + info.reg_words / 2),
4685 GEN_INT (GET_MODE_SIZE (inner)));
4686 return gen_rtx_PARALLEL (mode, gen_rtvec (2, real, imag));
4687 }
4688 }
4689
4690 return gen_rtx_REG (mode, mips_arg_regno (&info, TARGET_HARD_FLOAT));
4691 }
4692
4693 /* Implement FUNCTION_ARG_ADVANCE. */
4694
4695 void
4696 mips_function_arg_advance (CUMULATIVE_ARGS *cum, enum machine_mode mode,
4697 tree type, int named)
4698 {
4699 struct mips_arg_info info;
4700
4701 mips_get_arg_info (&info, cum, mode, type, named);
4702
4703 if (!info.fpr_p)
4704 cum->gp_reg_found = true;
4705
4706 /* See the comment above the CUMULATIVE_ARGS structure in mips.h for
4707 an explanation of what this code does. It assumes that we're using
4708 either the o32 or the o64 ABI, both of which pass at most 2 arguments
4709 in FPRs. */
4710 if (cum->arg_number < 2 && info.fpr_p)
4711 cum->fp_code += (mode == SFmode ? 1 : 2) << (cum->arg_number * 2);
4712
4713 /* Advance the register count. This has the effect of setting
4714 num_gprs to MAX_ARGS_IN_REGISTERS if a doubleword-aligned
4715 argument required us to skip the final GPR and pass the whole
4716 argument on the stack. */
4717 if (mips_abi != ABI_EABI || !info.fpr_p)
4718 cum->num_gprs = info.reg_offset + info.reg_words;
4719 else if (info.reg_words > 0)
4720 cum->num_fprs += MAX_FPRS_PER_FMT;
4721
4722 /* Advance the stack word count. */
4723 if (info.stack_words > 0)
4724 cum->stack_words = info.stack_offset + info.stack_words;
4725
4726 cum->arg_number++;
4727 }
4728
4729 /* Implement TARGET_ARG_PARTIAL_BYTES. */
4730
4731 static int
4732 mips_arg_partial_bytes (CUMULATIVE_ARGS *cum,
4733 enum machine_mode mode, tree type, bool named)
4734 {
4735 struct mips_arg_info info;
4736
4737 mips_get_arg_info (&info, cum, mode, type, named);
4738 return info.stack_words > 0 ? info.reg_words * UNITS_PER_WORD : 0;
4739 }
4740
4741 /* Implement FUNCTION_ARG_BOUNDARY. Every parameter gets at least
4742 PARM_BOUNDARY bits of alignment, but will be given anything up
4743 to STACK_BOUNDARY bits if the type requires it. */
4744
4745 int
4746 mips_function_arg_boundary (enum machine_mode mode, tree type)
4747 {
4748 unsigned int alignment;
4749
4750 alignment = type ? TYPE_ALIGN (type) : GET_MODE_ALIGNMENT (mode);
4751 if (alignment < PARM_BOUNDARY)
4752 alignment = PARM_BOUNDARY;
4753 if (alignment > STACK_BOUNDARY)
4754 alignment = STACK_BOUNDARY;
4755 return alignment;
4756 }
4757
4758 /* Return true if FUNCTION_ARG_PADDING (MODE, TYPE) should return
4759 upward rather than downward. In other words, return true if the
4760 first byte of the stack slot has useful data, false if the last
4761 byte does. */
4762
4763 bool
4764 mips_pad_arg_upward (enum machine_mode mode, const_tree type)
4765 {
4766 /* On little-endian targets, the first byte of every stack argument
4767 is passed in the first byte of the stack slot. */
4768 if (!BYTES_BIG_ENDIAN)
4769 return true;
4770
4771 /* Otherwise, integral types are padded downward: the last byte of a
4772 stack argument is passed in the last byte of the stack slot. */
4773 if (type != 0
4774 ? (INTEGRAL_TYPE_P (type)
4775 || POINTER_TYPE_P (type)
4776 || FIXED_POINT_TYPE_P (type))
4777 : (SCALAR_INT_MODE_P (mode)
4778 || ALL_SCALAR_FIXED_POINT_MODE_P (mode)))
4779 return false;
4780
4781 /* Big-endian o64 pads floating-point arguments downward. */
4782 if (mips_abi == ABI_O64)
4783 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
4784 return false;
4785
4786 /* Other types are padded upward for o32, o64, n32 and n64. */
4787 if (mips_abi != ABI_EABI)
4788 return true;
4789
4790 /* Arguments smaller than a stack slot are padded downward. */
4791 if (mode != BLKmode)
4792 return GET_MODE_BITSIZE (mode) >= PARM_BOUNDARY;
4793 else
4794 return int_size_in_bytes (type) >= (PARM_BOUNDARY / BITS_PER_UNIT);
4795 }
4796
4797 /* Likewise BLOCK_REG_PADDING (MODE, TYPE, ...). Return !BYTES_BIG_ENDIAN
4798 if the least significant byte of the register has useful data. Return
4799 the opposite if the most significant byte does. */
4800
4801 bool
4802 mips_pad_reg_upward (enum machine_mode mode, tree type)
4803 {
4804 /* No shifting is required for floating-point arguments. */
4805 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
4806 return !BYTES_BIG_ENDIAN;
4807
4808 /* Otherwise, apply the same padding to register arguments as we do
4809 to stack arguments. */
4810 return mips_pad_arg_upward (mode, type);
4811 }
4812
4813 /* Return nonzero when an argument must be passed by reference. */
4814
4815 static bool
4816 mips_pass_by_reference (CUMULATIVE_ARGS *cum ATTRIBUTE_UNUSED,
4817 enum machine_mode mode, const_tree type,
4818 bool named ATTRIBUTE_UNUSED)
4819 {
4820 if (mips_abi == ABI_EABI)
4821 {
4822 int size;
4823
4824 /* ??? How should SCmode be handled? */
4825 if (mode == DImode || mode == DFmode
4826 || mode == DQmode || mode == UDQmode
4827 || mode == DAmode || mode == UDAmode)
4828 return 0;
4829
4830 size = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
4831 return size == -1 || size > UNITS_PER_WORD;
4832 }
4833 else
4834 {
4835 /* If we have a variable-sized parameter, we have no choice. */
4836 return targetm.calls.must_pass_in_stack (mode, type);
4837 }
4838 }
4839
4840 /* Implement TARGET_CALLEE_COPIES. */
4841
4842 static bool
4843 mips_callee_copies (CUMULATIVE_ARGS *cum ATTRIBUTE_UNUSED,
4844 enum machine_mode mode ATTRIBUTE_UNUSED,
4845 const_tree type ATTRIBUTE_UNUSED, bool named)
4846 {
4847 return mips_abi == ABI_EABI && named;
4848 }
4849 \f
4850 /* See whether VALTYPE is a record whose fields should be returned in
4851 floating-point registers. If so, return the number of fields and
4852 list them in FIELDS (which should have two elements). Return 0
4853 otherwise.
4854
4855 For n32 & n64, a structure with one or two fields is returned in
4856 floating-point registers as long as every field has a floating-point
4857 type. */
4858
4859 static int
4860 mips_fpr_return_fields (const_tree valtype, tree *fields)
4861 {
4862 tree field;
4863 int i;
4864
4865 if (!TARGET_NEWABI)
4866 return 0;
4867
4868 if (TREE_CODE (valtype) != RECORD_TYPE)
4869 return 0;
4870
4871 i = 0;
4872 for (field = TYPE_FIELDS (valtype); field != 0; field = TREE_CHAIN (field))
4873 {
4874 if (TREE_CODE (field) != FIELD_DECL)
4875 continue;
4876
4877 if (!SCALAR_FLOAT_TYPE_P (TREE_TYPE (field)))
4878 return 0;
4879
4880 if (i == 2)
4881 return 0;
4882
4883 fields[i++] = field;
4884 }
4885 return i;
4886 }
4887
4888 /* Implement TARGET_RETURN_IN_MSB. For n32 & n64, we should return
4889 a value in the most significant part of $2/$3 if:
4890
4891 - the target is big-endian;
4892
4893 - the value has a structure or union type (we generalize this to
4894 cover aggregates from other languages too); and
4895
4896 - the structure is not returned in floating-point registers. */
4897
4898 static bool
4899 mips_return_in_msb (const_tree valtype)
4900 {
4901 tree fields[2];
4902
4903 return (TARGET_NEWABI
4904 && TARGET_BIG_ENDIAN
4905 && AGGREGATE_TYPE_P (valtype)
4906 && mips_fpr_return_fields (valtype, fields) == 0);
4907 }
4908
4909 /* Return true if the function return value MODE will get returned in a
4910 floating-point register. */
4911
4912 static bool
4913 mips_return_mode_in_fpr_p (enum machine_mode mode)
4914 {
4915 return ((GET_MODE_CLASS (mode) == MODE_FLOAT
4916 || GET_MODE_CLASS (mode) == MODE_VECTOR_FLOAT
4917 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
4918 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_HWFPVALUE);
4919 }
4920
4921 /* Return the representation of an FPR return register when the
4922 value being returned in FP_RETURN has mode VALUE_MODE and the
4923 return type itself has mode TYPE_MODE. On NewABI targets,
4924 the two modes may be different for structures like:
4925
4926 struct __attribute__((packed)) foo { float f; }
4927
4928 where we return the SFmode value of "f" in FP_RETURN, but where
4929 the structure itself has mode BLKmode. */
4930
4931 static rtx
4932 mips_return_fpr_single (enum machine_mode type_mode,
4933 enum machine_mode value_mode)
4934 {
4935 rtx x;
4936
4937 x = gen_rtx_REG (value_mode, FP_RETURN);
4938 if (type_mode != value_mode)
4939 {
4940 x = gen_rtx_EXPR_LIST (VOIDmode, x, const0_rtx);
4941 x = gen_rtx_PARALLEL (type_mode, gen_rtvec (1, x));
4942 }
4943 return x;
4944 }
4945
4946 /* Return a composite value in a pair of floating-point registers.
4947 MODE1 and OFFSET1 are the mode and byte offset for the first value,
4948 likewise MODE2 and OFFSET2 for the second. MODE is the mode of the
4949 complete value.
4950
4951 For n32 & n64, $f0 always holds the first value and $f2 the second.
4952 Otherwise the values are packed together as closely as possible. */
4953
4954 static rtx
4955 mips_return_fpr_pair (enum machine_mode mode,
4956 enum machine_mode mode1, HOST_WIDE_INT offset1,
4957 enum machine_mode mode2, HOST_WIDE_INT offset2)
4958 {
4959 int inc;
4960
4961 inc = (TARGET_NEWABI ? 2 : MAX_FPRS_PER_FMT);
4962 return gen_rtx_PARALLEL
4963 (mode,
4964 gen_rtvec (2,
4965 gen_rtx_EXPR_LIST (VOIDmode,
4966 gen_rtx_REG (mode1, FP_RETURN),
4967 GEN_INT (offset1)),
4968 gen_rtx_EXPR_LIST (VOIDmode,
4969 gen_rtx_REG (mode2, FP_RETURN + inc),
4970 GEN_INT (offset2))));
4971
4972 }
4973
4974 /* Implement FUNCTION_VALUE and LIBCALL_VALUE. For normal calls,
4975 VALTYPE is the return type and MODE is VOIDmode. For libcalls,
4976 VALTYPE is null and MODE is the mode of the return value. */
4977
4978 rtx
4979 mips_function_value (const_tree valtype, enum machine_mode mode)
4980 {
4981 if (valtype)
4982 {
4983 tree fields[2];
4984 int unsigned_p;
4985
4986 mode = TYPE_MODE (valtype);
4987 unsigned_p = TYPE_UNSIGNED (valtype);
4988
4989 /* Since TARGET_PROMOTE_FUNCTION_RETURN unconditionally returns true,
4990 we must promote the mode just as PROMOTE_MODE does. */
4991 mode = promote_mode (valtype, mode, &unsigned_p, 1);
4992
4993 /* Handle structures whose fields are returned in $f0/$f2. */
4994 switch (mips_fpr_return_fields (valtype, fields))
4995 {
4996 case 1:
4997 return mips_return_fpr_single (mode,
4998 TYPE_MODE (TREE_TYPE (fields[0])));
4999
5000 case 2:
5001 return mips_return_fpr_pair (mode,
5002 TYPE_MODE (TREE_TYPE (fields[0])),
5003 int_byte_position (fields[0]),
5004 TYPE_MODE (TREE_TYPE (fields[1])),
5005 int_byte_position (fields[1]));
5006 }
5007
5008 /* If a value is passed in the most significant part of a register, see
5009 whether we have to round the mode up to a whole number of words. */
5010 if (mips_return_in_msb (valtype))
5011 {
5012 HOST_WIDE_INT size = int_size_in_bytes (valtype);
5013 if (size % UNITS_PER_WORD != 0)
5014 {
5015 size += UNITS_PER_WORD - size % UNITS_PER_WORD;
5016 mode = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0);
5017 }
5018 }
5019
5020 /* For EABI, the class of return register depends entirely on MODE.
5021 For example, "struct { some_type x; }" and "union { some_type x; }"
5022 are returned in the same way as a bare "some_type" would be.
5023 Other ABIs only use FPRs for scalar, complex or vector types. */
5024 if (mips_abi != ABI_EABI && !FLOAT_TYPE_P (valtype))
5025 return gen_rtx_REG (mode, GP_RETURN);
5026 }
5027
5028 if (!TARGET_MIPS16)
5029 {
5030 /* Handle long doubles for n32 & n64. */
5031 if (mode == TFmode)
5032 return mips_return_fpr_pair (mode,
5033 DImode, 0,
5034 DImode, GET_MODE_SIZE (mode) / 2);
5035
5036 if (mips_return_mode_in_fpr_p (mode))
5037 {
5038 if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5039 return mips_return_fpr_pair (mode,
5040 GET_MODE_INNER (mode), 0,
5041 GET_MODE_INNER (mode),
5042 GET_MODE_SIZE (mode) / 2);
5043 else
5044 return gen_rtx_REG (mode, FP_RETURN);
5045 }
5046 }
5047
5048 return gen_rtx_REG (mode, GP_RETURN);
5049 }
5050
5051 /* Implement TARGET_RETURN_IN_MEMORY. Under the o32 and o64 ABIs,
5052 all BLKmode objects are returned in memory. Under the n32, n64
5053 and embedded ABIs, small structures are returned in a register.
5054 Objects with varying size must still be returned in memory, of
5055 course. */
5056
5057 static bool
5058 mips_return_in_memory (const_tree type, const_tree fndecl ATTRIBUTE_UNUSED)
5059 {
5060 return (TARGET_OLDABI
5061 ? TYPE_MODE (type) == BLKmode
5062 : !IN_RANGE (int_size_in_bytes (type), 0, 2 * UNITS_PER_WORD));
5063 }
5064 \f
5065 /* Implement TARGET_SETUP_INCOMING_VARARGS. */
5066
5067 static void
5068 mips_setup_incoming_varargs (CUMULATIVE_ARGS *cum, enum machine_mode mode,
5069 tree type, int *pretend_size ATTRIBUTE_UNUSED,
5070 int no_rtl)
5071 {
5072 CUMULATIVE_ARGS local_cum;
5073 int gp_saved, fp_saved;
5074
5075 /* The caller has advanced CUM up to, but not beyond, the last named
5076 argument. Advance a local copy of CUM past the last "real" named
5077 argument, to find out how many registers are left over. */
5078 local_cum = *cum;
5079 FUNCTION_ARG_ADVANCE (local_cum, mode, type, true);
5080
5081 /* Found out how many registers we need to save. */
5082 gp_saved = MAX_ARGS_IN_REGISTERS - local_cum.num_gprs;
5083 fp_saved = (EABI_FLOAT_VARARGS_P
5084 ? MAX_ARGS_IN_REGISTERS - local_cum.num_fprs
5085 : 0);
5086
5087 if (!no_rtl)
5088 {
5089 if (gp_saved > 0)
5090 {
5091 rtx ptr, mem;
5092
5093 ptr = plus_constant (virtual_incoming_args_rtx,
5094 REG_PARM_STACK_SPACE (cfun->decl)
5095 - gp_saved * UNITS_PER_WORD);
5096 mem = gen_frame_mem (BLKmode, ptr);
5097 set_mem_alias_set (mem, get_varargs_alias_set ());
5098
5099 move_block_from_reg (local_cum.num_gprs + GP_ARG_FIRST,
5100 mem, gp_saved);
5101 }
5102 if (fp_saved > 0)
5103 {
5104 /* We can't use move_block_from_reg, because it will use
5105 the wrong mode. */
5106 enum machine_mode mode;
5107 int off, i;
5108
5109 /* Set OFF to the offset from virtual_incoming_args_rtx of
5110 the first float register. The FP save area lies below
5111 the integer one, and is aligned to UNITS_PER_FPVALUE bytes. */
5112 off = (-gp_saved * UNITS_PER_WORD) & -UNITS_PER_FPVALUE;
5113 off -= fp_saved * UNITS_PER_FPREG;
5114
5115 mode = TARGET_SINGLE_FLOAT ? SFmode : DFmode;
5116
5117 for (i = local_cum.num_fprs; i < MAX_ARGS_IN_REGISTERS;
5118 i += MAX_FPRS_PER_FMT)
5119 {
5120 rtx ptr, mem;
5121
5122 ptr = plus_constant (virtual_incoming_args_rtx, off);
5123 mem = gen_frame_mem (mode, ptr);
5124 set_mem_alias_set (mem, get_varargs_alias_set ());
5125 mips_emit_move (mem, gen_rtx_REG (mode, FP_ARG_FIRST + i));
5126 off += UNITS_PER_HWFPVALUE;
5127 }
5128 }
5129 }
5130 if (REG_PARM_STACK_SPACE (cfun->decl) == 0)
5131 cfun->machine->varargs_size = (gp_saved * UNITS_PER_WORD
5132 + fp_saved * UNITS_PER_FPREG);
5133 }
5134
5135 /* Implement TARGET_BUILTIN_VA_LIST. */
5136
5137 static tree
5138 mips_build_builtin_va_list (void)
5139 {
5140 if (EABI_FLOAT_VARARGS_P)
5141 {
5142 /* We keep 3 pointers, and two offsets.
5143
5144 Two pointers are to the overflow area, which starts at the CFA.
5145 One of these is constant, for addressing into the GPR save area
5146 below it. The other is advanced up the stack through the
5147 overflow region.
5148
5149 The third pointer is to the bottom of the GPR save area.
5150 Since the FPR save area is just below it, we can address
5151 FPR slots off this pointer.
5152
5153 We also keep two one-byte offsets, which are to be subtracted
5154 from the constant pointers to yield addresses in the GPR and
5155 FPR save areas. These are downcounted as float or non-float
5156 arguments are used, and when they get to zero, the argument
5157 must be obtained from the overflow region. */
5158 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff, f_res, record;
5159 tree array, index;
5160
5161 record = lang_hooks.types.make_type (RECORD_TYPE);
5162
5163 f_ovfl = build_decl (FIELD_DECL, get_identifier ("__overflow_argptr"),
5164 ptr_type_node);
5165 f_gtop = build_decl (FIELD_DECL, get_identifier ("__gpr_top"),
5166 ptr_type_node);
5167 f_ftop = build_decl (FIELD_DECL, get_identifier ("__fpr_top"),
5168 ptr_type_node);
5169 f_goff = build_decl (FIELD_DECL, get_identifier ("__gpr_offset"),
5170 unsigned_char_type_node);
5171 f_foff = build_decl (FIELD_DECL, get_identifier ("__fpr_offset"),
5172 unsigned_char_type_node);
5173 /* Explicitly pad to the size of a pointer, so that -Wpadded won't
5174 warn on every user file. */
5175 index = build_int_cst (NULL_TREE, GET_MODE_SIZE (ptr_mode) - 2 - 1);
5176 array = build_array_type (unsigned_char_type_node,
5177 build_index_type (index));
5178 f_res = build_decl (FIELD_DECL, get_identifier ("__reserved"), array);
5179
5180 DECL_FIELD_CONTEXT (f_ovfl) = record;
5181 DECL_FIELD_CONTEXT (f_gtop) = record;
5182 DECL_FIELD_CONTEXT (f_ftop) = record;
5183 DECL_FIELD_CONTEXT (f_goff) = record;
5184 DECL_FIELD_CONTEXT (f_foff) = record;
5185 DECL_FIELD_CONTEXT (f_res) = record;
5186
5187 TYPE_FIELDS (record) = f_ovfl;
5188 TREE_CHAIN (f_ovfl) = f_gtop;
5189 TREE_CHAIN (f_gtop) = f_ftop;
5190 TREE_CHAIN (f_ftop) = f_goff;
5191 TREE_CHAIN (f_goff) = f_foff;
5192 TREE_CHAIN (f_foff) = f_res;
5193
5194 layout_type (record);
5195 return record;
5196 }
5197 else if (TARGET_IRIX && TARGET_IRIX6)
5198 /* On IRIX 6, this type is 'char *'. */
5199 return build_pointer_type (char_type_node);
5200 else
5201 /* Otherwise, we use 'void *'. */
5202 return ptr_type_node;
5203 }
5204
5205 /* Implement TARGET_EXPAND_BUILTIN_VA_START. */
5206
5207 static void
5208 mips_va_start (tree valist, rtx nextarg)
5209 {
5210 if (EABI_FLOAT_VARARGS_P)
5211 {
5212 const CUMULATIVE_ARGS *cum;
5213 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
5214 tree ovfl, gtop, ftop, goff, foff;
5215 tree t;
5216 int gpr_save_area_size;
5217 int fpr_save_area_size;
5218 int fpr_offset;
5219
5220 cum = &crtl->args.info;
5221 gpr_save_area_size
5222 = (MAX_ARGS_IN_REGISTERS - cum->num_gprs) * UNITS_PER_WORD;
5223 fpr_save_area_size
5224 = (MAX_ARGS_IN_REGISTERS - cum->num_fprs) * UNITS_PER_FPREG;
5225
5226 f_ovfl = TYPE_FIELDS (va_list_type_node);
5227 f_gtop = TREE_CHAIN (f_ovfl);
5228 f_ftop = TREE_CHAIN (f_gtop);
5229 f_goff = TREE_CHAIN (f_ftop);
5230 f_foff = TREE_CHAIN (f_goff);
5231
5232 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
5233 NULL_TREE);
5234 gtop = build3 (COMPONENT_REF, TREE_TYPE (f_gtop), valist, f_gtop,
5235 NULL_TREE);
5236 ftop = build3 (COMPONENT_REF, TREE_TYPE (f_ftop), valist, f_ftop,
5237 NULL_TREE);
5238 goff = build3 (COMPONENT_REF, TREE_TYPE (f_goff), valist, f_goff,
5239 NULL_TREE);
5240 foff = build3 (COMPONENT_REF, TREE_TYPE (f_foff), valist, f_foff,
5241 NULL_TREE);
5242
5243 /* Emit code to initialize OVFL, which points to the next varargs
5244 stack argument. CUM->STACK_WORDS gives the number of stack
5245 words used by named arguments. */
5246 t = make_tree (TREE_TYPE (ovfl), virtual_incoming_args_rtx);
5247 if (cum->stack_words > 0)
5248 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ovfl), t,
5249 size_int (cum->stack_words * UNITS_PER_WORD));
5250 t = build2 (MODIFY_EXPR, TREE_TYPE (ovfl), ovfl, t);
5251 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5252
5253 /* Emit code to initialize GTOP, the top of the GPR save area. */
5254 t = make_tree (TREE_TYPE (gtop), virtual_incoming_args_rtx);
5255 t = build2 (MODIFY_EXPR, TREE_TYPE (gtop), gtop, t);
5256 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5257
5258 /* Emit code to initialize FTOP, the top of the FPR save area.
5259 This address is gpr_save_area_bytes below GTOP, rounded
5260 down to the next fp-aligned boundary. */
5261 t = make_tree (TREE_TYPE (ftop), virtual_incoming_args_rtx);
5262 fpr_offset = gpr_save_area_size + UNITS_PER_FPVALUE - 1;
5263 fpr_offset &= -UNITS_PER_FPVALUE;
5264 if (fpr_offset)
5265 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ftop), t,
5266 size_int (-fpr_offset));
5267 t = build2 (MODIFY_EXPR, TREE_TYPE (ftop), ftop, t);
5268 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5269
5270 /* Emit code to initialize GOFF, the offset from GTOP of the
5271 next GPR argument. */
5272 t = build2 (MODIFY_EXPR, TREE_TYPE (goff), goff,
5273 build_int_cst (TREE_TYPE (goff), gpr_save_area_size));
5274 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5275
5276 /* Likewise emit code to initialize FOFF, the offset from FTOP
5277 of the next FPR argument. */
5278 t = build2 (MODIFY_EXPR, TREE_TYPE (foff), foff,
5279 build_int_cst (TREE_TYPE (foff), fpr_save_area_size));
5280 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5281 }
5282 else
5283 {
5284 nextarg = plus_constant (nextarg, -cfun->machine->varargs_size);
5285 std_expand_builtin_va_start (valist, nextarg);
5286 }
5287 }
5288
5289 /* Implement TARGET_GIMPLIFY_VA_ARG_EXPR. */
5290
5291 static tree
5292 mips_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p,
5293 gimple_seq *post_p)
5294 {
5295 tree addr;
5296 bool indirect_p;
5297
5298 indirect_p = pass_by_reference (NULL, TYPE_MODE (type), type, 0);
5299 if (indirect_p)
5300 type = build_pointer_type (type);
5301
5302 if (!EABI_FLOAT_VARARGS_P)
5303 addr = std_gimplify_va_arg_expr (valist, type, pre_p, post_p);
5304 else
5305 {
5306 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
5307 tree ovfl, top, off, align;
5308 HOST_WIDE_INT size, rsize, osize;
5309 tree t, u;
5310
5311 f_ovfl = TYPE_FIELDS (va_list_type_node);
5312 f_gtop = TREE_CHAIN (f_ovfl);
5313 f_ftop = TREE_CHAIN (f_gtop);
5314 f_goff = TREE_CHAIN (f_ftop);
5315 f_foff = TREE_CHAIN (f_goff);
5316
5317 /* Let:
5318
5319 TOP be the top of the GPR or FPR save area;
5320 OFF be the offset from TOP of the next register;
5321 ADDR_RTX be the address of the argument;
5322 SIZE be the number of bytes in the argument type;
5323 RSIZE be the number of bytes used to store the argument
5324 when it's in the register save area; and
5325 OSIZE be the number of bytes used to store it when it's
5326 in the stack overflow area.
5327
5328 The code we want is:
5329
5330 1: off &= -rsize; // round down
5331 2: if (off != 0)
5332 3: {
5333 4: addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0);
5334 5: off -= rsize;
5335 6: }
5336 7: else
5337 8: {
5338 9: ovfl = ((intptr_t) ovfl + osize - 1) & -osize;
5339 10: addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0);
5340 11: ovfl += osize;
5341 14: }
5342
5343 [1] and [9] can sometimes be optimized away. */
5344
5345 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
5346 NULL_TREE);
5347 size = int_size_in_bytes (type);
5348
5349 if (GET_MODE_CLASS (TYPE_MODE (type)) == MODE_FLOAT
5350 && GET_MODE_SIZE (TYPE_MODE (type)) <= UNITS_PER_FPVALUE)
5351 {
5352 top = build3 (COMPONENT_REF, TREE_TYPE (f_ftop),
5353 unshare_expr (valist), f_ftop, NULL_TREE);
5354 off = build3 (COMPONENT_REF, TREE_TYPE (f_foff),
5355 unshare_expr (valist), f_foff, NULL_TREE);
5356
5357 /* When va_start saves FPR arguments to the stack, each slot
5358 takes up UNITS_PER_HWFPVALUE bytes, regardless of the
5359 argument's precision. */
5360 rsize = UNITS_PER_HWFPVALUE;
5361
5362 /* Overflow arguments are padded to UNITS_PER_WORD bytes
5363 (= PARM_BOUNDARY bits). This can be different from RSIZE
5364 in two cases:
5365
5366 (1) On 32-bit targets when TYPE is a structure such as:
5367
5368 struct s { float f; };
5369
5370 Such structures are passed in paired FPRs, so RSIZE
5371 will be 8 bytes. However, the structure only takes
5372 up 4 bytes of memory, so OSIZE will only be 4.
5373
5374 (2) In combinations such as -mgp64 -msingle-float
5375 -fshort-double. Doubles passed in registers will then take
5376 up 4 (UNITS_PER_HWFPVALUE) bytes, but those passed on the
5377 stack take up UNITS_PER_WORD bytes. */
5378 osize = MAX (GET_MODE_SIZE (TYPE_MODE (type)), UNITS_PER_WORD);
5379 }
5380 else
5381 {
5382 top = build3 (COMPONENT_REF, TREE_TYPE (f_gtop),
5383 unshare_expr (valist), f_gtop, NULL_TREE);
5384 off = build3 (COMPONENT_REF, TREE_TYPE (f_goff),
5385 unshare_expr (valist), f_goff, NULL_TREE);
5386 rsize = (size + UNITS_PER_WORD - 1) & -UNITS_PER_WORD;
5387 if (rsize > UNITS_PER_WORD)
5388 {
5389 /* [1] Emit code for: off &= -rsize. */
5390 t = build2 (BIT_AND_EXPR, TREE_TYPE (off), unshare_expr (off),
5391 build_int_cst (TREE_TYPE (off), -rsize));
5392 gimplify_assign (unshare_expr (off), t, pre_p);
5393 }
5394 osize = rsize;
5395 }
5396
5397 /* [2] Emit code to branch if off == 0. */
5398 t = build2 (NE_EXPR, boolean_type_node, off,
5399 build_int_cst (TREE_TYPE (off), 0));
5400 addr = build3 (COND_EXPR, ptr_type_node, t, NULL_TREE, NULL_TREE);
5401
5402 /* [5] Emit code for: off -= rsize. We do this as a form of
5403 post-decrement not available to C. */
5404 t = fold_convert (TREE_TYPE (off), build_int_cst (NULL_TREE, rsize));
5405 t = build2 (POSTDECREMENT_EXPR, TREE_TYPE (off), off, t);
5406
5407 /* [4] Emit code for:
5408 addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0). */
5409 t = fold_convert (sizetype, t);
5410 t = fold_build1 (NEGATE_EXPR, sizetype, t);
5411 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (top), top, t);
5412 if (BYTES_BIG_ENDIAN && rsize > size)
5413 {
5414 u = size_int (rsize - size);
5415 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (t), t, u);
5416 }
5417 COND_EXPR_THEN (addr) = t;
5418
5419 if (osize > UNITS_PER_WORD)
5420 {
5421 /* [9] Emit: ovfl = ((intptr_t) ovfl + osize - 1) & -osize. */
5422 u = size_int (osize - 1);
5423 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (ovfl),
5424 unshare_expr (ovfl), u);
5425 t = fold_convert (sizetype, t);
5426 u = size_int (-osize);
5427 t = build2 (BIT_AND_EXPR, sizetype, t, u);
5428 t = fold_convert (TREE_TYPE (ovfl), t);
5429 align = build2 (MODIFY_EXPR, TREE_TYPE (ovfl),
5430 unshare_expr (ovfl), t);
5431 }
5432 else
5433 align = NULL;
5434
5435 /* [10, 11] Emit code for:
5436 addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0)
5437 ovfl += osize. */
5438 u = fold_convert (TREE_TYPE (ovfl), build_int_cst (NULL_TREE, osize));
5439 t = build2 (POSTINCREMENT_EXPR, TREE_TYPE (ovfl), ovfl, u);
5440 if (BYTES_BIG_ENDIAN && osize > size)
5441 {
5442 u = size_int (osize - size);
5443 t = build2 (POINTER_PLUS_EXPR, TREE_TYPE (t), t, u);
5444 }
5445
5446 /* String [9] and [10, 11] together. */
5447 if (align)
5448 t = build2 (COMPOUND_EXPR, TREE_TYPE (t), align, t);
5449 COND_EXPR_ELSE (addr) = t;
5450
5451 addr = fold_convert (build_pointer_type (type), addr);
5452 addr = build_va_arg_indirect_ref (addr);
5453 }
5454
5455 if (indirect_p)
5456 addr = build_va_arg_indirect_ref (addr);
5457
5458 return addr;
5459 }
5460 \f
5461 /* Start a definition of function NAME. MIPS16_P indicates whether the
5462 function contains MIPS16 code. */
5463
5464 static void
5465 mips_start_function_definition (const char *name, bool mips16_p)
5466 {
5467 if (mips16_p)
5468 fprintf (asm_out_file, "\t.set\tmips16\n");
5469 else
5470 fprintf (asm_out_file, "\t.set\tnomips16\n");
5471
5472 if (!flag_inhibit_size_directive)
5473 {
5474 fputs ("\t.ent\t", asm_out_file);
5475 assemble_name (asm_out_file, name);
5476 fputs ("\n", asm_out_file);
5477 }
5478
5479 ASM_OUTPUT_TYPE_DIRECTIVE (asm_out_file, name, "function");
5480
5481 /* Start the definition proper. */
5482 assemble_name (asm_out_file, name);
5483 fputs (":\n", asm_out_file);
5484 }
5485
5486 /* End a function definition started by mips_start_function_definition. */
5487
5488 static void
5489 mips_end_function_definition (const char *name)
5490 {
5491 if (!flag_inhibit_size_directive)
5492 {
5493 fputs ("\t.end\t", asm_out_file);
5494 assemble_name (asm_out_file, name);
5495 fputs ("\n", asm_out_file);
5496 }
5497 }
5498 \f
5499 /* Return true if calls to X can use R_MIPS_CALL* relocations. */
5500
5501 static bool
5502 mips_ok_for_lazy_binding_p (rtx x)
5503 {
5504 return (TARGET_USE_GOT
5505 && GET_CODE (x) == SYMBOL_REF
5506 && !SYMBOL_REF_BIND_NOW_P (x)
5507 && !mips_symbol_binds_local_p (x));
5508 }
5509
5510 /* Load function address ADDR into register DEST. TYPE is as for
5511 mips_expand_call. Return true if we used an explicit lazy-binding
5512 sequence. */
5513
5514 static bool
5515 mips_load_call_address (enum mips_call_type type, rtx dest, rtx addr)
5516 {
5517 /* If we're generating PIC, and this call is to a global function,
5518 try to allow its address to be resolved lazily. This isn't
5519 possible for sibcalls when $gp is call-saved because the value
5520 of $gp on entry to the stub would be our caller's gp, not ours. */
5521 if (TARGET_EXPLICIT_RELOCS
5522 && !(type == MIPS_CALL_SIBCALL && TARGET_CALL_SAVED_GP)
5523 && mips_ok_for_lazy_binding_p (addr))
5524 {
5525 addr = mips_got_load (dest, addr, SYMBOL_GOTOFF_CALL);
5526 emit_insn (gen_rtx_SET (VOIDmode, dest, addr));
5527 return true;
5528 }
5529 else
5530 {
5531 mips_emit_move (dest, addr);
5532 return false;
5533 }
5534 }
5535 \f
5536 /* Each locally-defined hard-float MIPS16 function has a local symbol
5537 associated with it. This hash table maps the function symbol (FUNC)
5538 to the local symbol (LOCAL). */
5539 struct GTY(()) mips16_local_alias {
5540 rtx func;
5541 rtx local;
5542 };
5543 static GTY ((param_is (struct mips16_local_alias))) htab_t mips16_local_aliases;
5544
5545 /* Hash table callbacks for mips16_local_aliases. */
5546
5547 static hashval_t
5548 mips16_local_aliases_hash (const void *entry)
5549 {
5550 const struct mips16_local_alias *alias;
5551
5552 alias = (const struct mips16_local_alias *) entry;
5553 return htab_hash_string (XSTR (alias->func, 0));
5554 }
5555
5556 static int
5557 mips16_local_aliases_eq (const void *entry1, const void *entry2)
5558 {
5559 const struct mips16_local_alias *alias1, *alias2;
5560
5561 alias1 = (const struct mips16_local_alias *) entry1;
5562 alias2 = (const struct mips16_local_alias *) entry2;
5563 return rtx_equal_p (alias1->func, alias2->func);
5564 }
5565
5566 /* FUNC is the symbol for a locally-defined hard-float MIPS16 function.
5567 Return a local alias for it, creating a new one if necessary. */
5568
5569 static rtx
5570 mips16_local_alias (rtx func)
5571 {
5572 struct mips16_local_alias *alias, tmp_alias;
5573 void **slot;
5574
5575 /* Create the hash table if this is the first call. */
5576 if (mips16_local_aliases == NULL)
5577 mips16_local_aliases = htab_create_ggc (37, mips16_local_aliases_hash,
5578 mips16_local_aliases_eq, NULL);
5579
5580 /* Look up the function symbol, creating a new entry if need be. */
5581 tmp_alias.func = func;
5582 slot = htab_find_slot (mips16_local_aliases, &tmp_alias, INSERT);
5583 gcc_assert (slot != NULL);
5584
5585 alias = (struct mips16_local_alias *) *slot;
5586 if (alias == NULL)
5587 {
5588 const char *func_name, *local_name;
5589 rtx local;
5590
5591 /* Create a new SYMBOL_REF for the local symbol. The choice of
5592 __fn_local_* is based on the __fn_stub_* names that we've
5593 traditionally used for the non-MIPS16 stub. */
5594 func_name = targetm.strip_name_encoding (XSTR (func, 0));
5595 local_name = ACONCAT (("__fn_local_", func_name, NULL));
5596 local = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (local_name));
5597 SYMBOL_REF_FLAGS (local) = SYMBOL_REF_FLAGS (func) | SYMBOL_FLAG_LOCAL;
5598
5599 /* Create a new structure to represent the mapping. */
5600 alias = GGC_NEW (struct mips16_local_alias);
5601 alias->func = func;
5602 alias->local = local;
5603 *slot = alias;
5604 }
5605 return alias->local;
5606 }
5607 \f
5608 /* A chained list of functions for which mips16_build_call_stub has already
5609 generated a stub. NAME is the name of the function and FP_RET_P is true
5610 if the function returns a value in floating-point registers. */
5611 struct mips16_stub {
5612 struct mips16_stub *next;
5613 char *name;
5614 bool fp_ret_p;
5615 };
5616 static struct mips16_stub *mips16_stubs;
5617
5618 /* Return a SYMBOL_REF for a MIPS16 function called NAME. */
5619
5620 static rtx
5621 mips16_stub_function (const char *name)
5622 {
5623 rtx x;
5624
5625 x = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (name));
5626 SYMBOL_REF_FLAGS (x) |= (SYMBOL_FLAG_EXTERNAL | SYMBOL_FLAG_FUNCTION);
5627 return x;
5628 }
5629
5630 /* Return the two-character string that identifies floating-point
5631 return mode MODE in the name of a MIPS16 function stub. */
5632
5633 static const char *
5634 mips16_call_stub_mode_suffix (enum machine_mode mode)
5635 {
5636 if (mode == SFmode)
5637 return "sf";
5638 else if (mode == DFmode)
5639 return "df";
5640 else if (mode == SCmode)
5641 return "sc";
5642 else if (mode == DCmode)
5643 return "dc";
5644 else if (mode == V2SFmode)
5645 return "df";
5646 else
5647 gcc_unreachable ();
5648 }
5649
5650 /* Write instructions to move a 32-bit value between general register
5651 GPREG and floating-point register FPREG. DIRECTION is 't' to move
5652 from GPREG to FPREG and 'f' to move in the opposite direction. */
5653
5654 static void
5655 mips_output_32bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
5656 {
5657 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
5658 reg_names[gpreg], reg_names[fpreg]);
5659 }
5660
5661 /* Likewise for 64-bit values. */
5662
5663 static void
5664 mips_output_64bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
5665 {
5666 if (TARGET_64BIT)
5667 fprintf (asm_out_file, "\tdm%cc1\t%s,%s\n", direction,
5668 reg_names[gpreg], reg_names[fpreg]);
5669 else if (TARGET_FLOAT64)
5670 {
5671 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
5672 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
5673 fprintf (asm_out_file, "\tm%chc1\t%s,%s\n", direction,
5674 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg]);
5675 }
5676 else
5677 {
5678 /* Move the least-significant word. */
5679 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
5680 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
5681 /* ...then the most significant word. */
5682 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
5683 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg + 1]);
5684 }
5685 }
5686
5687 /* Write out code to move floating-point arguments into or out of
5688 general registers. FP_CODE is the code describing which arguments
5689 are present (see the comment above the definition of CUMULATIVE_ARGS
5690 in mips.h). DIRECTION is as for mips_output_32bit_xfer. */
5691
5692 static void
5693 mips_output_args_xfer (int fp_code, char direction)
5694 {
5695 unsigned int gparg, fparg, f;
5696 CUMULATIVE_ARGS cum;
5697
5698 /* This code only works for o32 and o64. */
5699 gcc_assert (TARGET_OLDABI);
5700
5701 mips_init_cumulative_args (&cum, NULL);
5702
5703 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
5704 {
5705 enum machine_mode mode;
5706 struct mips_arg_info info;
5707
5708 if ((f & 3) == 1)
5709 mode = SFmode;
5710 else if ((f & 3) == 2)
5711 mode = DFmode;
5712 else
5713 gcc_unreachable ();
5714
5715 mips_get_arg_info (&info, &cum, mode, NULL, true);
5716 gparg = mips_arg_regno (&info, false);
5717 fparg = mips_arg_regno (&info, true);
5718
5719 if (mode == SFmode)
5720 mips_output_32bit_xfer (direction, gparg, fparg);
5721 else
5722 mips_output_64bit_xfer (direction, gparg, fparg);
5723
5724 mips_function_arg_advance (&cum, mode, NULL, true);
5725 }
5726 }
5727
5728 /* Write a MIPS16 stub for the current function. This stub is used
5729 for functions which take arguments in the floating-point registers.
5730 It is normal-mode code that moves the floating-point arguments
5731 into the general registers and then jumps to the MIPS16 code. */
5732
5733 static void
5734 mips16_build_function_stub (void)
5735 {
5736 const char *fnname, *alias_name, *separator;
5737 char *secname, *stubname;
5738 tree stubdecl;
5739 unsigned int f;
5740 rtx symbol, alias;
5741
5742 /* Create the name of the stub, and its unique section. */
5743 symbol = XEXP (DECL_RTL (current_function_decl), 0);
5744 alias = mips16_local_alias (symbol);
5745
5746 fnname = targetm.strip_name_encoding (XSTR (symbol, 0));
5747 alias_name = targetm.strip_name_encoding (XSTR (alias, 0));
5748 secname = ACONCAT ((".mips16.fn.", fnname, NULL));
5749 stubname = ACONCAT (("__fn_stub_", fnname, NULL));
5750
5751 /* Build a decl for the stub. */
5752 stubdecl = build_decl (FUNCTION_DECL, get_identifier (stubname),
5753 build_function_type (void_type_node, NULL_TREE));
5754 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname);
5755 DECL_RESULT (stubdecl) = build_decl (RESULT_DECL, NULL_TREE, void_type_node);
5756
5757 /* Output a comment. */
5758 fprintf (asm_out_file, "\t# Stub function for %s (",
5759 current_function_name ());
5760 separator = "";
5761 for (f = (unsigned int) crtl->args.info.fp_code; f != 0; f >>= 2)
5762 {
5763 fprintf (asm_out_file, "%s%s", separator,
5764 (f & 3) == 1 ? "float" : "double");
5765 separator = ", ";
5766 }
5767 fprintf (asm_out_file, ")\n");
5768
5769 /* Start the function definition. */
5770 assemble_start_function (stubdecl, stubname);
5771 mips_start_function_definition (stubname, false);
5772
5773 /* If generating pic2 code, either set up the global pointer or
5774 switch to pic0. */
5775 if (TARGET_ABICALLS_PIC2)
5776 {
5777 if (TARGET_ABSOLUTE_ABICALLS)
5778 fprintf (asm_out_file, "\t.option\tpic0\n");
5779 else
5780 {
5781 output_asm_insn ("%(.cpload\t%^%)", NULL);
5782 /* Emit an R_MIPS_NONE relocation to tell the linker what the
5783 target function is. Use a local GOT access when loading the
5784 symbol, to cut down on the number of unnecessary GOT entries
5785 for stubs that aren't needed. */
5786 output_asm_insn (".reloc\t0,R_MIPS_NONE,%0", &symbol);
5787 symbol = alias;
5788 }
5789 }
5790
5791 /* Load the address of the MIPS16 function into $25. Do this first so
5792 that targets with coprocessor interlocks can use an MFC1 to fill the
5793 delay slot. */
5794 output_asm_insn ("la\t%^,%0", &symbol);
5795
5796 /* Move the arguments from floating-point registers to general registers. */
5797 mips_output_args_xfer (crtl->args.info.fp_code, 'f');
5798
5799 /* Jump to the MIPS16 function. */
5800 output_asm_insn ("jr\t%^", NULL);
5801
5802 if (TARGET_ABICALLS_PIC2 && TARGET_ABSOLUTE_ABICALLS)
5803 fprintf (asm_out_file, "\t.option\tpic2\n");
5804
5805 mips_end_function_definition (stubname);
5806
5807 /* If the linker needs to create a dynamic symbol for the target
5808 function, it will associate the symbol with the stub (which,
5809 unlike the target function, follows the proper calling conventions).
5810 It is therefore useful to have a local alias for the target function,
5811 so that it can still be identified as MIPS16 code. As an optimization,
5812 this symbol can also be used for indirect MIPS16 references from
5813 within this file. */
5814 ASM_OUTPUT_DEF (asm_out_file, alias_name, fnname);
5815
5816 switch_to_section (function_section (current_function_decl));
5817 }
5818
5819 /* The current function is a MIPS16 function that returns a value in an FPR.
5820 Copy the return value from its soft-float to its hard-float location.
5821 libgcc2 has special non-MIPS16 helper functions for each case. */
5822
5823 static void
5824 mips16_copy_fpr_return_value (void)
5825 {
5826 rtx fn, insn, retval;
5827 tree return_type;
5828 enum machine_mode return_mode;
5829 const char *name;
5830
5831 return_type = DECL_RESULT (current_function_decl);
5832 return_mode = DECL_MODE (return_type);
5833
5834 name = ACONCAT (("__mips16_ret_",
5835 mips16_call_stub_mode_suffix (return_mode),
5836 NULL));
5837 fn = mips16_stub_function (name);
5838
5839 /* The function takes arguments in $2 (and possibly $3), so calls
5840 to it cannot be lazily bound. */
5841 SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_BIND_NOW;
5842
5843 /* Model the call as something that takes the GPR return value as
5844 argument and returns an "updated" value. */
5845 retval = gen_rtx_REG (return_mode, GP_RETURN);
5846 insn = mips_expand_call (MIPS_CALL_EPILOGUE, retval, fn,
5847 const0_rtx, NULL_RTX, false);
5848 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), retval);
5849 }
5850
5851 /* Consider building a stub for a MIPS16 call to function *FN_PTR.
5852 RETVAL is the location of the return value, or null if this is
5853 a "call" rather than a "call_value". ARGS_SIZE is the size of the
5854 arguments and FP_CODE is the code built by mips_function_arg;
5855 see the comment above CUMULATIVE_ARGS for details.
5856
5857 There are three alternatives:
5858
5859 - If a stub was needed, emit the call and return the call insn itself.
5860
5861 - If we can avoid using a stub by redirecting the call, set *FN_PTR
5862 to the new target and return null.
5863
5864 - If *FN_PTR doesn't need a stub, return null and leave *FN_PTR
5865 unmodified.
5866
5867 A stub is needed for calls to functions that, in normal mode,
5868 receive arguments in FPRs or return values in FPRs. The stub
5869 copies the arguments from their soft-float positions to their
5870 hard-float positions, calls the real function, then copies the
5871 return value from its hard-float position to its soft-float
5872 position.
5873
5874 We can emit a JAL to *FN_PTR even when *FN_PTR might need a stub.
5875 If *FN_PTR turns out to be to a non-MIPS16 function, the linker
5876 automatically redirects the JAL to the stub, otherwise the JAL
5877 continues to call FN directly. */
5878
5879 static rtx
5880 mips16_build_call_stub (rtx retval, rtx *fn_ptr, rtx args_size, int fp_code)
5881 {
5882 const char *fnname;
5883 bool fp_ret_p;
5884 struct mips16_stub *l;
5885 rtx insn, fn;
5886
5887 /* We don't need to do anything if we aren't in MIPS16 mode, or if
5888 we were invoked with the -msoft-float option. */
5889 if (!TARGET_MIPS16 || TARGET_SOFT_FLOAT_ABI)
5890 return NULL_RTX;
5891
5892 /* Figure out whether the value might come back in a floating-point
5893 register. */
5894 fp_ret_p = retval && mips_return_mode_in_fpr_p (GET_MODE (retval));
5895
5896 /* We don't need to do anything if there were no floating-point
5897 arguments and the value will not be returned in a floating-point
5898 register. */
5899 if (fp_code == 0 && !fp_ret_p)
5900 return NULL_RTX;
5901
5902 /* We don't need to do anything if this is a call to a special
5903 MIPS16 support function. */
5904 fn = *fn_ptr;
5905 if (mips16_stub_function_p (fn))
5906 return NULL_RTX;
5907
5908 /* This code will only work for o32 and o64 abis. The other ABI's
5909 require more sophisticated support. */
5910 gcc_assert (TARGET_OLDABI);
5911
5912 /* If we're calling via a function pointer, use one of the magic
5913 libgcc.a stubs provided for each (FP_CODE, FP_RET_P) combination.
5914 Each stub expects the function address to arrive in register $2. */
5915 if (GET_CODE (fn) != SYMBOL_REF
5916 || !call_insn_operand (fn, VOIDmode))
5917 {
5918 char buf[30];
5919 rtx stub_fn, insn, addr;
5920 bool lazy_p;
5921
5922 /* If this is a locally-defined and locally-binding function,
5923 avoid the stub by calling the local alias directly. */
5924 if (mips16_local_function_p (fn))
5925 {
5926 *fn_ptr = mips16_local_alias (fn);
5927 return NULL_RTX;
5928 }
5929
5930 /* Create a SYMBOL_REF for the libgcc.a function. */
5931 if (fp_ret_p)
5932 sprintf (buf, "__mips16_call_stub_%s_%d",
5933 mips16_call_stub_mode_suffix (GET_MODE (retval)),
5934 fp_code);
5935 else
5936 sprintf (buf, "__mips16_call_stub_%d", fp_code);
5937 stub_fn = mips16_stub_function (buf);
5938
5939 /* The function uses $2 as an argument, so calls to it
5940 cannot be lazily bound. */
5941 SYMBOL_REF_FLAGS (stub_fn) |= SYMBOL_FLAG_BIND_NOW;
5942
5943 /* Load the target function into $2. */
5944 addr = gen_rtx_REG (Pmode, GP_REG_FIRST + 2);
5945 lazy_p = mips_load_call_address (MIPS_CALL_NORMAL, addr, fn);
5946
5947 /* Emit the call. */
5948 insn = mips_expand_call (MIPS_CALL_NORMAL, retval, stub_fn,
5949 args_size, NULL_RTX, lazy_p);
5950
5951 /* Tell GCC that this call does indeed use the value of $2. */
5952 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), addr);
5953
5954 /* If we are handling a floating-point return value, we need to
5955 save $18 in the function prologue. Putting a note on the
5956 call will mean that df_regs_ever_live_p ($18) will be true if the
5957 call is not eliminated, and we can check that in the prologue
5958 code. */
5959 if (fp_ret_p)
5960 CALL_INSN_FUNCTION_USAGE (insn) =
5961 gen_rtx_EXPR_LIST (VOIDmode,
5962 gen_rtx_CLOBBER (VOIDmode,
5963 gen_rtx_REG (word_mode, 18)),
5964 CALL_INSN_FUNCTION_USAGE (insn));
5965
5966 return insn;
5967 }
5968
5969 /* We know the function we are going to call. If we have already
5970 built a stub, we don't need to do anything further. */
5971 fnname = targetm.strip_name_encoding (XSTR (fn, 0));
5972 for (l = mips16_stubs; l != NULL; l = l->next)
5973 if (strcmp (l->name, fnname) == 0)
5974 break;
5975
5976 if (l == NULL)
5977 {
5978 const char *separator;
5979 char *secname, *stubname;
5980 tree stubid, stubdecl;
5981 unsigned int f;
5982
5983 /* If the function does not return in FPRs, the special stub
5984 section is named
5985 .mips16.call.FNNAME
5986
5987 If the function does return in FPRs, the stub section is named
5988 .mips16.call.fp.FNNAME
5989
5990 Build a decl for the stub. */
5991 secname = ACONCAT ((".mips16.call.", fp_ret_p ? "fp." : "",
5992 fnname, NULL));
5993 stubname = ACONCAT (("__call_stub_", fp_ret_p ? "fp_" : "",
5994 fnname, NULL));
5995 stubid = get_identifier (stubname);
5996 stubdecl = build_decl (FUNCTION_DECL, stubid,
5997 build_function_type (void_type_node, NULL_TREE));
5998 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname);
5999 DECL_RESULT (stubdecl) = build_decl (RESULT_DECL, NULL_TREE,
6000 void_type_node);
6001
6002 /* Output a comment. */
6003 fprintf (asm_out_file, "\t# Stub function to call %s%s (",
6004 (fp_ret_p
6005 ? (GET_MODE (retval) == SFmode ? "float " : "double ")
6006 : ""),
6007 fnname);
6008 separator = "";
6009 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
6010 {
6011 fprintf (asm_out_file, "%s%s", separator,
6012 (f & 3) == 1 ? "float" : "double");
6013 separator = ", ";
6014 }
6015 fprintf (asm_out_file, ")\n");
6016
6017 /* Start the function definition. */
6018 assemble_start_function (stubdecl, stubname);
6019 mips_start_function_definition (stubname, false);
6020
6021 if (!fp_ret_p)
6022 {
6023 /* Load the address of the MIPS16 function into $25. Do this
6024 first so that targets with coprocessor interlocks can use
6025 an MFC1 to fill the delay slot. */
6026 if (TARGET_EXPLICIT_RELOCS)
6027 {
6028 output_asm_insn ("lui\t%^,%%hi(%0)", &fn);
6029 output_asm_insn ("addiu\t%^,%^,%%lo(%0)", &fn);
6030 }
6031 else
6032 output_asm_insn ("la\t%^,%0", &fn);
6033 }
6034
6035 /* Move the arguments from general registers to floating-point
6036 registers. */
6037 mips_output_args_xfer (fp_code, 't');
6038
6039 if (!fp_ret_p)
6040 {
6041 /* Jump to the previously-loaded address. */
6042 output_asm_insn ("jr\t%^", NULL);
6043 }
6044 else
6045 {
6046 /* Save the return address in $18 and call the non-MIPS16 function.
6047 The stub's caller knows that $18 might be clobbered, even though
6048 $18 is usually a call-saved register. */
6049 fprintf (asm_out_file, "\tmove\t%s,%s\n",
6050 reg_names[GP_REG_FIRST + 18], reg_names[GP_REG_FIRST + 31]);
6051 output_asm_insn (MIPS_CALL ("jal", &fn, 0), &fn);
6052
6053 /* Move the result from floating-point registers to
6054 general registers. */
6055 switch (GET_MODE (retval))
6056 {
6057 case SCmode:
6058 mips_output_32bit_xfer ('f', GP_RETURN + 1,
6059 FP_REG_FIRST + MAX_FPRS_PER_FMT);
6060 /* Fall though. */
6061 case SFmode:
6062 mips_output_32bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6063 if (GET_MODE (retval) == SCmode && TARGET_64BIT)
6064 {
6065 /* On 64-bit targets, complex floats are returned in
6066 a single GPR, such that "sd" on a suitably-aligned
6067 target would store the value correctly. */
6068 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n",
6069 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN],
6070 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN]);
6071 fprintf (asm_out_file, "\tor\t%s,%s,%s\n",
6072 reg_names[GP_RETURN],
6073 reg_names[GP_RETURN],
6074 reg_names[GP_RETURN + 1]);
6075 }
6076 break;
6077
6078 case DCmode:
6079 mips_output_64bit_xfer ('f', GP_RETURN + (8 / UNITS_PER_WORD),
6080 FP_REG_FIRST + MAX_FPRS_PER_FMT);
6081 /* Fall though. */
6082 case DFmode:
6083 case V2SFmode:
6084 mips_output_64bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6085 break;
6086
6087 default:
6088 gcc_unreachable ();
6089 }
6090 fprintf (asm_out_file, "\tjr\t%s\n", reg_names[GP_REG_FIRST + 18]);
6091 }
6092
6093 #ifdef ASM_DECLARE_FUNCTION_SIZE
6094 ASM_DECLARE_FUNCTION_SIZE (asm_out_file, stubname, stubdecl);
6095 #endif
6096
6097 mips_end_function_definition (stubname);
6098
6099 /* Record this stub. */
6100 l = XNEW (struct mips16_stub);
6101 l->name = xstrdup (fnname);
6102 l->fp_ret_p = fp_ret_p;
6103 l->next = mips16_stubs;
6104 mips16_stubs = l;
6105 }
6106
6107 /* If we expect a floating-point return value, but we've built a
6108 stub which does not expect one, then we're in trouble. We can't
6109 use the existing stub, because it won't handle the floating-point
6110 value. We can't build a new stub, because the linker won't know
6111 which stub to use for the various calls in this object file.
6112 Fortunately, this case is illegal, since it means that a function
6113 was declared in two different ways in a single compilation. */
6114 if (fp_ret_p && !l->fp_ret_p)
6115 error ("cannot handle inconsistent calls to %qs", fnname);
6116
6117 if (retval == NULL_RTX)
6118 insn = gen_call_internal_direct (fn, args_size);
6119 else
6120 insn = gen_call_value_internal_direct (retval, fn, args_size);
6121 insn = mips_emit_call_insn (insn, fn, fn, false);
6122
6123 /* If we are calling a stub which handles a floating-point return
6124 value, we need to arrange to save $18 in the prologue. We do this
6125 by marking the function call as using the register. The prologue
6126 will later see that it is used, and emit code to save it. */
6127 if (fp_ret_p)
6128 CALL_INSN_FUNCTION_USAGE (insn) =
6129 gen_rtx_EXPR_LIST (VOIDmode,
6130 gen_rtx_CLOBBER (VOIDmode,
6131 gen_rtx_REG (word_mode, 18)),
6132 CALL_INSN_FUNCTION_USAGE (insn));
6133
6134 return insn;
6135 }
6136 \f
6137 /* Expand a call of type TYPE. RESULT is where the result will go (null
6138 for "call"s and "sibcall"s), ADDR is the address of the function,
6139 ARGS_SIZE is the size of the arguments and AUX is the value passed
6140 to us by mips_function_arg. LAZY_P is true if this call already
6141 involves a lazily-bound function address (such as when calling
6142 functions through a MIPS16 hard-float stub).
6143
6144 Return the call itself. */
6145
6146 rtx
6147 mips_expand_call (enum mips_call_type type, rtx result, rtx addr,
6148 rtx args_size, rtx aux, bool lazy_p)
6149 {
6150 rtx orig_addr, pattern, insn;
6151 int fp_code;
6152
6153 fp_code = aux == 0 ? 0 : (int) GET_MODE (aux);
6154 insn = mips16_build_call_stub (result, &addr, args_size, fp_code);
6155 if (insn)
6156 {
6157 gcc_assert (!lazy_p && type == MIPS_CALL_NORMAL);
6158 return insn;
6159 }
6160 ;
6161 orig_addr = addr;
6162 if (!call_insn_operand (addr, VOIDmode))
6163 {
6164 if (type == MIPS_CALL_EPILOGUE)
6165 addr = MIPS_EPILOGUE_TEMP (Pmode);
6166 else
6167 addr = gen_reg_rtx (Pmode);
6168 lazy_p |= mips_load_call_address (type, addr, orig_addr);
6169 }
6170
6171 if (result == 0)
6172 {
6173 rtx (*fn) (rtx, rtx);
6174
6175 if (type == MIPS_CALL_EPILOGUE && TARGET_SPLIT_CALLS)
6176 fn = gen_call_split;
6177 else if (type == MIPS_CALL_SIBCALL)
6178 fn = gen_sibcall_internal;
6179 else
6180 fn = gen_call_internal;
6181
6182 pattern = fn (addr, args_size);
6183 }
6184 else if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 2)
6185 {
6186 /* Handle return values created by mips_return_fpr_pair. */
6187 rtx (*fn) (rtx, rtx, rtx, rtx);
6188 rtx reg1, reg2;
6189
6190 if (type == MIPS_CALL_EPILOGUE && TARGET_SPLIT_CALLS)
6191 fn = gen_call_value_multiple_split;
6192 else if (type == MIPS_CALL_SIBCALL)
6193 fn = gen_sibcall_value_multiple_internal;
6194 else
6195 fn = gen_call_value_multiple_internal;
6196
6197 reg1 = XEXP (XVECEXP (result, 0, 0), 0);
6198 reg2 = XEXP (XVECEXP (result, 0, 1), 0);
6199 pattern = fn (reg1, addr, args_size, reg2);
6200 }
6201 else
6202 {
6203 rtx (*fn) (rtx, rtx, rtx);
6204
6205 if (type == MIPS_CALL_EPILOGUE && TARGET_SPLIT_CALLS)
6206 fn = gen_call_value_split;
6207 else if (type == MIPS_CALL_SIBCALL)
6208 fn = gen_sibcall_value_internal;
6209 else
6210 fn = gen_call_value_internal;
6211
6212 /* Handle return values created by mips_return_fpr_single. */
6213 if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 1)
6214 result = XEXP (XVECEXP (result, 0, 0), 0);
6215 pattern = fn (result, addr, args_size);
6216 }
6217
6218 return mips_emit_call_insn (pattern, orig_addr, addr, lazy_p);
6219 }
6220
6221 /* Split call instruction INSN into a $gp-clobbering call and
6222 (where necessary) an instruction to restore $gp from its save slot.
6223 CALL_PATTERN is the pattern of the new call. */
6224
6225 void
6226 mips_split_call (rtx insn, rtx call_pattern)
6227 {
6228 rtx new_insn;
6229
6230 new_insn = emit_call_insn (call_pattern);
6231 CALL_INSN_FUNCTION_USAGE (new_insn)
6232 = copy_rtx (CALL_INSN_FUNCTION_USAGE (insn));
6233 if (!find_reg_note (insn, REG_NORETURN, 0))
6234 /* Pick a temporary register that is suitable for both MIPS16 and
6235 non-MIPS16 code. $4 and $5 are used for returning complex double
6236 values in soft-float code, so $6 is the first suitable candidate. */
6237 mips_restore_gp (gen_rtx_REG (Pmode, GP_ARG_FIRST + 2));
6238 }
6239
6240 /* Implement TARGET_FUNCTION_OK_FOR_SIBCALL. */
6241
6242 static bool
6243 mips_function_ok_for_sibcall (tree decl, tree exp ATTRIBUTE_UNUSED)
6244 {
6245 if (!TARGET_SIBCALLS)
6246 return false;
6247
6248 /* Interrupt handlers need special epilogue code and therefore can't
6249 use sibcalls. */
6250 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
6251 return false;
6252
6253 /* We can't do a sibcall if the called function is a MIPS16 function
6254 because there is no direct "jx" instruction equivalent to "jalx" to
6255 switch the ISA mode. We only care about cases where the sibling
6256 and normal calls would both be direct. */
6257 if (decl
6258 && mips_use_mips16_mode_p (decl)
6259 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode))
6260 return false;
6261
6262 /* When -minterlink-mips16 is in effect, assume that non-locally-binding
6263 functions could be MIPS16 ones unless an attribute explicitly tells
6264 us otherwise. */
6265 if (TARGET_INTERLINK_MIPS16
6266 && decl
6267 && (DECL_EXTERNAL (decl) || !targetm.binds_local_p (decl))
6268 && !mips_nomips16_decl_p (decl)
6269 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode))
6270 return false;
6271
6272 /* Otherwise OK. */
6273 return true;
6274 }
6275 \f
6276 /* Emit code to move general operand SRC into condition-code
6277 register DEST given that SCRATCH is a scratch TFmode FPR.
6278 The sequence is:
6279
6280 FP1 = SRC
6281 FP2 = 0.0f
6282 DEST = FP2 < FP1
6283
6284 where FP1 and FP2 are single-precision FPRs taken from SCRATCH. */
6285
6286 void
6287 mips_expand_fcc_reload (rtx dest, rtx src, rtx scratch)
6288 {
6289 rtx fp1, fp2;
6290
6291 /* Change the source to SFmode. */
6292 if (MEM_P (src))
6293 src = adjust_address (src, SFmode, 0);
6294 else if (REG_P (src) || GET_CODE (src) == SUBREG)
6295 src = gen_rtx_REG (SFmode, true_regnum (src));
6296
6297 fp1 = gen_rtx_REG (SFmode, REGNO (scratch));
6298 fp2 = gen_rtx_REG (SFmode, REGNO (scratch) + MAX_FPRS_PER_FMT);
6299
6300 mips_emit_move (copy_rtx (fp1), src);
6301 mips_emit_move (copy_rtx (fp2), CONST0_RTX (SFmode));
6302 emit_insn (gen_slt_sf (dest, fp2, fp1));
6303 }
6304 \f
6305 /* Emit straight-line code to move LENGTH bytes from SRC to DEST.
6306 Assume that the areas do not overlap. */
6307
6308 static void
6309 mips_block_move_straight (rtx dest, rtx src, HOST_WIDE_INT length)
6310 {
6311 HOST_WIDE_INT offset, delta;
6312 unsigned HOST_WIDE_INT bits;
6313 int i;
6314 enum machine_mode mode;
6315 rtx *regs;
6316
6317 /* Work out how many bits to move at a time. If both operands have
6318 half-word alignment, it is usually better to move in half words.
6319 For instance, lh/lh/sh/sh is usually better than lwl/lwr/swl/swr
6320 and lw/lw/sw/sw is usually better than ldl/ldr/sdl/sdr.
6321 Otherwise move word-sized chunks. */
6322 if (MEM_ALIGN (src) == BITS_PER_WORD / 2
6323 && MEM_ALIGN (dest) == BITS_PER_WORD / 2)
6324 bits = BITS_PER_WORD / 2;
6325 else
6326 bits = BITS_PER_WORD;
6327
6328 mode = mode_for_size (bits, MODE_INT, 0);
6329 delta = bits / BITS_PER_UNIT;
6330
6331 /* Allocate a buffer for the temporary registers. */
6332 regs = XALLOCAVEC (rtx, length / delta);
6333
6334 /* Load as many BITS-sized chunks as possible. Use a normal load if
6335 the source has enough alignment, otherwise use left/right pairs. */
6336 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
6337 {
6338 regs[i] = gen_reg_rtx (mode);
6339 if (MEM_ALIGN (src) >= bits)
6340 mips_emit_move (regs[i], adjust_address (src, mode, offset));
6341 else
6342 {
6343 rtx part = adjust_address (src, BLKmode, offset);
6344 if (!mips_expand_ext_as_unaligned_load (regs[i], part, bits, 0))
6345 gcc_unreachable ();
6346 }
6347 }
6348
6349 /* Copy the chunks to the destination. */
6350 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
6351 if (MEM_ALIGN (dest) >= bits)
6352 mips_emit_move (adjust_address (dest, mode, offset), regs[i]);
6353 else
6354 {
6355 rtx part = adjust_address (dest, BLKmode, offset);
6356 if (!mips_expand_ins_as_unaligned_store (part, regs[i], bits, 0))
6357 gcc_unreachable ();
6358 }
6359
6360 /* Mop up any left-over bytes. */
6361 if (offset < length)
6362 {
6363 src = adjust_address (src, BLKmode, offset);
6364 dest = adjust_address (dest, BLKmode, offset);
6365 move_by_pieces (dest, src, length - offset,
6366 MIN (MEM_ALIGN (src), MEM_ALIGN (dest)), 0);
6367 }
6368 }
6369
6370 /* Helper function for doing a loop-based block operation on memory
6371 reference MEM. Each iteration of the loop will operate on LENGTH
6372 bytes of MEM.
6373
6374 Create a new base register for use within the loop and point it to
6375 the start of MEM. Create a new memory reference that uses this
6376 register. Store them in *LOOP_REG and *LOOP_MEM respectively. */
6377
6378 static void
6379 mips_adjust_block_mem (rtx mem, HOST_WIDE_INT length,
6380 rtx *loop_reg, rtx *loop_mem)
6381 {
6382 *loop_reg = copy_addr_to_reg (XEXP (mem, 0));
6383
6384 /* Although the new mem does not refer to a known location,
6385 it does keep up to LENGTH bytes of alignment. */
6386 *loop_mem = change_address (mem, BLKmode, *loop_reg);
6387 set_mem_align (*loop_mem, MIN (MEM_ALIGN (mem), length * BITS_PER_UNIT));
6388 }
6389
6390 /* Move LENGTH bytes from SRC to DEST using a loop that moves BYTES_PER_ITER
6391 bytes at a time. LENGTH must be at least BYTES_PER_ITER. Assume that
6392 the memory regions do not overlap. */
6393
6394 static void
6395 mips_block_move_loop (rtx dest, rtx src, HOST_WIDE_INT length,
6396 HOST_WIDE_INT bytes_per_iter)
6397 {
6398 rtx label, src_reg, dest_reg, final_src, test;
6399 HOST_WIDE_INT leftover;
6400
6401 leftover = length % bytes_per_iter;
6402 length -= leftover;
6403
6404 /* Create registers and memory references for use within the loop. */
6405 mips_adjust_block_mem (src, bytes_per_iter, &src_reg, &src);
6406 mips_adjust_block_mem (dest, bytes_per_iter, &dest_reg, &dest);
6407
6408 /* Calculate the value that SRC_REG should have after the last iteration
6409 of the loop. */
6410 final_src = expand_simple_binop (Pmode, PLUS, src_reg, GEN_INT (length),
6411 0, 0, OPTAB_WIDEN);
6412
6413 /* Emit the start of the loop. */
6414 label = gen_label_rtx ();
6415 emit_label (label);
6416
6417 /* Emit the loop body. */
6418 mips_block_move_straight (dest, src, bytes_per_iter);
6419
6420 /* Move on to the next block. */
6421 mips_emit_move (src_reg, plus_constant (src_reg, bytes_per_iter));
6422 mips_emit_move (dest_reg, plus_constant (dest_reg, bytes_per_iter));
6423
6424 /* Emit the loop condition. */
6425 test = gen_rtx_NE (VOIDmode, src_reg, final_src);
6426 if (Pmode == DImode)
6427 emit_jump_insn (gen_cbranchdi4 (test, src_reg, final_src, label));
6428 else
6429 emit_jump_insn (gen_cbranchsi4 (test, src_reg, final_src, label));
6430
6431 /* Mop up any left-over bytes. */
6432 if (leftover)
6433 mips_block_move_straight (dest, src, leftover);
6434 }
6435
6436 /* Expand a movmemsi instruction, which copies LENGTH bytes from
6437 memory reference SRC to memory reference DEST. */
6438
6439 bool
6440 mips_expand_block_move (rtx dest, rtx src, rtx length)
6441 {
6442 if (GET_CODE (length) == CONST_INT)
6443 {
6444 if (INTVAL (length) <= MIPS_MAX_MOVE_BYTES_STRAIGHT)
6445 {
6446 mips_block_move_straight (dest, src, INTVAL (length));
6447 return true;
6448 }
6449 else if (optimize)
6450 {
6451 mips_block_move_loop (dest, src, INTVAL (length),
6452 MIPS_MAX_MOVE_BYTES_PER_LOOP_ITER);
6453 return true;
6454 }
6455 }
6456 return false;
6457 }
6458 \f
6459 /* Expand a loop of synci insns for the address range [BEGIN, END). */
6460
6461 void
6462 mips_expand_synci_loop (rtx begin, rtx end)
6463 {
6464 rtx inc, label, cmp, cmp_result;
6465
6466 /* Load INC with the cache line size (rdhwr INC,$1). */
6467 inc = gen_reg_rtx (Pmode);
6468 emit_insn (Pmode == SImode
6469 ? gen_rdhwr_synci_step_si (inc)
6470 : gen_rdhwr_synci_step_di (inc));
6471
6472 /* Loop back to here. */
6473 label = gen_label_rtx ();
6474 emit_label (label);
6475
6476 emit_insn (gen_synci (begin));
6477
6478 cmp = mips_force_binary (Pmode, GTU, begin, end);
6479
6480 mips_emit_binary (PLUS, begin, begin, inc);
6481
6482 cmp_result = gen_rtx_EQ (VOIDmode, cmp, const0_rtx);
6483 emit_jump_insn (gen_condjump (cmp_result, label));
6484 }
6485 \f
6486 /* Expand a QI or HI mode atomic memory operation.
6487
6488 GENERATOR contains a pointer to the gen_* function that generates
6489 the SI mode underlying atomic operation using masks that we
6490 calculate.
6491
6492 RESULT is the return register for the operation. Its value is NULL
6493 if unused.
6494
6495 MEM is the location of the atomic access.
6496
6497 OLDVAL is the first operand for the operation.
6498
6499 NEWVAL is the optional second operand for the operation. Its value
6500 is NULL if unused. */
6501
6502 void
6503 mips_expand_atomic_qihi (union mips_gen_fn_ptrs generator,
6504 rtx result, rtx mem, rtx oldval, rtx newval)
6505 {
6506 rtx orig_addr, memsi_addr, memsi, shift, shiftsi, unshifted_mask;
6507 rtx unshifted_mask_reg, mask, inverted_mask, si_op;
6508 rtx res = NULL;
6509 enum machine_mode mode;
6510
6511 mode = GET_MODE (mem);
6512
6513 /* Compute the address of the containing SImode value. */
6514 orig_addr = force_reg (Pmode, XEXP (mem, 0));
6515 memsi_addr = mips_force_binary (Pmode, AND, orig_addr,
6516 force_reg (Pmode, GEN_INT (-4)));
6517
6518 /* Create a memory reference for it. */
6519 memsi = gen_rtx_MEM (SImode, memsi_addr);
6520 set_mem_alias_set (memsi, ALIAS_SET_MEMORY_BARRIER);
6521 MEM_VOLATILE_P (memsi) = MEM_VOLATILE_P (mem);
6522
6523 /* Work out the byte offset of the QImode or HImode value,
6524 counting from the least significant byte. */
6525 shift = mips_force_binary (Pmode, AND, orig_addr, GEN_INT (3));
6526 if (TARGET_BIG_ENDIAN)
6527 mips_emit_binary (XOR, shift, shift, GEN_INT (mode == QImode ? 3 : 2));
6528
6529 /* Multiply by eight to convert the shift value from bytes to bits. */
6530 mips_emit_binary (ASHIFT, shift, shift, GEN_INT (3));
6531
6532 /* Make the final shift an SImode value, so that it can be used in
6533 SImode operations. */
6534 shiftsi = force_reg (SImode, gen_lowpart (SImode, shift));
6535
6536 /* Set MASK to an inclusive mask of the QImode or HImode value. */
6537 unshifted_mask = GEN_INT (GET_MODE_MASK (mode));
6538 unshifted_mask_reg = force_reg (SImode, unshifted_mask);
6539 mask = mips_force_binary (SImode, ASHIFT, unshifted_mask_reg, shiftsi);
6540
6541 /* Compute the equivalent exclusive mask. */
6542 inverted_mask = gen_reg_rtx (SImode);
6543 emit_insn (gen_rtx_SET (VOIDmode, inverted_mask,
6544 gen_rtx_NOT (SImode, mask)));
6545
6546 /* Shift the old value into place. */
6547 if (oldval != const0_rtx)
6548 {
6549 oldval = convert_modes (SImode, mode, oldval, true);
6550 oldval = force_reg (SImode, oldval);
6551 oldval = mips_force_binary (SImode, ASHIFT, oldval, shiftsi);
6552 }
6553
6554 /* Do the same for the new value. */
6555 if (newval && newval != const0_rtx)
6556 {
6557 newval = convert_modes (SImode, mode, newval, true);
6558 newval = force_reg (SImode, newval);
6559 newval = mips_force_binary (SImode, ASHIFT, newval, shiftsi);
6560 }
6561
6562 /* Do the SImode atomic access. */
6563 if (result)
6564 res = gen_reg_rtx (SImode);
6565 if (newval)
6566 si_op = generator.fn_6 (res, memsi, mask, inverted_mask, oldval, newval);
6567 else if (result)
6568 si_op = generator.fn_5 (res, memsi, mask, inverted_mask, oldval);
6569 else
6570 si_op = generator.fn_4 (memsi, mask, inverted_mask, oldval);
6571
6572 emit_insn (si_op);
6573
6574 if (result)
6575 {
6576 /* Shift and convert the result. */
6577 mips_emit_binary (AND, res, res, mask);
6578 mips_emit_binary (LSHIFTRT, res, res, shiftsi);
6579 mips_emit_move (result, gen_lowpart (GET_MODE (result), res));
6580 }
6581 }
6582
6583 /* Return true if it is possible to use left/right accesses for a
6584 bitfield of WIDTH bits starting BITPOS bits into *OP. When
6585 returning true, update *OP, *LEFT and *RIGHT as follows:
6586
6587 *OP is a BLKmode reference to the whole field.
6588
6589 *LEFT is a QImode reference to the first byte if big endian or
6590 the last byte if little endian. This address can be used in the
6591 left-side instructions (LWL, SWL, LDL, SDL).
6592
6593 *RIGHT is a QImode reference to the opposite end of the field and
6594 can be used in the patterning right-side instruction. */
6595
6596 static bool
6597 mips_get_unaligned_mem (rtx *op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos,
6598 rtx *left, rtx *right)
6599 {
6600 rtx first, last;
6601
6602 /* Check that the operand really is a MEM. Not all the extv and
6603 extzv predicates are checked. */
6604 if (!MEM_P (*op))
6605 return false;
6606
6607 /* Check that the size is valid. */
6608 if (width != 32 && (!TARGET_64BIT || width != 64))
6609 return false;
6610
6611 /* We can only access byte-aligned values. Since we are always passed
6612 a reference to the first byte of the field, it is not necessary to
6613 do anything with BITPOS after this check. */
6614 if (bitpos % BITS_PER_UNIT != 0)
6615 return false;
6616
6617 /* Reject aligned bitfields: we want to use a normal load or store
6618 instead of a left/right pair. */
6619 if (MEM_ALIGN (*op) >= width)
6620 return false;
6621
6622 /* Adjust *OP to refer to the whole field. This also has the effect
6623 of legitimizing *OP's address for BLKmode, possibly simplifying it. */
6624 *op = adjust_address (*op, BLKmode, 0);
6625 set_mem_size (*op, GEN_INT (width / BITS_PER_UNIT));
6626
6627 /* Get references to both ends of the field. We deliberately don't
6628 use the original QImode *OP for FIRST since the new BLKmode one
6629 might have a simpler address. */
6630 first = adjust_address (*op, QImode, 0);
6631 last = adjust_address (*op, QImode, width / BITS_PER_UNIT - 1);
6632
6633 /* Allocate to LEFT and RIGHT according to endianness. LEFT should
6634 correspond to the MSB and RIGHT to the LSB. */
6635 if (TARGET_BIG_ENDIAN)
6636 *left = first, *right = last;
6637 else
6638 *left = last, *right = first;
6639
6640 return true;
6641 }
6642
6643 /* Try to use left/right loads to expand an "extv" or "extzv" pattern.
6644 DEST, SRC, WIDTH and BITPOS are the operands passed to the expander;
6645 the operation is the equivalent of:
6646
6647 (set DEST (*_extract SRC WIDTH BITPOS))
6648
6649 Return true on success. */
6650
6651 bool
6652 mips_expand_ext_as_unaligned_load (rtx dest, rtx src, HOST_WIDE_INT width,
6653 HOST_WIDE_INT bitpos)
6654 {
6655 rtx left, right, temp;
6656
6657 /* If TARGET_64BIT, the destination of a 32-bit "extz" or "extzv" will
6658 be a paradoxical word_mode subreg. This is the only case in which
6659 we allow the destination to be larger than the source. */
6660 if (GET_CODE (dest) == SUBREG
6661 && GET_MODE (dest) == DImode
6662 && GET_MODE (SUBREG_REG (dest)) == SImode)
6663 dest = SUBREG_REG (dest);
6664
6665 /* After the above adjustment, the destination must be the same
6666 width as the source. */
6667 if (GET_MODE_BITSIZE (GET_MODE (dest)) != width)
6668 return false;
6669
6670 if (!mips_get_unaligned_mem (&src, width, bitpos, &left, &right))
6671 return false;
6672
6673 temp = gen_reg_rtx (GET_MODE (dest));
6674 if (GET_MODE (dest) == DImode)
6675 {
6676 emit_insn (gen_mov_ldl (temp, src, left));
6677 emit_insn (gen_mov_ldr (dest, copy_rtx (src), right, temp));
6678 }
6679 else
6680 {
6681 emit_insn (gen_mov_lwl (temp, src, left));
6682 emit_insn (gen_mov_lwr (dest, copy_rtx (src), right, temp));
6683 }
6684 return true;
6685 }
6686
6687 /* Try to use left/right stores to expand an "ins" pattern. DEST, WIDTH,
6688 BITPOS and SRC are the operands passed to the expander; the operation
6689 is the equivalent of:
6690
6691 (set (zero_extract DEST WIDTH BITPOS) SRC)
6692
6693 Return true on success. */
6694
6695 bool
6696 mips_expand_ins_as_unaligned_store (rtx dest, rtx src, HOST_WIDE_INT width,
6697 HOST_WIDE_INT bitpos)
6698 {
6699 rtx left, right;
6700 enum machine_mode mode;
6701
6702 if (!mips_get_unaligned_mem (&dest, width, bitpos, &left, &right))
6703 return false;
6704
6705 mode = mode_for_size (width, MODE_INT, 0);
6706 src = gen_lowpart (mode, src);
6707 if (mode == DImode)
6708 {
6709 emit_insn (gen_mov_sdl (dest, src, left));
6710 emit_insn (gen_mov_sdr (copy_rtx (dest), copy_rtx (src), right));
6711 }
6712 else
6713 {
6714 emit_insn (gen_mov_swl (dest, src, left));
6715 emit_insn (gen_mov_swr (copy_rtx (dest), copy_rtx (src), right));
6716 }
6717 return true;
6718 }
6719
6720 /* Return true if X is a MEM with the same size as MODE. */
6721
6722 bool
6723 mips_mem_fits_mode_p (enum machine_mode mode, rtx x)
6724 {
6725 rtx size;
6726
6727 if (!MEM_P (x))
6728 return false;
6729
6730 size = MEM_SIZE (x);
6731 return size && INTVAL (size) == GET_MODE_SIZE (mode);
6732 }
6733
6734 /* Return true if (zero_extract OP WIDTH BITPOS) can be used as the
6735 source of an "ext" instruction or the destination of an "ins"
6736 instruction. OP must be a register operand and the following
6737 conditions must hold:
6738
6739 0 <= BITPOS < GET_MODE_BITSIZE (GET_MODE (op))
6740 0 < WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
6741 0 < BITPOS + WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
6742
6743 Also reject lengths equal to a word as they are better handled
6744 by the move patterns. */
6745
6746 bool
6747 mips_use_ins_ext_p (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos)
6748 {
6749 if (!ISA_HAS_EXT_INS
6750 || !register_operand (op, VOIDmode)
6751 || GET_MODE_BITSIZE (GET_MODE (op)) > BITS_PER_WORD)
6752 return false;
6753
6754 if (!IN_RANGE (width, 1, GET_MODE_BITSIZE (GET_MODE (op)) - 1))
6755 return false;
6756
6757 if (bitpos < 0 || bitpos + width > GET_MODE_BITSIZE (GET_MODE (op)))
6758 return false;
6759
6760 return true;
6761 }
6762
6763 /* Check if MASK and SHIFT are valid in mask-low-and-shift-left
6764 operation if MAXLEN is the maxium length of consecutive bits that
6765 can make up MASK. MODE is the mode of the operation. See
6766 mask_low_and_shift_len for the actual definition. */
6767
6768 bool
6769 mask_low_and_shift_p (enum machine_mode mode, rtx mask, rtx shift, int maxlen)
6770 {
6771 return IN_RANGE (mask_low_and_shift_len (mode, mask, shift), 1, maxlen);
6772 }
6773
6774 /* The canonical form of a mask-low-and-shift-left operation is
6775 (and (ashift X SHIFT) MASK) where MASK has the lower SHIFT number of bits
6776 cleared. Thus we need to shift MASK to the right before checking if it
6777 is a valid mask value. MODE is the mode of the operation. If true
6778 return the length of the mask, otherwise return -1. */
6779
6780 int
6781 mask_low_and_shift_len (enum machine_mode mode, rtx mask, rtx shift)
6782 {
6783 HOST_WIDE_INT shval;
6784
6785 shval = INTVAL (shift) & (GET_MODE_BITSIZE (mode) - 1);
6786 return exact_log2 ((UINTVAL (mask) >> shval) + 1);
6787 }
6788 \f
6789 /* Return true if -msplit-addresses is selected and should be honored.
6790
6791 -msplit-addresses is a half-way house between explicit relocations
6792 and the traditional assembler macros. It can split absolute 32-bit
6793 symbolic constants into a high/lo_sum pair but uses macros for other
6794 sorts of access.
6795
6796 Like explicit relocation support for REL targets, it relies
6797 on GNU extensions in the assembler and the linker.
6798
6799 Although this code should work for -O0, it has traditionally
6800 been treated as an optimization. */
6801
6802 static bool
6803 mips_split_addresses_p (void)
6804 {
6805 return (TARGET_SPLIT_ADDRESSES
6806 && optimize
6807 && !TARGET_MIPS16
6808 && !flag_pic
6809 && !ABI_HAS_64BIT_SYMBOLS);
6810 }
6811
6812 /* (Re-)Initialize mips_split_p, mips_lo_relocs and mips_hi_relocs. */
6813
6814 static void
6815 mips_init_relocs (void)
6816 {
6817 memset (mips_split_p, '\0', sizeof (mips_split_p));
6818 memset (mips_split_hi_p, '\0', sizeof (mips_split_hi_p));
6819 memset (mips_hi_relocs, '\0', sizeof (mips_hi_relocs));
6820 memset (mips_lo_relocs, '\0', sizeof (mips_lo_relocs));
6821
6822 if (ABI_HAS_64BIT_SYMBOLS)
6823 {
6824 if (TARGET_EXPLICIT_RELOCS)
6825 {
6826 mips_split_p[SYMBOL_64_HIGH] = true;
6827 mips_hi_relocs[SYMBOL_64_HIGH] = "%highest(";
6828 mips_lo_relocs[SYMBOL_64_HIGH] = "%higher(";
6829
6830 mips_split_p[SYMBOL_64_MID] = true;
6831 mips_hi_relocs[SYMBOL_64_MID] = "%higher(";
6832 mips_lo_relocs[SYMBOL_64_MID] = "%hi(";
6833
6834 mips_split_p[SYMBOL_64_LOW] = true;
6835 mips_hi_relocs[SYMBOL_64_LOW] = "%hi(";
6836 mips_lo_relocs[SYMBOL_64_LOW] = "%lo(";
6837
6838 mips_split_p[SYMBOL_ABSOLUTE] = true;
6839 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
6840 }
6841 }
6842 else
6843 {
6844 if (TARGET_EXPLICIT_RELOCS || mips_split_addresses_p () || TARGET_MIPS16)
6845 {
6846 mips_split_p[SYMBOL_ABSOLUTE] = true;
6847 mips_hi_relocs[SYMBOL_ABSOLUTE] = "%hi(";
6848 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
6849
6850 mips_lo_relocs[SYMBOL_32_HIGH] = "%hi(";
6851 }
6852 }
6853
6854 if (TARGET_MIPS16)
6855 {
6856 /* The high part is provided by a pseudo copy of $gp. */
6857 mips_split_p[SYMBOL_GP_RELATIVE] = true;
6858 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gprel(";
6859 }
6860 else if (TARGET_EXPLICIT_RELOCS)
6861 /* Small data constants are kept whole until after reload,
6862 then lowered by mips_rewrite_small_data. */
6863 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gp_rel(";
6864
6865 if (TARGET_EXPLICIT_RELOCS)
6866 {
6867 mips_split_p[SYMBOL_GOT_PAGE_OFST] = true;
6868 if (TARGET_NEWABI)
6869 {
6870 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got_page(";
6871 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%got_ofst(";
6872 }
6873 else
6874 {
6875 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got(";
6876 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%lo(";
6877 }
6878 if (TARGET_MIPS16)
6879 /* Expose the use of $28 as soon as possible. */
6880 mips_split_hi_p[SYMBOL_GOT_PAGE_OFST] = true;
6881
6882 if (TARGET_XGOT)
6883 {
6884 /* The HIGH and LO_SUM are matched by special .md patterns. */
6885 mips_split_p[SYMBOL_GOT_DISP] = true;
6886
6887 mips_split_p[SYMBOL_GOTOFF_DISP] = true;
6888 mips_hi_relocs[SYMBOL_GOTOFF_DISP] = "%got_hi(";
6889 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_lo(";
6890
6891 mips_split_p[SYMBOL_GOTOFF_CALL] = true;
6892 mips_hi_relocs[SYMBOL_GOTOFF_CALL] = "%call_hi(";
6893 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call_lo(";
6894 }
6895 else
6896 {
6897 if (TARGET_NEWABI)
6898 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_disp(";
6899 else
6900 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got(";
6901 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call16(";
6902 if (TARGET_MIPS16)
6903 /* Expose the use of $28 as soon as possible. */
6904 mips_split_p[SYMBOL_GOT_DISP] = true;
6905 }
6906 }
6907
6908 if (TARGET_NEWABI)
6909 {
6910 mips_split_p[SYMBOL_GOTOFF_LOADGP] = true;
6911 mips_hi_relocs[SYMBOL_GOTOFF_LOADGP] = "%hi(%neg(%gp_rel(";
6912 mips_lo_relocs[SYMBOL_GOTOFF_LOADGP] = "%lo(%neg(%gp_rel(";
6913 }
6914
6915 mips_lo_relocs[SYMBOL_TLSGD] = "%tlsgd(";
6916 mips_lo_relocs[SYMBOL_TLSLDM] = "%tlsldm(";
6917
6918 mips_split_p[SYMBOL_DTPREL] = true;
6919 mips_hi_relocs[SYMBOL_DTPREL] = "%dtprel_hi(";
6920 mips_lo_relocs[SYMBOL_DTPREL] = "%dtprel_lo(";
6921
6922 mips_lo_relocs[SYMBOL_GOTTPREL] = "%gottprel(";
6923
6924 mips_split_p[SYMBOL_TPREL] = true;
6925 mips_hi_relocs[SYMBOL_TPREL] = "%tprel_hi(";
6926 mips_lo_relocs[SYMBOL_TPREL] = "%tprel_lo(";
6927
6928 mips_lo_relocs[SYMBOL_HALF] = "%half(";
6929 }
6930
6931 /* If OP is an UNSPEC address, return the address to which it refers,
6932 otherwise return OP itself. */
6933
6934 static rtx
6935 mips_strip_unspec_address (rtx op)
6936 {
6937 rtx base, offset;
6938
6939 split_const (op, &base, &offset);
6940 if (UNSPEC_ADDRESS_P (base))
6941 op = plus_constant (UNSPEC_ADDRESS (base), INTVAL (offset));
6942 return op;
6943 }
6944
6945 /* Print symbolic operand OP, which is part of a HIGH or LO_SUM
6946 in context CONTEXT. RELOCS is the array of relocations to use. */
6947
6948 static void
6949 mips_print_operand_reloc (FILE *file, rtx op, enum mips_symbol_context context,
6950 const char **relocs)
6951 {
6952 enum mips_symbol_type symbol_type;
6953 const char *p;
6954
6955 symbol_type = mips_classify_symbolic_expression (op, context);
6956 gcc_assert (relocs[symbol_type]);
6957
6958 fputs (relocs[symbol_type], file);
6959 output_addr_const (file, mips_strip_unspec_address (op));
6960 for (p = relocs[symbol_type]; *p != 0; p++)
6961 if (*p == '(')
6962 fputc (')', file);
6963 }
6964
6965 /* Print the text for PRINT_OPERAND punctation character CH to FILE.
6966 The punctuation characters are:
6967
6968 '(' Start a nested ".set noreorder" block.
6969 ')' End a nested ".set noreorder" block.
6970 '[' Start a nested ".set noat" block.
6971 ']' End a nested ".set noat" block.
6972 '<' Start a nested ".set nomacro" block.
6973 '>' End a nested ".set nomacro" block.
6974 '*' Behave like %(%< if generating a delayed-branch sequence.
6975 '#' Print a nop if in a ".set noreorder" block.
6976 '/' Like '#', but do nothing within a delayed-branch sequence.
6977 '?' Print "l" if mips_branch_likely is true
6978 '~' Print a nop if mips_branch_likely is true
6979 '.' Print the name of the register with a hard-wired zero (zero or $0).
6980 '@' Print the name of the assembler temporary register (at or $1).
6981 '^' Print the name of the pic call-through register (t9 or $25).
6982 '+' Print the name of the gp register (usually gp or $28).
6983 '$' Print the name of the stack pointer register (sp or $29).
6984 '|' Print ".set push; .set mips2" if !ISA_HAS_LL_SC.
6985 '-' Print ".set pop" under the same conditions for '|'.
6986
6987 See also mips_init_print_operand_pucnt. */
6988
6989 static void
6990 mips_print_operand_punctuation (FILE *file, int ch)
6991 {
6992 switch (ch)
6993 {
6994 case '(':
6995 if (set_noreorder++ == 0)
6996 fputs (".set\tnoreorder\n\t", file);
6997 break;
6998
6999 case ')':
7000 gcc_assert (set_noreorder > 0);
7001 if (--set_noreorder == 0)
7002 fputs ("\n\t.set\treorder", file);
7003 break;
7004
7005 case '[':
7006 if (set_noat++ == 0)
7007 fputs (".set\tnoat\n\t", file);
7008 break;
7009
7010 case ']':
7011 gcc_assert (set_noat > 0);
7012 if (--set_noat == 0)
7013 fputs ("\n\t.set\tat", file);
7014 break;
7015
7016 case '<':
7017 if (set_nomacro++ == 0)
7018 fputs (".set\tnomacro\n\t", file);
7019 break;
7020
7021 case '>':
7022 gcc_assert (set_nomacro > 0);
7023 if (--set_nomacro == 0)
7024 fputs ("\n\t.set\tmacro", file);
7025 break;
7026
7027 case '*':
7028 if (final_sequence != 0)
7029 {
7030 mips_print_operand_punctuation (file, '(');
7031 mips_print_operand_punctuation (file, '<');
7032 }
7033 break;
7034
7035 case '#':
7036 if (set_noreorder != 0)
7037 fputs ("\n\tnop", file);
7038 break;
7039
7040 case '/':
7041 /* Print an extra newline so that the delayed insn is separated
7042 from the following ones. This looks neater and is consistent
7043 with non-nop delayed sequences. */
7044 if (set_noreorder != 0 && final_sequence == 0)
7045 fputs ("\n\tnop\n", file);
7046 break;
7047
7048 case '?':
7049 if (mips_branch_likely)
7050 putc ('l', file);
7051 break;
7052
7053 case '~':
7054 if (mips_branch_likely)
7055 fputs ("\n\tnop", file);
7056 break;
7057
7058 case '.':
7059 fputs (reg_names[GP_REG_FIRST + 0], file);
7060 break;
7061
7062 case '@':
7063 fputs (reg_names[GP_REG_FIRST + 1], file);
7064 break;
7065
7066 case '^':
7067 fputs (reg_names[PIC_FUNCTION_ADDR_REGNUM], file);
7068 break;
7069
7070 case '+':
7071 fputs (reg_names[PIC_OFFSET_TABLE_REGNUM], file);
7072 break;
7073
7074 case '$':
7075 fputs (reg_names[STACK_POINTER_REGNUM], file);
7076 break;
7077
7078 case '|':
7079 if (!ISA_HAS_LL_SC)
7080 fputs (".set\tpush\n\t.set\tmips2\n\t", file);
7081 break;
7082
7083 case '-':
7084 if (!ISA_HAS_LL_SC)
7085 fputs ("\n\t.set\tpop", file);
7086 break;
7087
7088 default:
7089 gcc_unreachable ();
7090 break;
7091 }
7092 }
7093
7094 /* Initialize mips_print_operand_punct. */
7095
7096 static void
7097 mips_init_print_operand_punct (void)
7098 {
7099 const char *p;
7100
7101 for (p = "()[]<>*#/?~.@^+$|-"; *p; p++)
7102 mips_print_operand_punct[(unsigned char) *p] = true;
7103 }
7104
7105 /* PRINT_OPERAND prefix LETTER refers to the integer branch instruction
7106 associated with condition CODE. Print the condition part of the
7107 opcode to FILE. */
7108
7109 static void
7110 mips_print_int_branch_condition (FILE *file, enum rtx_code code, int letter)
7111 {
7112 switch (code)
7113 {
7114 case EQ:
7115 case NE:
7116 case GT:
7117 case GE:
7118 case LT:
7119 case LE:
7120 case GTU:
7121 case GEU:
7122 case LTU:
7123 case LEU:
7124 /* Conveniently, the MIPS names for these conditions are the same
7125 as their RTL equivalents. */
7126 fputs (GET_RTX_NAME (code), file);
7127 break;
7128
7129 default:
7130 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
7131 break;
7132 }
7133 }
7134
7135 /* Likewise floating-point branches. */
7136
7137 static void
7138 mips_print_float_branch_condition (FILE *file, enum rtx_code code, int letter)
7139 {
7140 switch (code)
7141 {
7142 case EQ:
7143 fputs ("c1f", file);
7144 break;
7145
7146 case NE:
7147 fputs ("c1t", file);
7148 break;
7149
7150 default:
7151 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
7152 break;
7153 }
7154 }
7155
7156 /* Implement the PRINT_OPERAND macro. The MIPS-specific operand codes are:
7157
7158 'X' Print CONST_INT OP in hexadecimal format.
7159 'x' Print the low 16 bits of CONST_INT OP in hexadecimal format.
7160 'd' Print CONST_INT OP in decimal.
7161 'm' Print one less than CONST_INT OP in decimal.
7162 'h' Print the high-part relocation associated with OP, after stripping
7163 any outermost HIGH.
7164 'R' Print the low-part relocation associated with OP.
7165 'C' Print the integer branch condition for comparison OP.
7166 'N' Print the inverse of the integer branch condition for comparison OP.
7167 'F' Print the FPU branch condition for comparison OP.
7168 'W' Print the inverse of the FPU branch condition for comparison OP.
7169 'T' Print 'f' for (eq:CC ...), 't' for (ne:CC ...),
7170 'z' for (eq:?I ...), 'n' for (ne:?I ...).
7171 't' Like 'T', but with the EQ/NE cases reversed
7172 'Y' Print mips_fp_conditions[INTVAL (OP)]
7173 'Z' Print OP and a comma for ISA_HAS_8CC, otherwise print nothing.
7174 'q' Print a DSP accumulator register.
7175 'D' Print the second part of a double-word register or memory operand.
7176 'L' Print the low-order register in a double-word register operand.
7177 'M' Print high-order register in a double-word register operand.
7178 'z' Print $0 if OP is zero, otherwise print OP normally. */
7179
7180 void
7181 mips_print_operand (FILE *file, rtx op, int letter)
7182 {
7183 enum rtx_code code;
7184
7185 if (PRINT_OPERAND_PUNCT_VALID_P (letter))
7186 {
7187 mips_print_operand_punctuation (file, letter);
7188 return;
7189 }
7190
7191 gcc_assert (op);
7192 code = GET_CODE (op);
7193
7194 switch (letter)
7195 {
7196 case 'X':
7197 if (GET_CODE (op) == CONST_INT)
7198 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op));
7199 else
7200 output_operand_lossage ("invalid use of '%%%c'", letter);
7201 break;
7202
7203 case 'x':
7204 if (GET_CODE (op) == CONST_INT)
7205 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op) & 0xffff);
7206 else
7207 output_operand_lossage ("invalid use of '%%%c'", letter);
7208 break;
7209
7210 case 'd':
7211 if (GET_CODE (op) == CONST_INT)
7212 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op));
7213 else
7214 output_operand_lossage ("invalid use of '%%%c'", letter);
7215 break;
7216
7217 case 'm':
7218 if (GET_CODE (op) == CONST_INT)
7219 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op) - 1);
7220 else
7221 output_operand_lossage ("invalid use of '%%%c'", letter);
7222 break;
7223
7224 case 'h':
7225 if (code == HIGH)
7226 op = XEXP (op, 0);
7227 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_hi_relocs);
7228 break;
7229
7230 case 'R':
7231 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_lo_relocs);
7232 break;
7233
7234 case 'C':
7235 mips_print_int_branch_condition (file, code, letter);
7236 break;
7237
7238 case 'N':
7239 mips_print_int_branch_condition (file, reverse_condition (code), letter);
7240 break;
7241
7242 case 'F':
7243 mips_print_float_branch_condition (file, code, letter);
7244 break;
7245
7246 case 'W':
7247 mips_print_float_branch_condition (file, reverse_condition (code),
7248 letter);
7249 break;
7250
7251 case 'T':
7252 case 't':
7253 {
7254 int truth = (code == NE) == (letter == 'T');
7255 fputc ("zfnt"[truth * 2 + (GET_MODE (op) == CCmode)], file);
7256 }
7257 break;
7258
7259 case 'Y':
7260 if (code == CONST_INT && UINTVAL (op) < ARRAY_SIZE (mips_fp_conditions))
7261 fputs (mips_fp_conditions[UINTVAL (op)], file);
7262 else
7263 output_operand_lossage ("'%%%c' is not a valid operand prefix",
7264 letter);
7265 break;
7266
7267 case 'Z':
7268 if (ISA_HAS_8CC)
7269 {
7270 mips_print_operand (file, op, 0);
7271 fputc (',', file);
7272 }
7273 break;
7274
7275 case 'q':
7276 if (code == REG && MD_REG_P (REGNO (op)))
7277 fprintf (file, "$ac0");
7278 else if (code == REG && DSP_ACC_REG_P (REGNO (op)))
7279 fprintf (file, "$ac%c", reg_names[REGNO (op)][3]);
7280 else
7281 output_operand_lossage ("invalid use of '%%%c'", letter);
7282 break;
7283
7284 default:
7285 switch (code)
7286 {
7287 case REG:
7288 {
7289 unsigned int regno = REGNO (op);
7290 if ((letter == 'M' && TARGET_LITTLE_ENDIAN)
7291 || (letter == 'L' && TARGET_BIG_ENDIAN)
7292 || letter == 'D')
7293 regno++;
7294 else if (letter && letter != 'z' && letter != 'M' && letter != 'L')
7295 output_operand_lossage ("invalid use of '%%%c'", letter);
7296 /* We need to print $0 .. $31 for COP0 registers. */
7297 if (COP0_REG_P (regno))
7298 fprintf (file, "$%s", &reg_names[regno][4]);
7299 else
7300 fprintf (file, "%s", reg_names[regno]);
7301 }
7302 break;
7303
7304 case MEM:
7305 if (letter == 'D')
7306 output_address (plus_constant (XEXP (op, 0), 4));
7307 else if (letter && letter != 'z')
7308 output_operand_lossage ("invalid use of '%%%c'", letter);
7309 else
7310 output_address (XEXP (op, 0));
7311 break;
7312
7313 default:
7314 if (letter == 'z' && op == CONST0_RTX (GET_MODE (op)))
7315 fputs (reg_names[GP_REG_FIRST], file);
7316 else if (letter && letter != 'z')
7317 output_operand_lossage ("invalid use of '%%%c'", letter);
7318 else if (CONST_GP_P (op))
7319 fputs (reg_names[GLOBAL_POINTER_REGNUM], file);
7320 else
7321 output_addr_const (file, mips_strip_unspec_address (op));
7322 break;
7323 }
7324 }
7325 }
7326
7327 /* Output address operand X to FILE. */
7328
7329 void
7330 mips_print_operand_address (FILE *file, rtx x)
7331 {
7332 struct mips_address_info addr;
7333
7334 if (mips_classify_address (&addr, x, word_mode, true))
7335 switch (addr.type)
7336 {
7337 case ADDRESS_REG:
7338 mips_print_operand (file, addr.offset, 0);
7339 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
7340 return;
7341
7342 case ADDRESS_LO_SUM:
7343 mips_print_operand_reloc (file, addr.offset, SYMBOL_CONTEXT_MEM,
7344 mips_lo_relocs);
7345 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
7346 return;
7347
7348 case ADDRESS_CONST_INT:
7349 output_addr_const (file, x);
7350 fprintf (file, "(%s)", reg_names[GP_REG_FIRST]);
7351 return;
7352
7353 case ADDRESS_SYMBOLIC:
7354 output_addr_const (file, mips_strip_unspec_address (x));
7355 return;
7356 }
7357 gcc_unreachable ();
7358 }
7359 \f
7360 /* Implement TARGET_ENCODE_SECTION_INFO. */
7361
7362 static void
7363 mips_encode_section_info (tree decl, rtx rtl, int first)
7364 {
7365 default_encode_section_info (decl, rtl, first);
7366
7367 if (TREE_CODE (decl) == FUNCTION_DECL)
7368 {
7369 rtx symbol = XEXP (rtl, 0);
7370 tree type = TREE_TYPE (decl);
7371
7372 /* Encode whether the symbol is short or long. */
7373 if ((TARGET_LONG_CALLS && !mips_near_type_p (type))
7374 || mips_far_type_p (type))
7375 SYMBOL_REF_FLAGS (symbol) |= SYMBOL_FLAG_LONG_CALL;
7376 }
7377 }
7378
7379 /* Implement TARGET_SELECT_RTX_SECTION. */
7380
7381 static section *
7382 mips_select_rtx_section (enum machine_mode mode, rtx x,
7383 unsigned HOST_WIDE_INT align)
7384 {
7385 /* ??? Consider using mergeable small data sections. */
7386 if (mips_rtx_constant_in_small_data_p (mode))
7387 return get_named_section (NULL, ".sdata", 0);
7388
7389 return default_elf_select_rtx_section (mode, x, align);
7390 }
7391
7392 /* Implement TARGET_ASM_FUNCTION_RODATA_SECTION.
7393
7394 The complication here is that, with the combination TARGET_ABICALLS
7395 && !TARGET_ABSOLUTE_ABICALLS && !TARGET_GPWORD, jump tables will use
7396 absolute addresses, and should therefore not be included in the
7397 read-only part of a DSO. Handle such cases by selecting a normal
7398 data section instead of a read-only one. The logic apes that in
7399 default_function_rodata_section. */
7400
7401 static section *
7402 mips_function_rodata_section (tree decl)
7403 {
7404 if (!TARGET_ABICALLS || TARGET_ABSOLUTE_ABICALLS || TARGET_GPWORD)
7405 return default_function_rodata_section (decl);
7406
7407 if (decl && DECL_SECTION_NAME (decl))
7408 {
7409 const char *name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl));
7410 if (DECL_ONE_ONLY (decl) && strncmp (name, ".gnu.linkonce.t.", 16) == 0)
7411 {
7412 char *rname = ASTRDUP (name);
7413 rname[14] = 'd';
7414 return get_section (rname, SECTION_LINKONCE | SECTION_WRITE, decl);
7415 }
7416 else if (flag_function_sections
7417 && flag_data_sections
7418 && strncmp (name, ".text.", 6) == 0)
7419 {
7420 char *rname = ASTRDUP (name);
7421 memcpy (rname + 1, "data", 4);
7422 return get_section (rname, SECTION_WRITE, decl);
7423 }
7424 }
7425 return data_section;
7426 }
7427
7428 /* Implement TARGET_IN_SMALL_DATA_P. */
7429
7430 static bool
7431 mips_in_small_data_p (const_tree decl)
7432 {
7433 unsigned HOST_WIDE_INT size;
7434
7435 if (TREE_CODE (decl) == STRING_CST || TREE_CODE (decl) == FUNCTION_DECL)
7436 return false;
7437
7438 /* We don't yet generate small-data references for -mabicalls
7439 or VxWorks RTP code. See the related -G handling in
7440 mips_override_options. */
7441 if (TARGET_ABICALLS || TARGET_VXWORKS_RTP)
7442 return false;
7443
7444 if (TREE_CODE (decl) == VAR_DECL && DECL_SECTION_NAME (decl) != 0)
7445 {
7446 const char *name;
7447
7448 /* Reject anything that isn't in a known small-data section. */
7449 name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl));
7450 if (strcmp (name, ".sdata") != 0 && strcmp (name, ".sbss") != 0)
7451 return false;
7452
7453 /* If a symbol is defined externally, the assembler will use the
7454 usual -G rules when deciding how to implement macros. */
7455 if (mips_lo_relocs[SYMBOL_GP_RELATIVE] || !DECL_EXTERNAL (decl))
7456 return true;
7457 }
7458 else if (TARGET_EMBEDDED_DATA)
7459 {
7460 /* Don't put constants into the small data section: we want them
7461 to be in ROM rather than RAM. */
7462 if (TREE_CODE (decl) != VAR_DECL)
7463 return false;
7464
7465 if (TREE_READONLY (decl)
7466 && !TREE_SIDE_EFFECTS (decl)
7467 && (!DECL_INITIAL (decl) || TREE_CONSTANT (DECL_INITIAL (decl))))
7468 return false;
7469 }
7470
7471 /* Enforce -mlocal-sdata. */
7472 if (!TARGET_LOCAL_SDATA && !TREE_PUBLIC (decl))
7473 return false;
7474
7475 /* Enforce -mextern-sdata. */
7476 if (!TARGET_EXTERN_SDATA && DECL_P (decl))
7477 {
7478 if (DECL_EXTERNAL (decl))
7479 return false;
7480 if (DECL_COMMON (decl) && DECL_INITIAL (decl) == NULL)
7481 return false;
7482 }
7483
7484 /* We have traditionally not treated zero-sized objects as small data,
7485 so this is now effectively part of the ABI. */
7486 size = int_size_in_bytes (TREE_TYPE (decl));
7487 return size > 0 && size <= mips_small_data_threshold;
7488 }
7489
7490 /* Implement TARGET_USE_ANCHORS_FOR_SYMBOL_P. We don't want to use
7491 anchors for small data: the GP register acts as an anchor in that
7492 case. We also don't want to use them for PC-relative accesses,
7493 where the PC acts as an anchor. */
7494
7495 static bool
7496 mips_use_anchors_for_symbol_p (const_rtx symbol)
7497 {
7498 switch (mips_classify_symbol (symbol, SYMBOL_CONTEXT_MEM))
7499 {
7500 case SYMBOL_PC_RELATIVE:
7501 case SYMBOL_GP_RELATIVE:
7502 return false;
7503
7504 default:
7505 return default_use_anchors_for_symbol_p (symbol);
7506 }
7507 }
7508 \f
7509 /* The MIPS debug format wants all automatic variables and arguments
7510 to be in terms of the virtual frame pointer (stack pointer before
7511 any adjustment in the function), while the MIPS 3.0 linker wants
7512 the frame pointer to be the stack pointer after the initial
7513 adjustment. So, we do the adjustment here. The arg pointer (which
7514 is eliminated) points to the virtual frame pointer, while the frame
7515 pointer (which may be eliminated) points to the stack pointer after
7516 the initial adjustments. */
7517
7518 HOST_WIDE_INT
7519 mips_debugger_offset (rtx addr, HOST_WIDE_INT offset)
7520 {
7521 rtx offset2 = const0_rtx;
7522 rtx reg = eliminate_constant_term (addr, &offset2);
7523
7524 if (offset == 0)
7525 offset = INTVAL (offset2);
7526
7527 if (reg == stack_pointer_rtx
7528 || reg == frame_pointer_rtx
7529 || reg == hard_frame_pointer_rtx)
7530 {
7531 offset -= cfun->machine->frame.total_size;
7532 if (reg == hard_frame_pointer_rtx)
7533 offset += cfun->machine->frame.hard_frame_pointer_offset;
7534 }
7535
7536 /* sdbout_parms does not want this to crash for unrecognized cases. */
7537 #if 0
7538 else if (reg != arg_pointer_rtx)
7539 fatal_insn ("mips_debugger_offset called with non stack/frame/arg pointer",
7540 addr);
7541 #endif
7542
7543 return offset;
7544 }
7545 \f
7546 /* Implement ASM_OUTPUT_EXTERNAL. */
7547
7548 void
7549 mips_output_external (FILE *file, tree decl, const char *name)
7550 {
7551 default_elf_asm_output_external (file, decl, name);
7552
7553 /* We output the name if and only if TREE_SYMBOL_REFERENCED is
7554 set in order to avoid putting out names that are never really
7555 used. */
7556 if (TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
7557 {
7558 if (!TARGET_EXPLICIT_RELOCS && mips_in_small_data_p (decl))
7559 {
7560 /* When using assembler macros, emit .extern directives for
7561 all small-data externs so that the assembler knows how
7562 big they are.
7563
7564 In most cases it would be safe (though pointless) to emit
7565 .externs for other symbols too. One exception is when an
7566 object is within the -G limit but declared by the user to
7567 be in a section other than .sbss or .sdata. */
7568 fputs ("\t.extern\t", file);
7569 assemble_name (file, name);
7570 fprintf (file, ", " HOST_WIDE_INT_PRINT_DEC "\n",
7571 int_size_in_bytes (TREE_TYPE (decl)));
7572 }
7573 else if (TARGET_IRIX
7574 && mips_abi == ABI_32
7575 && TREE_CODE (decl) == FUNCTION_DECL)
7576 {
7577 /* In IRIX 5 or IRIX 6 for the O32 ABI, we must output a
7578 `.global name .text' directive for every used but
7579 undefined function. If we don't, the linker may perform
7580 an optimization (skipping over the insns that set $gp)
7581 when it is unsafe. */
7582 fputs ("\t.globl ", file);
7583 assemble_name (file, name);
7584 fputs (" .text\n", file);
7585 }
7586 }
7587 }
7588
7589 /* Implement ASM_OUTPUT_SOURCE_FILENAME. */
7590
7591 void
7592 mips_output_filename (FILE *stream, const char *name)
7593 {
7594 /* If we are emitting DWARF-2, let dwarf2out handle the ".file"
7595 directives. */
7596 if (write_symbols == DWARF2_DEBUG)
7597 return;
7598 else if (mips_output_filename_first_time)
7599 {
7600 mips_output_filename_first_time = 0;
7601 num_source_filenames += 1;
7602 current_function_file = name;
7603 fprintf (stream, "\t.file\t%d ", num_source_filenames);
7604 output_quoted_string (stream, name);
7605 putc ('\n', stream);
7606 }
7607 /* If we are emitting stabs, let dbxout.c handle this (except for
7608 the mips_output_filename_first_time case). */
7609 else if (write_symbols == DBX_DEBUG)
7610 return;
7611 else if (name != current_function_file
7612 && strcmp (name, current_function_file) != 0)
7613 {
7614 num_source_filenames += 1;
7615 current_function_file = name;
7616 fprintf (stream, "\t.file\t%d ", num_source_filenames);
7617 output_quoted_string (stream, name);
7618 putc ('\n', stream);
7619 }
7620 }
7621
7622 /* Implement TARGET_ASM_OUTPUT_DWARF_DTPREL. */
7623
7624 static void ATTRIBUTE_UNUSED
7625 mips_output_dwarf_dtprel (FILE *file, int size, rtx x)
7626 {
7627 switch (size)
7628 {
7629 case 4:
7630 fputs ("\t.dtprelword\t", file);
7631 break;
7632
7633 case 8:
7634 fputs ("\t.dtpreldword\t", file);
7635 break;
7636
7637 default:
7638 gcc_unreachable ();
7639 }
7640 output_addr_const (file, x);
7641 fputs ("+0x8000", file);
7642 }
7643
7644 /* Implement TARGET_DWARF_REGISTER_SPAN. */
7645
7646 static rtx
7647 mips_dwarf_register_span (rtx reg)
7648 {
7649 rtx high, low;
7650 enum machine_mode mode;
7651
7652 /* By default, GCC maps increasing register numbers to increasing
7653 memory locations, but paired FPRs are always little-endian,
7654 regardless of the prevailing endianness. */
7655 mode = GET_MODE (reg);
7656 if (FP_REG_P (REGNO (reg))
7657 && TARGET_BIG_ENDIAN
7658 && MAX_FPRS_PER_FMT > 1
7659 && GET_MODE_SIZE (mode) > UNITS_PER_FPREG)
7660 {
7661 gcc_assert (GET_MODE_SIZE (mode) == UNITS_PER_HWFPVALUE);
7662 high = mips_subword (reg, true);
7663 low = mips_subword (reg, false);
7664 return gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, high, low));
7665 }
7666
7667 return NULL_RTX;
7668 }
7669
7670 /* Implement ASM_OUTPUT_ASCII. */
7671
7672 void
7673 mips_output_ascii (FILE *stream, const char *string, size_t len)
7674 {
7675 size_t i;
7676 int cur_pos;
7677
7678 cur_pos = 17;
7679 fprintf (stream, "\t.ascii\t\"");
7680 for (i = 0; i < len; i++)
7681 {
7682 int c;
7683
7684 c = (unsigned char) string[i];
7685 if (ISPRINT (c))
7686 {
7687 if (c == '\\' || c == '\"')
7688 {
7689 putc ('\\', stream);
7690 cur_pos++;
7691 }
7692 putc (c, stream);
7693 cur_pos++;
7694 }
7695 else
7696 {
7697 fprintf (stream, "\\%03o", c);
7698 cur_pos += 4;
7699 }
7700
7701 if (cur_pos > 72 && i+1 < len)
7702 {
7703 cur_pos = 17;
7704 fprintf (stream, "\"\n\t.ascii\t\"");
7705 }
7706 }
7707 fprintf (stream, "\"\n");
7708 }
7709
7710 /* Emit either a label, .comm, or .lcomm directive. When using assembler
7711 macros, mark the symbol as written so that mips_asm_output_external
7712 won't emit an .extern for it. STREAM is the output file, NAME is the
7713 name of the symbol, INIT_STRING is the string that should be written
7714 before the symbol and FINAL_STRING is the string that should be
7715 written after it. FINAL_STRING is a printf format that consumes the
7716 remaining arguments. */
7717
7718 void
7719 mips_declare_object (FILE *stream, const char *name, const char *init_string,
7720 const char *final_string, ...)
7721 {
7722 va_list ap;
7723
7724 fputs (init_string, stream);
7725 assemble_name (stream, name);
7726 va_start (ap, final_string);
7727 vfprintf (stream, final_string, ap);
7728 va_end (ap);
7729
7730 if (!TARGET_EXPLICIT_RELOCS)
7731 {
7732 tree name_tree = get_identifier (name);
7733 TREE_ASM_WRITTEN (name_tree) = 1;
7734 }
7735 }
7736
7737 /* Declare a common object of SIZE bytes using asm directive INIT_STRING.
7738 NAME is the name of the object and ALIGN is the required alignment
7739 in bytes. TAKES_ALIGNMENT_P is true if the directive takes a third
7740 alignment argument. */
7741
7742 void
7743 mips_declare_common_object (FILE *stream, const char *name,
7744 const char *init_string,
7745 unsigned HOST_WIDE_INT size,
7746 unsigned int align, bool takes_alignment_p)
7747 {
7748 if (!takes_alignment_p)
7749 {
7750 size += (align / BITS_PER_UNIT) - 1;
7751 size -= size % (align / BITS_PER_UNIT);
7752 mips_declare_object (stream, name, init_string,
7753 "," HOST_WIDE_INT_PRINT_UNSIGNED "\n", size);
7754 }
7755 else
7756 mips_declare_object (stream, name, init_string,
7757 "," HOST_WIDE_INT_PRINT_UNSIGNED ",%u\n",
7758 size, align / BITS_PER_UNIT);
7759 }
7760
7761 /* Implement ASM_OUTPUT_ALIGNED_DECL_COMMON. This is usually the same as the
7762 elfos.h version, but we also need to handle -muninit-const-in-rodata. */
7763
7764 void
7765 mips_output_aligned_decl_common (FILE *stream, tree decl, const char *name,
7766 unsigned HOST_WIDE_INT size,
7767 unsigned int align)
7768 {
7769 /* If the target wants uninitialized const declarations in
7770 .rdata then don't put them in .comm. */
7771 if (TARGET_EMBEDDED_DATA
7772 && TARGET_UNINIT_CONST_IN_RODATA
7773 && TREE_CODE (decl) == VAR_DECL
7774 && TREE_READONLY (decl)
7775 && (DECL_INITIAL (decl) == 0 || DECL_INITIAL (decl) == error_mark_node))
7776 {
7777 if (TREE_PUBLIC (decl) && DECL_NAME (decl))
7778 targetm.asm_out.globalize_label (stream, name);
7779
7780 switch_to_section (readonly_data_section);
7781 ASM_OUTPUT_ALIGN (stream, floor_log2 (align / BITS_PER_UNIT));
7782 mips_declare_object (stream, name, "",
7783 ":\n\t.space\t" HOST_WIDE_INT_PRINT_UNSIGNED "\n",
7784 size);
7785 }
7786 else
7787 mips_declare_common_object (stream, name, "\n\t.comm\t",
7788 size, align, true);
7789 }
7790
7791 #ifdef ASM_OUTPUT_SIZE_DIRECTIVE
7792 extern int size_directive_output;
7793
7794 /* Implement ASM_DECLARE_OBJECT_NAME. This is like most of the standard ELF
7795 definitions except that it uses mips_declare_object to emit the label. */
7796
7797 void
7798 mips_declare_object_name (FILE *stream, const char *name,
7799 tree decl ATTRIBUTE_UNUSED)
7800 {
7801 #ifdef ASM_OUTPUT_TYPE_DIRECTIVE
7802 ASM_OUTPUT_TYPE_DIRECTIVE (stream, name, "object");
7803 #endif
7804
7805 size_directive_output = 0;
7806 if (!flag_inhibit_size_directive && DECL_SIZE (decl))
7807 {
7808 HOST_WIDE_INT size;
7809
7810 size_directive_output = 1;
7811 size = int_size_in_bytes (TREE_TYPE (decl));
7812 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
7813 }
7814
7815 mips_declare_object (stream, name, "", ":\n");
7816 }
7817
7818 /* Implement ASM_FINISH_DECLARE_OBJECT. This is generic ELF stuff. */
7819
7820 void
7821 mips_finish_declare_object (FILE *stream, tree decl, int top_level, int at_end)
7822 {
7823 const char *name;
7824
7825 name = XSTR (XEXP (DECL_RTL (decl), 0), 0);
7826 if (!flag_inhibit_size_directive
7827 && DECL_SIZE (decl) != 0
7828 && !at_end
7829 && top_level
7830 && DECL_INITIAL (decl) == error_mark_node
7831 && !size_directive_output)
7832 {
7833 HOST_WIDE_INT size;
7834
7835 size_directive_output = 1;
7836 size = int_size_in_bytes (TREE_TYPE (decl));
7837 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
7838 }
7839 }
7840 #endif
7841 \f
7842 /* Return the FOO in the name of the ".mdebug.FOO" section associated
7843 with the current ABI. */
7844
7845 static const char *
7846 mips_mdebug_abi_name (void)
7847 {
7848 switch (mips_abi)
7849 {
7850 case ABI_32:
7851 return "abi32";
7852 case ABI_O64:
7853 return "abiO64";
7854 case ABI_N32:
7855 return "abiN32";
7856 case ABI_64:
7857 return "abi64";
7858 case ABI_EABI:
7859 return TARGET_64BIT ? "eabi64" : "eabi32";
7860 default:
7861 gcc_unreachable ();
7862 }
7863 }
7864
7865 /* Implement TARGET_ASM_FILE_START. */
7866
7867 static void
7868 mips_file_start (void)
7869 {
7870 default_file_start ();
7871
7872 /* Generate a special section to describe the ABI switches used to
7873 produce the resultant binary. This is unnecessary on IRIX and
7874 causes unwanted warnings from the native linker. */
7875 if (!TARGET_IRIX)
7876 {
7877 /* Record the ABI itself. Modern versions of binutils encode
7878 this information in the ELF header flags, but GDB needs the
7879 information in order to correctly debug binaries produced by
7880 older binutils. See the function mips_gdbarch_init in
7881 gdb/mips-tdep.c. */
7882 fprintf (asm_out_file, "\t.section .mdebug.%s\n\t.previous\n",
7883 mips_mdebug_abi_name ());
7884
7885 /* There is no ELF header flag to distinguish long32 forms of the
7886 EABI from long64 forms. Emit a special section to help tools
7887 such as GDB. Do the same for o64, which is sometimes used with
7888 -mlong64. */
7889 if (mips_abi == ABI_EABI || mips_abi == ABI_O64)
7890 fprintf (asm_out_file, "\t.section .gcc_compiled_long%d\n"
7891 "\t.previous\n", TARGET_LONG64 ? 64 : 32);
7892
7893 #ifdef HAVE_AS_GNU_ATTRIBUTE
7894 fprintf (asm_out_file, "\t.gnu_attribute 4, %d\n",
7895 (TARGET_HARD_FLOAT_ABI
7896 ? (TARGET_DOUBLE_FLOAT
7897 ? ((!TARGET_64BIT && TARGET_FLOAT64) ? 4 : 1) : 2) : 3));
7898 #endif
7899 }
7900
7901 /* If TARGET_ABICALLS, tell GAS to generate -KPIC code. */
7902 if (TARGET_ABICALLS)
7903 {
7904 fprintf (asm_out_file, "\t.abicalls\n");
7905 if (TARGET_ABICALLS_PIC0)
7906 fprintf (asm_out_file, "\t.option\tpic0\n");
7907 }
7908
7909 if (flag_verbose_asm)
7910 fprintf (asm_out_file, "\n%s -G value = %d, Arch = %s, ISA = %d\n",
7911 ASM_COMMENT_START,
7912 mips_small_data_threshold, mips_arch_info->name, mips_isa);
7913 }
7914 \f
7915 /* Make the last instruction frame-related and note that it performs
7916 the operation described by FRAME_PATTERN. */
7917
7918 static void
7919 mips_set_frame_expr (rtx frame_pattern)
7920 {
7921 rtx insn;
7922
7923 insn = get_last_insn ();
7924 RTX_FRAME_RELATED_P (insn) = 1;
7925 REG_NOTES (insn) = alloc_EXPR_LIST (REG_FRAME_RELATED_EXPR,
7926 frame_pattern,
7927 REG_NOTES (insn));
7928 }
7929
7930 /* Return a frame-related rtx that stores REG at MEM.
7931 REG must be a single register. */
7932
7933 static rtx
7934 mips_frame_set (rtx mem, rtx reg)
7935 {
7936 rtx set;
7937
7938 /* If we're saving the return address register and the DWARF return
7939 address column differs from the hard register number, adjust the
7940 note reg to refer to the former. */
7941 if (REGNO (reg) == GP_REG_FIRST + 31
7942 && DWARF_FRAME_RETURN_COLUMN != GP_REG_FIRST + 31)
7943 reg = gen_rtx_REG (GET_MODE (reg), DWARF_FRAME_RETURN_COLUMN);
7944
7945 set = gen_rtx_SET (VOIDmode, mem, reg);
7946 RTX_FRAME_RELATED_P (set) = 1;
7947
7948 return set;
7949 }
7950 \f
7951 /* If a MIPS16e SAVE or RESTORE instruction saves or restores register
7952 mips16e_s2_s8_regs[X], it must also save the registers in indexes
7953 X + 1 onwards. Likewise mips16e_a0_a3_regs. */
7954 static const unsigned char mips16e_s2_s8_regs[] = {
7955 30, 23, 22, 21, 20, 19, 18
7956 };
7957 static const unsigned char mips16e_a0_a3_regs[] = {
7958 4, 5, 6, 7
7959 };
7960
7961 /* A list of the registers that can be saved by the MIPS16e SAVE instruction,
7962 ordered from the uppermost in memory to the lowest in memory. */
7963 static const unsigned char mips16e_save_restore_regs[] = {
7964 31, 30, 23, 22, 21, 20, 19, 18, 17, 16, 7, 6, 5, 4
7965 };
7966
7967 /* Return the index of the lowest X in the range [0, SIZE) for which
7968 bit REGS[X] is set in MASK. Return SIZE if there is no such X. */
7969
7970 static unsigned int
7971 mips16e_find_first_register (unsigned int mask, const unsigned char *regs,
7972 unsigned int size)
7973 {
7974 unsigned int i;
7975
7976 for (i = 0; i < size; i++)
7977 if (BITSET_P (mask, regs[i]))
7978 break;
7979
7980 return i;
7981 }
7982
7983 /* *MASK_PTR is a mask of general-purpose registers and *NUM_REGS_PTR
7984 is the number of set bits. If *MASK_PTR contains REGS[X] for some X
7985 in [0, SIZE), adjust *MASK_PTR and *NUM_REGS_PTR so that the same
7986 is true for all indexes (X, SIZE). */
7987
7988 static void
7989 mips16e_mask_registers (unsigned int *mask_ptr, const unsigned char *regs,
7990 unsigned int size, unsigned int *num_regs_ptr)
7991 {
7992 unsigned int i;
7993
7994 i = mips16e_find_first_register (*mask_ptr, regs, size);
7995 for (i++; i < size; i++)
7996 if (!BITSET_P (*mask_ptr, regs[i]))
7997 {
7998 *num_regs_ptr += 1;
7999 *mask_ptr |= 1 << regs[i];
8000 }
8001 }
8002
8003 /* Return a simplified form of X using the register values in REG_VALUES.
8004 REG_VALUES[R] is the last value assigned to hard register R, or null
8005 if R has not been modified.
8006
8007 This function is rather limited, but is good enough for our purposes. */
8008
8009 static rtx
8010 mips16e_collect_propagate_value (rtx x, rtx *reg_values)
8011 {
8012 x = avoid_constant_pool_reference (x);
8013
8014 if (UNARY_P (x))
8015 {
8016 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
8017 return simplify_gen_unary (GET_CODE (x), GET_MODE (x),
8018 x0, GET_MODE (XEXP (x, 0)));
8019 }
8020
8021 if (ARITHMETIC_P (x))
8022 {
8023 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
8024 rtx x1 = mips16e_collect_propagate_value (XEXP (x, 1), reg_values);
8025 return simplify_gen_binary (GET_CODE (x), GET_MODE (x), x0, x1);
8026 }
8027
8028 if (REG_P (x)
8029 && reg_values[REGNO (x)]
8030 && !rtx_unstable_p (reg_values[REGNO (x)]))
8031 return reg_values[REGNO (x)];
8032
8033 return x;
8034 }
8035
8036 /* Return true if (set DEST SRC) stores an argument register into its
8037 caller-allocated save slot, storing the number of that argument
8038 register in *REGNO_PTR if so. REG_VALUES is as for
8039 mips16e_collect_propagate_value. */
8040
8041 static bool
8042 mips16e_collect_argument_save_p (rtx dest, rtx src, rtx *reg_values,
8043 unsigned int *regno_ptr)
8044 {
8045 unsigned int argno, regno;
8046 HOST_WIDE_INT offset, required_offset;
8047 rtx addr, base;
8048
8049 /* Check that this is a word-mode store. */
8050 if (!MEM_P (dest) || !REG_P (src) || GET_MODE (dest) != word_mode)
8051 return false;
8052
8053 /* Check that the register being saved is an unmodified argument
8054 register. */
8055 regno = REGNO (src);
8056 if (!IN_RANGE (regno, GP_ARG_FIRST, GP_ARG_LAST) || reg_values[regno])
8057 return false;
8058 argno = regno - GP_ARG_FIRST;
8059
8060 /* Check whether the address is an appropriate stack-pointer or
8061 frame-pointer access. */
8062 addr = mips16e_collect_propagate_value (XEXP (dest, 0), reg_values);
8063 mips_split_plus (addr, &base, &offset);
8064 required_offset = cfun->machine->frame.total_size + argno * UNITS_PER_WORD;
8065 if (base == hard_frame_pointer_rtx)
8066 required_offset -= cfun->machine->frame.hard_frame_pointer_offset;
8067 else if (base != stack_pointer_rtx)
8068 return false;
8069 if (offset != required_offset)
8070 return false;
8071
8072 *regno_ptr = regno;
8073 return true;
8074 }
8075
8076 /* A subroutine of mips_expand_prologue, called only when generating
8077 MIPS16e SAVE instructions. Search the start of the function for any
8078 instructions that save argument registers into their caller-allocated
8079 save slots. Delete such instructions and return a value N such that
8080 saving [GP_ARG_FIRST, GP_ARG_FIRST + N) would make all the deleted
8081 instructions redundant. */
8082
8083 static unsigned int
8084 mips16e_collect_argument_saves (void)
8085 {
8086 rtx reg_values[FIRST_PSEUDO_REGISTER];
8087 rtx insn, next, set, dest, src;
8088 unsigned int nargs, regno;
8089
8090 push_topmost_sequence ();
8091 nargs = 0;
8092 memset (reg_values, 0, sizeof (reg_values));
8093 for (insn = get_insns (); insn; insn = next)
8094 {
8095 next = NEXT_INSN (insn);
8096 if (NOTE_P (insn))
8097 continue;
8098
8099 if (!INSN_P (insn))
8100 break;
8101
8102 set = PATTERN (insn);
8103 if (GET_CODE (set) != SET)
8104 break;
8105
8106 dest = SET_DEST (set);
8107 src = SET_SRC (set);
8108 if (mips16e_collect_argument_save_p (dest, src, reg_values, &regno))
8109 {
8110 if (!BITSET_P (cfun->machine->frame.mask, regno))
8111 {
8112 delete_insn (insn);
8113 nargs = MAX (nargs, (regno - GP_ARG_FIRST) + 1);
8114 }
8115 }
8116 else if (REG_P (dest) && GET_MODE (dest) == word_mode)
8117 reg_values[REGNO (dest)]
8118 = mips16e_collect_propagate_value (src, reg_values);
8119 else
8120 break;
8121 }
8122 pop_topmost_sequence ();
8123
8124 return nargs;
8125 }
8126
8127 /* Return a move between register REGNO and memory location SP + OFFSET.
8128 Make the move a load if RESTORE_P, otherwise make it a frame-related
8129 store. */
8130
8131 static rtx
8132 mips16e_save_restore_reg (bool restore_p, HOST_WIDE_INT offset,
8133 unsigned int regno)
8134 {
8135 rtx reg, mem;
8136
8137 mem = gen_frame_mem (SImode, plus_constant (stack_pointer_rtx, offset));
8138 reg = gen_rtx_REG (SImode, regno);
8139 return (restore_p
8140 ? gen_rtx_SET (VOIDmode, reg, mem)
8141 : mips_frame_set (mem, reg));
8142 }
8143
8144 /* Return RTL for a MIPS16e SAVE or RESTORE instruction; RESTORE_P says which.
8145 The instruction must:
8146
8147 - Allocate or deallocate SIZE bytes in total; SIZE is known
8148 to be nonzero.
8149
8150 - Save or restore as many registers in *MASK_PTR as possible.
8151 The instruction saves the first registers at the top of the
8152 allocated area, with the other registers below it.
8153
8154 - Save NARGS argument registers above the allocated area.
8155
8156 (NARGS is always zero if RESTORE_P.)
8157
8158 The SAVE and RESTORE instructions cannot save and restore all general
8159 registers, so there may be some registers left over for the caller to
8160 handle. Destructively modify *MASK_PTR so that it contains the registers
8161 that still need to be saved or restored. The caller can save these
8162 registers in the memory immediately below *OFFSET_PTR, which is a
8163 byte offset from the bottom of the allocated stack area. */
8164
8165 static rtx
8166 mips16e_build_save_restore (bool restore_p, unsigned int *mask_ptr,
8167 HOST_WIDE_INT *offset_ptr, unsigned int nargs,
8168 HOST_WIDE_INT size)
8169 {
8170 rtx pattern, set;
8171 HOST_WIDE_INT offset, top_offset;
8172 unsigned int i, regno;
8173 int n;
8174
8175 gcc_assert (cfun->machine->frame.num_fp == 0);
8176
8177 /* Calculate the number of elements in the PARALLEL. We need one element
8178 for the stack adjustment, one for each argument register save, and one
8179 for each additional register move. */
8180 n = 1 + nargs;
8181 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
8182 if (BITSET_P (*mask_ptr, mips16e_save_restore_regs[i]))
8183 n++;
8184
8185 /* Create the final PARALLEL. */
8186 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (n));
8187 n = 0;
8188
8189 /* Add the stack pointer adjustment. */
8190 set = gen_rtx_SET (VOIDmode, stack_pointer_rtx,
8191 plus_constant (stack_pointer_rtx,
8192 restore_p ? size : -size));
8193 RTX_FRAME_RELATED_P (set) = 1;
8194 XVECEXP (pattern, 0, n++) = set;
8195
8196 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
8197 top_offset = restore_p ? size : 0;
8198
8199 /* Save the arguments. */
8200 for (i = 0; i < nargs; i++)
8201 {
8202 offset = top_offset + i * UNITS_PER_WORD;
8203 set = mips16e_save_restore_reg (restore_p, offset, GP_ARG_FIRST + i);
8204 XVECEXP (pattern, 0, n++) = set;
8205 }
8206
8207 /* Then fill in the other register moves. */
8208 offset = top_offset;
8209 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
8210 {
8211 regno = mips16e_save_restore_regs[i];
8212 if (BITSET_P (*mask_ptr, regno))
8213 {
8214 offset -= UNITS_PER_WORD;
8215 set = mips16e_save_restore_reg (restore_p, offset, regno);
8216 XVECEXP (pattern, 0, n++) = set;
8217 *mask_ptr &= ~(1 << regno);
8218 }
8219 }
8220
8221 /* Tell the caller what offset it should use for the remaining registers. */
8222 *offset_ptr = size + (offset - top_offset);
8223
8224 gcc_assert (n == XVECLEN (pattern, 0));
8225
8226 return pattern;
8227 }
8228
8229 /* PATTERN is a PARALLEL whose first element adds ADJUST to the stack
8230 pointer. Return true if PATTERN matches the kind of instruction
8231 generated by mips16e_build_save_restore. If INFO is nonnull,
8232 initialize it when returning true. */
8233
8234 bool
8235 mips16e_save_restore_pattern_p (rtx pattern, HOST_WIDE_INT adjust,
8236 struct mips16e_save_restore_info *info)
8237 {
8238 unsigned int i, nargs, mask, extra;
8239 HOST_WIDE_INT top_offset, save_offset, offset;
8240 rtx set, reg, mem, base;
8241 int n;
8242
8243 if (!GENERATE_MIPS16E_SAVE_RESTORE)
8244 return false;
8245
8246 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
8247 top_offset = adjust > 0 ? adjust : 0;
8248
8249 /* Interpret all other members of the PARALLEL. */
8250 save_offset = top_offset - UNITS_PER_WORD;
8251 mask = 0;
8252 nargs = 0;
8253 i = 0;
8254 for (n = 1; n < XVECLEN (pattern, 0); n++)
8255 {
8256 /* Check that we have a SET. */
8257 set = XVECEXP (pattern, 0, n);
8258 if (GET_CODE (set) != SET)
8259 return false;
8260
8261 /* Check that the SET is a load (if restoring) or a store
8262 (if saving). */
8263 mem = adjust > 0 ? SET_SRC (set) : SET_DEST (set);
8264 if (!MEM_P (mem))
8265 return false;
8266
8267 /* Check that the address is the sum of the stack pointer and a
8268 possibly-zero constant offset. */
8269 mips_split_plus (XEXP (mem, 0), &base, &offset);
8270 if (base != stack_pointer_rtx)
8271 return false;
8272
8273 /* Check that SET's other operand is a register. */
8274 reg = adjust > 0 ? SET_DEST (set) : SET_SRC (set);
8275 if (!REG_P (reg))
8276 return false;
8277
8278 /* Check for argument saves. */
8279 if (offset == top_offset + nargs * UNITS_PER_WORD
8280 && REGNO (reg) == GP_ARG_FIRST + nargs)
8281 nargs++;
8282 else if (offset == save_offset)
8283 {
8284 while (mips16e_save_restore_regs[i++] != REGNO (reg))
8285 if (i == ARRAY_SIZE (mips16e_save_restore_regs))
8286 return false;
8287
8288 mask |= 1 << REGNO (reg);
8289 save_offset -= UNITS_PER_WORD;
8290 }
8291 else
8292 return false;
8293 }
8294
8295 /* Check that the restrictions on register ranges are met. */
8296 extra = 0;
8297 mips16e_mask_registers (&mask, mips16e_s2_s8_regs,
8298 ARRAY_SIZE (mips16e_s2_s8_regs), &extra);
8299 mips16e_mask_registers (&mask, mips16e_a0_a3_regs,
8300 ARRAY_SIZE (mips16e_a0_a3_regs), &extra);
8301 if (extra != 0)
8302 return false;
8303
8304 /* Make sure that the topmost argument register is not saved twice.
8305 The checks above ensure that the same is then true for the other
8306 argument registers. */
8307 if (nargs > 0 && BITSET_P (mask, GP_ARG_FIRST + nargs - 1))
8308 return false;
8309
8310 /* Pass back information, if requested. */
8311 if (info)
8312 {
8313 info->nargs = nargs;
8314 info->mask = mask;
8315 info->size = (adjust > 0 ? adjust : -adjust);
8316 }
8317
8318 return true;
8319 }
8320
8321 /* Add a MIPS16e SAVE or RESTORE register-range argument to string S
8322 for the register range [MIN_REG, MAX_REG]. Return a pointer to
8323 the null terminator. */
8324
8325 static char *
8326 mips16e_add_register_range (char *s, unsigned int min_reg,
8327 unsigned int max_reg)
8328 {
8329 if (min_reg != max_reg)
8330 s += sprintf (s, ",%s-%s", reg_names[min_reg], reg_names[max_reg]);
8331 else
8332 s += sprintf (s, ",%s", reg_names[min_reg]);
8333 return s;
8334 }
8335
8336 /* Return the assembly instruction for a MIPS16e SAVE or RESTORE instruction.
8337 PATTERN and ADJUST are as for mips16e_save_restore_pattern_p. */
8338
8339 const char *
8340 mips16e_output_save_restore (rtx pattern, HOST_WIDE_INT adjust)
8341 {
8342 static char buffer[300];
8343
8344 struct mips16e_save_restore_info info;
8345 unsigned int i, end;
8346 char *s;
8347
8348 /* Parse the pattern. */
8349 if (!mips16e_save_restore_pattern_p (pattern, adjust, &info))
8350 gcc_unreachable ();
8351
8352 /* Add the mnemonic. */
8353 s = strcpy (buffer, adjust > 0 ? "restore\t" : "save\t");
8354 s += strlen (s);
8355
8356 /* Save the arguments. */
8357 if (info.nargs > 1)
8358 s += sprintf (s, "%s-%s,", reg_names[GP_ARG_FIRST],
8359 reg_names[GP_ARG_FIRST + info.nargs - 1]);
8360 else if (info.nargs == 1)
8361 s += sprintf (s, "%s,", reg_names[GP_ARG_FIRST]);
8362
8363 /* Emit the amount of stack space to allocate or deallocate. */
8364 s += sprintf (s, "%d", (int) info.size);
8365
8366 /* Save or restore $16. */
8367 if (BITSET_P (info.mask, 16))
8368 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 16]);
8369
8370 /* Save or restore $17. */
8371 if (BITSET_P (info.mask, 17))
8372 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 17]);
8373
8374 /* Save or restore registers in the range $s2...$s8, which
8375 mips16e_s2_s8_regs lists in decreasing order. Note that this
8376 is a software register range; the hardware registers are not
8377 numbered consecutively. */
8378 end = ARRAY_SIZE (mips16e_s2_s8_regs);
8379 i = mips16e_find_first_register (info.mask, mips16e_s2_s8_regs, end);
8380 if (i < end)
8381 s = mips16e_add_register_range (s, mips16e_s2_s8_regs[end - 1],
8382 mips16e_s2_s8_regs[i]);
8383
8384 /* Save or restore registers in the range $a0...$a3. */
8385 end = ARRAY_SIZE (mips16e_a0_a3_regs);
8386 i = mips16e_find_first_register (info.mask, mips16e_a0_a3_regs, end);
8387 if (i < end)
8388 s = mips16e_add_register_range (s, mips16e_a0_a3_regs[i],
8389 mips16e_a0_a3_regs[end - 1]);
8390
8391 /* Save or restore $31. */
8392 if (BITSET_P (info.mask, 31))
8393 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 31]);
8394
8395 return buffer;
8396 }
8397 \f
8398 /* Return true if the current function has an insn that implicitly
8399 refers to $gp. */
8400
8401 static bool
8402 mips_function_has_gp_insn (void)
8403 {
8404 /* Don't bother rechecking if we found one last time. */
8405 if (!cfun->machine->has_gp_insn_p)
8406 {
8407 rtx insn;
8408
8409 push_topmost_sequence ();
8410 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
8411 if (USEFUL_INSN_P (insn)
8412 && (get_attr_got (insn) != GOT_UNSET
8413 || mips_small_data_pattern_p (PATTERN (insn))))
8414 {
8415 cfun->machine->has_gp_insn_p = true;
8416 break;
8417 }
8418 pop_topmost_sequence ();
8419 }
8420 return cfun->machine->has_gp_insn_p;
8421 }
8422
8423 /* Return true if the current function returns its value in a floating-point
8424 register in MIPS16 mode. */
8425
8426 static bool
8427 mips16_cfun_returns_in_fpr_p (void)
8428 {
8429 tree return_type = DECL_RESULT (current_function_decl);
8430 return (TARGET_MIPS16
8431 && TARGET_HARD_FLOAT_ABI
8432 && !aggregate_value_p (return_type, current_function_decl)
8433 && mips_return_mode_in_fpr_p (DECL_MODE (return_type)));
8434 }
8435
8436 /* Return the register that should be used as the global pointer
8437 within this function. Return INVALID_REGNUM if the function
8438 doesn't need a global pointer. */
8439
8440 static unsigned int
8441 mips_global_pointer (void)
8442 {
8443 unsigned int regno;
8444
8445 /* $gp is always available unless we're using a GOT. */
8446 if (!TARGET_USE_GOT)
8447 return GLOBAL_POINTER_REGNUM;
8448
8449 /* We must always provide $gp when it is used implicitly. */
8450 if (!TARGET_EXPLICIT_RELOCS)
8451 return GLOBAL_POINTER_REGNUM;
8452
8453 /* FUNCTION_PROFILER includes a jal macro, so we need to give it
8454 a valid gp. */
8455 if (crtl->profile)
8456 return GLOBAL_POINTER_REGNUM;
8457
8458 /* If the function has a nonlocal goto, $gp must hold the correct
8459 global pointer for the target function. */
8460 if (crtl->has_nonlocal_goto)
8461 return GLOBAL_POINTER_REGNUM;
8462
8463 /* There's no need to initialize $gp if it isn't referenced now,
8464 and if we can be sure that no new references will be added during
8465 or after reload. */
8466 if (!df_regs_ever_live_p (GLOBAL_POINTER_REGNUM)
8467 && !mips_function_has_gp_insn ())
8468 {
8469 /* The function doesn't use $gp at the moment. If we're generating
8470 -call_nonpic code, no new uses will be introduced during or after
8471 reload. */
8472 if (TARGET_ABICALLS_PIC0)
8473 return INVALID_REGNUM;
8474
8475 /* We need to handle the following implicit gp references:
8476
8477 - Reload can sometimes introduce constant pool references
8478 into a function that otherwise didn't need them. For example,
8479 suppose we have an instruction like:
8480
8481 (set (reg:DF R1) (float:DF (reg:SI R2)))
8482
8483 If R2 turns out to be constant such as 1, the instruction may
8484 have a REG_EQUAL note saying that R1 == 1.0. Reload then has
8485 the option of using this constant if R2 doesn't get allocated
8486 to a register.
8487
8488 In cases like these, reload will have added the constant to the
8489 pool but no instruction will yet refer to it.
8490
8491 - MIPS16 functions that return in FPRs need to call an
8492 external libgcc routine. */
8493 if (!crtl->uses_const_pool
8494 && !mips16_cfun_returns_in_fpr_p ())
8495 return INVALID_REGNUM;
8496 }
8497
8498 /* We need a global pointer, but perhaps we can use a call-clobbered
8499 register instead of $gp. */
8500 if (TARGET_CALL_SAVED_GP && current_function_is_leaf)
8501 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
8502 if (!df_regs_ever_live_p (regno)
8503 && call_really_used_regs[regno]
8504 && !fixed_regs[regno]
8505 && regno != PIC_FUNCTION_ADDR_REGNUM)
8506 return regno;
8507
8508 return GLOBAL_POINTER_REGNUM;
8509 }
8510
8511 /* Return true if REGNO is a register that is ordinarily call-clobbered
8512 but must nevertheless be preserved by an interrupt handler. */
8513
8514 static bool
8515 mips_interrupt_extra_call_saved_reg_p (unsigned int regno)
8516 {
8517 if (MD_REG_P (regno))
8518 return true;
8519
8520 if (TARGET_DSP && DSP_ACC_REG_P (regno))
8521 return true;
8522
8523 if (GP_REG_P (regno) && !cfun->machine->use_shadow_register_set_p)
8524 {
8525 /* $0 is hard-wired. */
8526 if (regno == GP_REG_FIRST)
8527 return false;
8528
8529 /* The interrupt handler can treat kernel registers as
8530 scratch registers. */
8531 if (KERNEL_REG_P (regno))
8532 return false;
8533
8534 /* The function will return the stack pointer to its original value
8535 anyway. */
8536 if (regno == STACK_POINTER_REGNUM)
8537 return false;
8538
8539 /* Otherwise, return true for registers that aren't ordinarily
8540 call-clobbered. */
8541 return call_really_used_regs[regno];
8542 }
8543
8544 return false;
8545 }
8546
8547 /* Return true if the current function should treat register REGNO
8548 as call-saved. */
8549
8550 static bool
8551 mips_cfun_call_saved_reg_p (unsigned int regno)
8552 {
8553 /* Interrupt handlers need to save extra registers. */
8554 if (cfun->machine->interrupt_handler_p
8555 && mips_interrupt_extra_call_saved_reg_p (regno))
8556 return true;
8557
8558 /* call_insns preserve $28 unless they explicitly say otherwise,
8559 so call_really_used_regs[] treats $28 as call-saved. However,
8560 we want the ABI property rather than the default call_insn
8561 property here. */
8562 return (regno == GLOBAL_POINTER_REGNUM
8563 ? TARGET_CALL_SAVED_GP
8564 : !call_really_used_regs[regno]);
8565 }
8566
8567 /* Return true if the function body might clobber register REGNO.
8568 We know that REGNO is call-saved. */
8569
8570 static bool
8571 mips_cfun_might_clobber_call_saved_reg_p (unsigned int regno)
8572 {
8573 /* Some functions should be treated as clobbering all call-saved
8574 registers. */
8575 if (crtl->saves_all_registers)
8576 return true;
8577
8578 /* DF handles cases where a register is explicitly referenced in
8579 the rtl. Incoming values are passed in call-clobbered registers,
8580 so we can assume that any live call-saved register is set within
8581 the function. */
8582 if (df_regs_ever_live_p (regno))
8583 return true;
8584
8585 /* Check for registers that are clobbered by FUNCTION_PROFILER.
8586 These clobbers are not explicit in the rtl. */
8587 if (crtl->profile && MIPS_SAVE_REG_FOR_PROFILING_P (regno))
8588 return true;
8589
8590 /* If we're using a call-saved global pointer, the function's
8591 prologue will need to set it up. */
8592 if (cfun->machine->global_pointer == regno)
8593 return true;
8594
8595 /* The function's prologue will need to set the frame pointer if
8596 frame_pointer_needed. */
8597 if (regno == HARD_FRAME_POINTER_REGNUM && frame_pointer_needed)
8598 return true;
8599
8600 /* If a MIPS16 function returns a value in FPRs, its epilogue
8601 will need to call an external libgcc routine. This yet-to-be
8602 generated call_insn will clobber $31. */
8603 if (regno == GP_REG_FIRST + 31 && mips16_cfun_returns_in_fpr_p ())
8604 return true;
8605
8606 /* If REGNO is ordinarily call-clobbered, we must assume that any
8607 called function could modify it. */
8608 if (cfun->machine->interrupt_handler_p
8609 && !current_function_is_leaf
8610 && mips_interrupt_extra_call_saved_reg_p (regno))
8611 return true;
8612
8613 return false;
8614 }
8615
8616 /* Return true if the current function must save register REGNO. */
8617
8618 static bool
8619 mips_save_reg_p (unsigned int regno)
8620 {
8621 if (mips_cfun_call_saved_reg_p (regno))
8622 {
8623 if (mips_cfun_might_clobber_call_saved_reg_p (regno))
8624 return true;
8625
8626 /* Save both registers in an FPR pair if either one is used. This is
8627 needed for the case when MIN_FPRS_PER_FMT == 1, which allows the odd
8628 register to be used without the even register. */
8629 if (FP_REG_P (regno)
8630 && MAX_FPRS_PER_FMT == 2
8631 && mips_cfun_might_clobber_call_saved_reg_p (regno + 1))
8632 return true;
8633 }
8634
8635 /* We need to save the incoming return address if __builtin_eh_return
8636 is being used to set a different return address. */
8637 if (regno == GP_REG_FIRST + 31 && crtl->calls_eh_return)
8638 return true;
8639
8640 return false;
8641 }
8642
8643 /* Populate the current function's mips_frame_info structure.
8644
8645 MIPS stack frames look like:
8646
8647 +-------------------------------+
8648 | |
8649 | incoming stack arguments |
8650 | |
8651 +-------------------------------+
8652 | |
8653 | caller-allocated save area |
8654 A | for register arguments |
8655 | |
8656 +-------------------------------+ <-- incoming stack pointer
8657 | |
8658 | callee-allocated save area |
8659 B | for arguments that are |
8660 | split between registers and |
8661 | the stack |
8662 | |
8663 +-------------------------------+ <-- arg_pointer_rtx
8664 | |
8665 C | callee-allocated save area |
8666 | for register varargs |
8667 | |
8668 +-------------------------------+ <-- frame_pointer_rtx
8669 | | + cop0_sp_offset
8670 | COP0 reg save area | + UNITS_PER_WORD
8671 | |
8672 +-------------------------------+ <-- frame_pointer_rtx + acc_sp_offset
8673 | | + UNITS_PER_WORD
8674 | accumulator save area |
8675 | |
8676 +-------------------------------+ <-- stack_pointer_rtx + fp_sp_offset
8677 | | + UNITS_PER_HWFPVALUE
8678 | FPR save area |
8679 | |
8680 +-------------------------------+ <-- stack_pointer_rtx + gp_sp_offset
8681 | | + UNITS_PER_WORD
8682 | GPR save area |
8683 | |
8684 +-------------------------------+ <-- frame_pointer_rtx with
8685 | | \ -fstack-protector
8686 | local variables | | var_size
8687 | | /
8688 +-------------------------------+
8689 | | \
8690 | $gp save area | | cprestore_size
8691 | | /
8692 P +-------------------------------+ <-- hard_frame_pointer_rtx for
8693 | | \ MIPS16 code
8694 | outgoing stack arguments | |
8695 | | |
8696 +-------------------------------+ | args_size
8697 | | |
8698 | caller-allocated save area | |
8699 | for register arguments | |
8700 | | /
8701 +-------------------------------+ <-- stack_pointer_rtx
8702 frame_pointer_rtx without
8703 -fstack-protector
8704 hard_frame_pointer_rtx for
8705 non-MIPS16 code.
8706
8707 At least two of A, B and C will be empty.
8708
8709 Dynamic stack allocations such as alloca insert data at point P.
8710 They decrease stack_pointer_rtx but leave frame_pointer_rtx and
8711 hard_frame_pointer_rtx unchanged. */
8712
8713 static void
8714 mips_compute_frame_info (void)
8715 {
8716 struct mips_frame_info *frame;
8717 HOST_WIDE_INT offset, size;
8718 unsigned int regno, i;
8719
8720 /* Set this function's interrupt properties. */
8721 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
8722 {
8723 if (!ISA_MIPS32R2)
8724 error ("the %<interrupt%> attribute requires a MIPS32r2 processor");
8725 else if (TARGET_HARD_FLOAT)
8726 error ("the %<interrupt%> attribute requires %<-msoft-float%>");
8727 else if (TARGET_MIPS16)
8728 error ("interrupt handlers cannot be MIPS16 functions");
8729 else
8730 {
8731 cfun->machine->interrupt_handler_p = true;
8732 cfun->machine->use_shadow_register_set_p =
8733 mips_use_shadow_register_set_p (TREE_TYPE (current_function_decl));
8734 cfun->machine->keep_interrupts_masked_p =
8735 mips_keep_interrupts_masked_p (TREE_TYPE (current_function_decl));
8736 cfun->machine->use_debug_exception_return_p =
8737 mips_use_debug_exception_return_p (TREE_TYPE
8738 (current_function_decl));
8739 }
8740 }
8741
8742 frame = &cfun->machine->frame;
8743 memset (frame, 0, sizeof (*frame));
8744 size = get_frame_size ();
8745
8746 cfun->machine->global_pointer = mips_global_pointer ();
8747
8748 /* The first two blocks contain the outgoing argument area and the $gp save
8749 slot. This area isn't needed in leaf functions, but if the
8750 target-independent frame size is nonzero, we have already committed to
8751 allocating these in STARTING_FRAME_OFFSET for !FRAME_GROWS_DOWNWARD. */
8752 if ((size == 0 || FRAME_GROWS_DOWNWARD) && current_function_is_leaf)
8753 {
8754 /* The MIPS 3.0 linker does not like functions that dynamically
8755 allocate the stack and have 0 for STACK_DYNAMIC_OFFSET, since it
8756 looks like we are trying to create a second frame pointer to the
8757 function, so allocate some stack space to make it happy. */
8758 if (cfun->calls_alloca)
8759 frame->args_size = REG_PARM_STACK_SPACE (cfun->decl);
8760 else
8761 frame->args_size = 0;
8762 frame->cprestore_size = 0;
8763 }
8764 else
8765 {
8766 frame->args_size = crtl->outgoing_args_size;
8767 frame->cprestore_size = MIPS_GP_SAVE_AREA_SIZE;
8768 }
8769 offset = frame->args_size + frame->cprestore_size;
8770
8771 /* Move above the local variables. */
8772 frame->var_size = MIPS_STACK_ALIGN (size);
8773 offset += frame->var_size;
8774
8775 /* Find out which GPRs we need to save. */
8776 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
8777 if (mips_save_reg_p (regno))
8778 {
8779 frame->num_gp++;
8780 frame->mask |= 1 << (regno - GP_REG_FIRST);
8781 }
8782
8783 /* If this function calls eh_return, we must also save and restore the
8784 EH data registers. */
8785 if (crtl->calls_eh_return)
8786 for (i = 0; EH_RETURN_DATA_REGNO (i) != INVALID_REGNUM; i++)
8787 {
8788 frame->num_gp++;
8789 frame->mask |= 1 << (EH_RETURN_DATA_REGNO (i) - GP_REG_FIRST);
8790 }
8791
8792 /* The MIPS16e SAVE and RESTORE instructions have two ranges of registers:
8793 $a3-$a0 and $s2-$s8. If we save one register in the range, we must
8794 save all later registers too. */
8795 if (GENERATE_MIPS16E_SAVE_RESTORE)
8796 {
8797 mips16e_mask_registers (&frame->mask, mips16e_s2_s8_regs,
8798 ARRAY_SIZE (mips16e_s2_s8_regs), &frame->num_gp);
8799 mips16e_mask_registers (&frame->mask, mips16e_a0_a3_regs,
8800 ARRAY_SIZE (mips16e_a0_a3_regs), &frame->num_gp);
8801 }
8802
8803 /* Move above the GPR save area. */
8804 if (frame->num_gp > 0)
8805 {
8806 offset += MIPS_STACK_ALIGN (frame->num_gp * UNITS_PER_WORD);
8807 frame->gp_sp_offset = offset - UNITS_PER_WORD;
8808 }
8809
8810 /* Find out which FPRs we need to save. This loop must iterate over
8811 the same space as its companion in mips_for_each_saved_gpr_and_fpr. */
8812 if (TARGET_HARD_FLOAT)
8813 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno += MAX_FPRS_PER_FMT)
8814 if (mips_save_reg_p (regno))
8815 {
8816 frame->num_fp += MAX_FPRS_PER_FMT;
8817 frame->fmask |= ~(~0 << MAX_FPRS_PER_FMT) << (regno - FP_REG_FIRST);
8818 }
8819
8820 /* Move above the FPR save area. */
8821 if (frame->num_fp > 0)
8822 {
8823 offset += MIPS_STACK_ALIGN (frame->num_fp * UNITS_PER_FPREG);
8824 frame->fp_sp_offset = offset - UNITS_PER_HWFPVALUE;
8825 }
8826
8827 /* Add in space for the interrupt context information. */
8828 if (cfun->machine->interrupt_handler_p)
8829 {
8830 /* Check HI/LO. */
8831 if (mips_save_reg_p (LO_REGNUM) || mips_save_reg_p (HI_REGNUM))
8832 {
8833 frame->num_acc++;
8834 frame->acc_mask |= (1 << 0);
8835 }
8836
8837 /* Check accumulators 1, 2, 3. */
8838 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
8839 if (mips_save_reg_p (i) || mips_save_reg_p (i + 1))
8840 {
8841 frame->num_acc++;
8842 frame->acc_mask |= 1 << (((i - DSP_ACC_REG_FIRST) / 2) + 1);
8843 }
8844
8845 /* All interrupt context functions need space to preserve STATUS. */
8846 frame->num_cop0_regs++;
8847
8848 /* If we don't keep interrupts masked, we need to save EPC. */
8849 if (!cfun->machine->keep_interrupts_masked_p)
8850 frame->num_cop0_regs++;
8851 }
8852
8853 /* Move above the accumulator save area. */
8854 if (frame->num_acc > 0)
8855 {
8856 /* Each accumulator needs 2 words. */
8857 offset += frame->num_acc * 2 * UNITS_PER_WORD;
8858 frame->acc_sp_offset = offset - UNITS_PER_WORD;
8859 }
8860
8861 /* Move above the COP0 register save area. */
8862 if (frame->num_cop0_regs > 0)
8863 {
8864 offset += frame->num_cop0_regs * UNITS_PER_WORD;
8865 frame->cop0_sp_offset = offset - UNITS_PER_WORD;
8866 }
8867
8868 /* Move above the callee-allocated varargs save area. */
8869 offset += MIPS_STACK_ALIGN (cfun->machine->varargs_size);
8870 frame->arg_pointer_offset = offset;
8871
8872 /* Move above the callee-allocated area for pretend stack arguments. */
8873 offset += crtl->args.pretend_args_size;
8874 frame->total_size = offset;
8875
8876 /* Work out the offsets of the save areas from the top of the frame. */
8877 if (frame->gp_sp_offset > 0)
8878 frame->gp_save_offset = frame->gp_sp_offset - offset;
8879 if (frame->fp_sp_offset > 0)
8880 frame->fp_save_offset = frame->fp_sp_offset - offset;
8881 if (frame->acc_sp_offset > 0)
8882 frame->acc_save_offset = frame->acc_sp_offset - offset;
8883 if (frame->num_cop0_regs > 0)
8884 frame->cop0_save_offset = frame->cop0_sp_offset - offset;
8885
8886 /* MIPS16 code offsets the frame pointer by the size of the outgoing
8887 arguments. This tends to increase the chances of using unextended
8888 instructions for local variables and incoming arguments. */
8889 if (TARGET_MIPS16)
8890 frame->hard_frame_pointer_offset = frame->args_size;
8891 }
8892
8893 /* Return the style of GP load sequence that is being used for the
8894 current function. */
8895
8896 enum mips_loadgp_style
8897 mips_current_loadgp_style (void)
8898 {
8899 if (!TARGET_USE_GOT || cfun->machine->global_pointer == INVALID_REGNUM)
8900 return LOADGP_NONE;
8901
8902 if (TARGET_RTP_PIC)
8903 return LOADGP_RTP;
8904
8905 if (TARGET_ABSOLUTE_ABICALLS)
8906 return LOADGP_ABSOLUTE;
8907
8908 return TARGET_NEWABI ? LOADGP_NEWABI : LOADGP_OLDABI;
8909 }
8910
8911 /* Implement FRAME_POINTER_REQUIRED. */
8912
8913 bool
8914 mips_frame_pointer_required (void)
8915 {
8916 /* If the function contains dynamic stack allocations, we need to
8917 use the frame pointer to access the static parts of the frame. */
8918 if (cfun->calls_alloca)
8919 return true;
8920
8921 /* In MIPS16 mode, we need a frame pointer for a large frame; otherwise,
8922 reload may be unable to compute the address of a local variable,
8923 since there is no way to add a large constant to the stack pointer
8924 without using a second temporary register. */
8925 if (TARGET_MIPS16)
8926 {
8927 mips_compute_frame_info ();
8928 if (!SMALL_OPERAND (cfun->machine->frame.total_size))
8929 return true;
8930 }
8931
8932 return false;
8933 }
8934
8935 /* Implement INITIAL_ELIMINATION_OFFSET. FROM is either the frame pointer
8936 or argument pointer. TO is either the stack pointer or hard frame
8937 pointer. */
8938
8939 HOST_WIDE_INT
8940 mips_initial_elimination_offset (int from, int to)
8941 {
8942 HOST_WIDE_INT offset;
8943
8944 mips_compute_frame_info ();
8945
8946 /* Set OFFSET to the offset from the end-of-prologue stack pointer. */
8947 switch (from)
8948 {
8949 case FRAME_POINTER_REGNUM:
8950 if (FRAME_GROWS_DOWNWARD)
8951 offset = (cfun->machine->frame.args_size
8952 + cfun->machine->frame.cprestore_size
8953 + cfun->machine->frame.var_size);
8954 else
8955 offset = 0;
8956 break;
8957
8958 case ARG_POINTER_REGNUM:
8959 offset = cfun->machine->frame.arg_pointer_offset;
8960 break;
8961
8962 default:
8963 gcc_unreachable ();
8964 }
8965
8966 if (to == HARD_FRAME_POINTER_REGNUM)
8967 offset -= cfun->machine->frame.hard_frame_pointer_offset;
8968
8969 return offset;
8970 }
8971 \f
8972 /* Implement TARGET_EXTRA_LIVE_ON_ENTRY. */
8973
8974 static void
8975 mips_extra_live_on_entry (bitmap regs)
8976 {
8977 if (TARGET_USE_GOT)
8978 {
8979 /* PIC_FUNCTION_ADDR_REGNUM is live if we need it to set up
8980 the global pointer. */
8981 if (!TARGET_ABSOLUTE_ABICALLS)
8982 bitmap_set_bit (regs, PIC_FUNCTION_ADDR_REGNUM);
8983
8984 /* The prologue may set MIPS16_PIC_TEMP_REGNUM to the value of
8985 the global pointer. */
8986 if (TARGET_MIPS16)
8987 bitmap_set_bit (regs, MIPS16_PIC_TEMP_REGNUM);
8988
8989 /* See the comment above load_call<mode> for details. */
8990 bitmap_set_bit (regs, GOT_VERSION_REGNUM);
8991 }
8992 }
8993
8994 /* Implement RETURN_ADDR_RTX. We do not support moving back to a
8995 previous frame. */
8996
8997 rtx
8998 mips_return_addr (int count, rtx frame ATTRIBUTE_UNUSED)
8999 {
9000 if (count != 0)
9001 return const0_rtx;
9002
9003 return get_hard_reg_initial_val (Pmode, GP_REG_FIRST + 31);
9004 }
9005
9006 /* Emit code to change the current function's return address to
9007 ADDRESS. SCRATCH is available as a scratch register, if needed.
9008 ADDRESS and SCRATCH are both word-mode GPRs. */
9009
9010 void
9011 mips_set_return_address (rtx address, rtx scratch)
9012 {
9013 rtx slot_address;
9014
9015 gcc_assert (BITSET_P (cfun->machine->frame.mask, 31));
9016 slot_address = mips_add_offset (scratch, stack_pointer_rtx,
9017 cfun->machine->frame.gp_sp_offset);
9018 mips_emit_move (gen_frame_mem (GET_MODE (address), slot_address), address);
9019 }
9020
9021 /* Return a MEM rtx for the cprestore slot, using TEMP as a temporary base
9022 register if need be. */
9023
9024 static rtx
9025 mips_cprestore_slot (rtx temp)
9026 {
9027 const struct mips_frame_info *frame;
9028 rtx base;
9029 HOST_WIDE_INT offset;
9030
9031 frame = &cfun->machine->frame;
9032 if (frame_pointer_needed)
9033 {
9034 base = hard_frame_pointer_rtx;
9035 offset = frame->args_size - frame->hard_frame_pointer_offset;
9036 }
9037 else
9038 {
9039 base = stack_pointer_rtx;
9040 offset = frame->args_size;
9041 }
9042 return gen_frame_mem (Pmode, mips_add_offset (temp, base, offset));
9043 }
9044
9045 /* Restore $gp from its save slot, using TEMP as a temporary base register
9046 if need be. This function is for o32 and o64 abicalls only. */
9047
9048 void
9049 mips_restore_gp (rtx temp)
9050 {
9051 gcc_assert (TARGET_ABICALLS && TARGET_OLDABI);
9052
9053 if (cfun->machine->global_pointer == INVALID_REGNUM)
9054 return;
9055
9056 if (TARGET_MIPS16)
9057 {
9058 mips_emit_move (temp, mips_cprestore_slot (temp));
9059 mips_emit_move (pic_offset_table_rtx, temp);
9060 }
9061 else
9062 mips_emit_move (pic_offset_table_rtx, mips_cprestore_slot (temp));
9063 if (!TARGET_EXPLICIT_RELOCS)
9064 emit_insn (gen_blockage ());
9065 }
9066 \f
9067 /* A function to save or store a register. The first argument is the
9068 register and the second is the stack slot. */
9069 typedef void (*mips_save_restore_fn) (rtx, rtx);
9070
9071 /* Use FN to save or restore register REGNO. MODE is the register's
9072 mode and OFFSET is the offset of its save slot from the current
9073 stack pointer. */
9074
9075 static void
9076 mips_save_restore_reg (enum machine_mode mode, int regno,
9077 HOST_WIDE_INT offset, mips_save_restore_fn fn)
9078 {
9079 rtx mem;
9080
9081 mem = gen_frame_mem (mode, plus_constant (stack_pointer_rtx, offset));
9082 fn (gen_rtx_REG (mode, regno), mem);
9083 }
9084
9085 /* Call FN for each accumlator that is saved by the current function.
9086 SP_OFFSET is the offset of the current stack pointer from the start
9087 of the frame. */
9088
9089 static void
9090 mips_for_each_saved_acc (HOST_WIDE_INT sp_offset, mips_save_restore_fn fn)
9091 {
9092 HOST_WIDE_INT offset;
9093 int regno;
9094
9095 offset = cfun->machine->frame.acc_sp_offset - sp_offset;
9096 if (BITSET_P (cfun->machine->frame.acc_mask, 0))
9097 {
9098 mips_save_restore_reg (word_mode, LO_REGNUM, offset, fn);
9099 offset -= UNITS_PER_WORD;
9100 mips_save_restore_reg (word_mode, HI_REGNUM, offset, fn);
9101 offset -= UNITS_PER_WORD;
9102 }
9103
9104 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++)
9105 if (BITSET_P (cfun->machine->frame.acc_mask,
9106 ((regno - DSP_ACC_REG_FIRST) / 2) + 1))
9107 {
9108 mips_save_restore_reg (word_mode, regno, offset, fn);
9109 offset -= UNITS_PER_WORD;
9110 }
9111 }
9112
9113 /* Call FN for each register that is saved by the current function.
9114 SP_OFFSET is the offset of the current stack pointer from the start
9115 of the frame. */
9116
9117 static void
9118 mips_for_each_saved_gpr_and_fpr (HOST_WIDE_INT sp_offset,
9119 mips_save_restore_fn fn)
9120 {
9121 enum machine_mode fpr_mode;
9122 HOST_WIDE_INT offset;
9123 int regno;
9124
9125 /* Save registers starting from high to low. The debuggers prefer at least
9126 the return register be stored at func+4, and also it allows us not to
9127 need a nop in the epilogue if at least one register is reloaded in
9128 addition to return address. */
9129 offset = cfun->machine->frame.gp_sp_offset - sp_offset;
9130 for (regno = GP_REG_LAST; regno >= GP_REG_FIRST; regno--)
9131 if (BITSET_P (cfun->machine->frame.mask, regno - GP_REG_FIRST))
9132 {
9133 mips_save_restore_reg (word_mode, regno, offset, fn);
9134 offset -= UNITS_PER_WORD;
9135 }
9136
9137 /* This loop must iterate over the same space as its companion in
9138 mips_compute_frame_info. */
9139 offset = cfun->machine->frame.fp_sp_offset - sp_offset;
9140 fpr_mode = (TARGET_SINGLE_FLOAT ? SFmode : DFmode);
9141 for (regno = FP_REG_LAST - MAX_FPRS_PER_FMT + 1;
9142 regno >= FP_REG_FIRST;
9143 regno -= MAX_FPRS_PER_FMT)
9144 if (BITSET_P (cfun->machine->frame.fmask, regno - FP_REG_FIRST))
9145 {
9146 mips_save_restore_reg (fpr_mode, regno, offset, fn);
9147 offset -= GET_MODE_SIZE (fpr_mode);
9148 }
9149 }
9150 \f
9151 /* If we're generating n32 or n64 abicalls, and the current function
9152 does not use $28 as its global pointer, emit a cplocal directive.
9153 Use pic_offset_table_rtx as the argument to the directive. */
9154
9155 static void
9156 mips_output_cplocal (void)
9157 {
9158 if (!TARGET_EXPLICIT_RELOCS
9159 && cfun->machine->global_pointer != INVALID_REGNUM
9160 && cfun->machine->global_pointer != GLOBAL_POINTER_REGNUM)
9161 output_asm_insn (".cplocal %+", 0);
9162 }
9163
9164 /* Implement TARGET_OUTPUT_FUNCTION_PROLOGUE. */
9165
9166 static void
9167 mips_output_function_prologue (FILE *file, HOST_WIDE_INT size ATTRIBUTE_UNUSED)
9168 {
9169 const char *fnname;
9170
9171 #ifdef SDB_DEBUGGING_INFO
9172 if (debug_info_level != DINFO_LEVEL_TERSE && write_symbols == SDB_DEBUG)
9173 SDB_OUTPUT_SOURCE_LINE (file, DECL_SOURCE_LINE (current_function_decl));
9174 #endif
9175
9176 /* In MIPS16 mode, we may need to generate a non-MIPS16 stub to handle
9177 floating-point arguments. */
9178 if (TARGET_MIPS16
9179 && TARGET_HARD_FLOAT_ABI
9180 && crtl->args.info.fp_code != 0)
9181 mips16_build_function_stub ();
9182
9183 /* Get the function name the same way that toplev.c does before calling
9184 assemble_start_function. This is needed so that the name used here
9185 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
9186 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
9187 mips_start_function_definition (fnname, TARGET_MIPS16);
9188
9189 /* Stop mips_file_end from treating this function as external. */
9190 if (TARGET_IRIX && mips_abi == ABI_32)
9191 TREE_ASM_WRITTEN (DECL_NAME (cfun->decl)) = 1;
9192
9193 /* Output MIPS-specific frame information. */
9194 if (!flag_inhibit_size_directive)
9195 {
9196 const struct mips_frame_info *frame;
9197
9198 frame = &cfun->machine->frame;
9199
9200 /* .frame FRAMEREG, FRAMESIZE, RETREG. */
9201 fprintf (file,
9202 "\t.frame\t%s," HOST_WIDE_INT_PRINT_DEC ",%s\t\t"
9203 "# vars= " HOST_WIDE_INT_PRINT_DEC
9204 ", regs= %d/%d"
9205 ", args= " HOST_WIDE_INT_PRINT_DEC
9206 ", gp= " HOST_WIDE_INT_PRINT_DEC "\n",
9207 reg_names[frame_pointer_needed
9208 ? HARD_FRAME_POINTER_REGNUM
9209 : STACK_POINTER_REGNUM],
9210 (frame_pointer_needed
9211 ? frame->total_size - frame->hard_frame_pointer_offset
9212 : frame->total_size),
9213 reg_names[GP_REG_FIRST + 31],
9214 frame->var_size,
9215 frame->num_gp, frame->num_fp,
9216 frame->args_size,
9217 frame->cprestore_size);
9218
9219 /* .mask MASK, OFFSET. */
9220 fprintf (file, "\t.mask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
9221 frame->mask, frame->gp_save_offset);
9222
9223 /* .fmask MASK, OFFSET. */
9224 fprintf (file, "\t.fmask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
9225 frame->fmask, frame->fp_save_offset);
9226 }
9227
9228 /* Handle the initialization of $gp for SVR4 PIC, if applicable.
9229 Also emit the ".set noreorder; .set nomacro" sequence for functions
9230 that need it. */
9231 if (mips_current_loadgp_style () == LOADGP_OLDABI)
9232 {
9233 if (TARGET_MIPS16)
9234 {
9235 /* This is a fixed-form sequence. The position of the
9236 first two instructions is important because of the
9237 way _gp_disp is defined. */
9238 output_asm_insn ("li\t$2,%%hi(_gp_disp)", 0);
9239 output_asm_insn ("addiu\t$3,$pc,%%lo(_gp_disp)", 0);
9240 output_asm_insn ("sll\t$2,16", 0);
9241 output_asm_insn ("addu\t$2,$3", 0);
9242 }
9243 /* .cpload must be in a .set noreorder but not a .set nomacro block. */
9244 else if (!cfun->machine->all_noreorder_p)
9245 output_asm_insn ("%(.cpload\t%^%)", 0);
9246 else
9247 output_asm_insn ("%(.cpload\t%^\n\t%<", 0);
9248 }
9249 else if (cfun->machine->all_noreorder_p)
9250 output_asm_insn ("%(%<", 0);
9251
9252 /* Tell the assembler which register we're using as the global
9253 pointer. This is needed for thunks, since they can use either
9254 explicit relocs or assembler macros. */
9255 mips_output_cplocal ();
9256 }
9257
9258 /* Implement TARGET_OUTPUT_FUNCTION_EPILOGUE. */
9259
9260 static void
9261 mips_output_function_epilogue (FILE *file ATTRIBUTE_UNUSED,
9262 HOST_WIDE_INT size ATTRIBUTE_UNUSED)
9263 {
9264 const char *fnname;
9265
9266 /* Reinstate the normal $gp. */
9267 SET_REGNO (pic_offset_table_rtx, GLOBAL_POINTER_REGNUM);
9268 mips_output_cplocal ();
9269
9270 if (cfun->machine->all_noreorder_p)
9271 {
9272 /* Avoid using %>%) since it adds excess whitespace. */
9273 output_asm_insn (".set\tmacro", 0);
9274 output_asm_insn (".set\treorder", 0);
9275 set_noreorder = set_nomacro = 0;
9276 }
9277
9278 /* Get the function name the same way that toplev.c does before calling
9279 assemble_start_function. This is needed so that the name used here
9280 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
9281 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
9282 mips_end_function_definition (fnname);
9283 }
9284 \f
9285 /* Save register REG to MEM. Make the instruction frame-related. */
9286
9287 static void
9288 mips_save_reg (rtx reg, rtx mem)
9289 {
9290 if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64)
9291 {
9292 rtx x1, x2;
9293
9294 if (mips_split_64bit_move_p (mem, reg))
9295 mips_split_doubleword_move (mem, reg);
9296 else
9297 mips_emit_move (mem, reg);
9298
9299 x1 = mips_frame_set (mips_subword (mem, false),
9300 mips_subword (reg, false));
9301 x2 = mips_frame_set (mips_subword (mem, true),
9302 mips_subword (reg, true));
9303 mips_set_frame_expr (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, x1, x2)));
9304 }
9305 else
9306 {
9307 if (REGNO (reg) == HI_REGNUM)
9308 {
9309 if (TARGET_64BIT)
9310 emit_insn (gen_mfhidi_ti (MIPS_PROLOGUE_TEMP (DImode),
9311 gen_rtx_REG (TImode, MD_REG_FIRST)));
9312 else
9313 emit_insn (gen_mfhisi_di (MIPS_PROLOGUE_TEMP (SImode),
9314 gen_rtx_REG (DImode, MD_REG_FIRST)));
9315 mips_emit_move (mem, MIPS_PROLOGUE_TEMP (GET_MODE (reg)));
9316 }
9317 else if ((TARGET_MIPS16
9318 && REGNO (reg) != GP_REG_FIRST + 31
9319 && !M16_REG_P (REGNO (reg)))
9320 || ACC_REG_P (REGNO (reg)))
9321 {
9322 /* If the register has no direct store instruction, move it
9323 through a temporary. Note that there's a special MIPS16
9324 instruction to save $31. */
9325 mips_emit_move (MIPS_PROLOGUE_TEMP (GET_MODE (reg)), reg);
9326 mips_emit_move (mem, MIPS_PROLOGUE_TEMP (GET_MODE (reg)));
9327 }
9328 else
9329 mips_emit_move (mem, reg);
9330
9331 mips_set_frame_expr (mips_frame_set (mem, reg));
9332 }
9333 }
9334
9335 /* The __gnu_local_gp symbol. */
9336
9337 static GTY(()) rtx mips_gnu_local_gp;
9338
9339 /* If we're generating n32 or n64 abicalls, emit instructions
9340 to set up the global pointer. */
9341
9342 static void
9343 mips_emit_loadgp (void)
9344 {
9345 rtx addr, offset, incoming_address, base, index, pic_reg;
9346
9347 pic_reg = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx;
9348 switch (mips_current_loadgp_style ())
9349 {
9350 case LOADGP_ABSOLUTE:
9351 if (mips_gnu_local_gp == NULL)
9352 {
9353 mips_gnu_local_gp = gen_rtx_SYMBOL_REF (Pmode, "__gnu_local_gp");
9354 SYMBOL_REF_FLAGS (mips_gnu_local_gp) |= SYMBOL_FLAG_LOCAL;
9355 }
9356 emit_insn (Pmode == SImode
9357 ? gen_loadgp_absolute_si (pic_reg, mips_gnu_local_gp)
9358 : gen_loadgp_absolute_di (pic_reg, mips_gnu_local_gp));
9359 break;
9360
9361 case LOADGP_OLDABI:
9362 /* Added by mips_output_function_prologue. */
9363 break;
9364
9365 case LOADGP_NEWABI:
9366 addr = XEXP (DECL_RTL (current_function_decl), 0);
9367 offset = mips_unspec_address (addr, SYMBOL_GOTOFF_LOADGP);
9368 incoming_address = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
9369 emit_insn (Pmode == SImode
9370 ? gen_loadgp_newabi_si (pic_reg, offset, incoming_address)
9371 : gen_loadgp_newabi_di (pic_reg, offset, incoming_address));
9372 break;
9373
9374 case LOADGP_RTP:
9375 base = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_BASE));
9376 index = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_INDEX));
9377 emit_insn (Pmode == SImode
9378 ? gen_loadgp_rtp_si (pic_reg, base, index)
9379 : gen_loadgp_rtp_di (pic_reg, base, index));
9380 break;
9381
9382 default:
9383 return;
9384 }
9385
9386 if (TARGET_MIPS16)
9387 emit_insn (gen_copygp_mips16 (pic_offset_table_rtx, pic_reg));
9388
9389 /* Emit a blockage if there are implicit uses of the GP register.
9390 This includes profiled functions, because FUNCTION_PROFILE uses
9391 a jal macro. */
9392 if (!TARGET_EXPLICIT_RELOCS || crtl->profile)
9393 emit_insn (gen_loadgp_blockage ());
9394 }
9395
9396 /* A for_each_rtx callback. Stop the search if *X is a kernel register. */
9397
9398 static int
9399 mips_kernel_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
9400 {
9401 return GET_CODE (*x) == REG && KERNEL_REG_P (REGNO (*x));
9402 }
9403
9404 /* Expand the "prologue" pattern. */
9405
9406 void
9407 mips_expand_prologue (void)
9408 {
9409 const struct mips_frame_info *frame;
9410 HOST_WIDE_INT size;
9411 unsigned int nargs;
9412 rtx insn;
9413
9414 if (cfun->machine->global_pointer != INVALID_REGNUM)
9415 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
9416
9417 frame = &cfun->machine->frame;
9418 size = frame->total_size;
9419
9420 /* Save the registers. Allocate up to MIPS_MAX_FIRST_STACK_STEP
9421 bytes beforehand; this is enough to cover the register save area
9422 without going out of range. */
9423 if (((frame->mask | frame->fmask | frame->acc_mask) != 0)
9424 || frame->num_cop0_regs > 0)
9425 {
9426 HOST_WIDE_INT step1;
9427
9428 step1 = MIN (size, MIPS_MAX_FIRST_STACK_STEP);
9429 if (GENERATE_MIPS16E_SAVE_RESTORE)
9430 {
9431 HOST_WIDE_INT offset;
9432 unsigned int mask, regno;
9433
9434 /* Try to merge argument stores into the save instruction. */
9435 nargs = mips16e_collect_argument_saves ();
9436
9437 /* Build the save instruction. */
9438 mask = frame->mask;
9439 insn = mips16e_build_save_restore (false, &mask, &offset,
9440 nargs, step1);
9441 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
9442 size -= step1;
9443
9444 /* Check if we need to save other registers. */
9445 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
9446 if (BITSET_P (mask, regno - GP_REG_FIRST))
9447 {
9448 offset -= UNITS_PER_WORD;
9449 mips_save_restore_reg (word_mode, regno,
9450 offset, mips_save_reg);
9451 }
9452 }
9453 else
9454 {
9455 if (cfun->machine->interrupt_handler_p)
9456 {
9457 HOST_WIDE_INT offset;
9458 rtx mem;
9459
9460 /* If this interrupt is using a shadow register set, we need to
9461 get the stack pointer from the previous register set. */
9462 if (cfun->machine->use_shadow_register_set_p)
9463 emit_insn (gen_mips_rdpgpr (stack_pointer_rtx,
9464 stack_pointer_rtx));
9465
9466 if (!cfun->machine->keep_interrupts_masked_p)
9467 {
9468 /* Move from COP0 Cause to K0. */
9469 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K0_REG_NUM),
9470 gen_rtx_REG (SImode,
9471 COP0_CAUSE_REG_NUM)));
9472 /* Move from COP0 EPC to K1. */
9473 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
9474 gen_rtx_REG (SImode,
9475 COP0_EPC_REG_NUM)));
9476 }
9477
9478 /* Allocate the first part of the frame. */
9479 insn = gen_add3_insn (stack_pointer_rtx, stack_pointer_rtx,
9480 GEN_INT (-step1));
9481 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
9482 size -= step1;
9483
9484 /* Start at the uppermost location for saving. */
9485 offset = frame->cop0_sp_offset - size;
9486 if (!cfun->machine->keep_interrupts_masked_p)
9487 {
9488 /* Push EPC into its stack slot. */
9489 mem = gen_frame_mem (word_mode,
9490 plus_constant (stack_pointer_rtx,
9491 offset));
9492 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
9493 offset -= UNITS_PER_WORD;
9494 }
9495
9496 /* Move from COP0 Status to K1. */
9497 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
9498 gen_rtx_REG (SImode,
9499 COP0_STATUS_REG_NUM)));
9500
9501 /* Right justify the RIPL in k0. */
9502 if (!cfun->machine->keep_interrupts_masked_p)
9503 emit_insn (gen_lshrsi3 (gen_rtx_REG (SImode, K0_REG_NUM),
9504 gen_rtx_REG (SImode, K0_REG_NUM),
9505 GEN_INT (CAUSE_IPL)));
9506
9507 /* Push Status into its stack slot. */
9508 mem = gen_frame_mem (word_mode,
9509 plus_constant (stack_pointer_rtx, offset));
9510 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
9511 offset -= UNITS_PER_WORD;
9512
9513 /* Insert the RIPL into our copy of SR (k1) as the new IPL. */
9514 if (!cfun->machine->keep_interrupts_masked_p)
9515 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
9516 GEN_INT (6),
9517 GEN_INT (SR_IPL),
9518 gen_rtx_REG (SImode, K0_REG_NUM)));
9519
9520 if (!cfun->machine->keep_interrupts_masked_p)
9521 /* Enable interrupts by clearing the KSU ERL and EXL bits.
9522 IE is already the correct value, so we don't have to do
9523 anything explicit. */
9524 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
9525 GEN_INT (4),
9526 GEN_INT (SR_EXL),
9527 gen_rtx_REG (SImode, GP_REG_FIRST)));
9528 else
9529 /* Disable interrupts by clearing the KSU, ERL, EXL,
9530 and IE bits. */
9531 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
9532 GEN_INT (5),
9533 GEN_INT (SR_IE),
9534 gen_rtx_REG (SImode, GP_REG_FIRST)));
9535 }
9536 else
9537 {
9538 insn = gen_add3_insn (stack_pointer_rtx,
9539 stack_pointer_rtx,
9540 GEN_INT (-step1));
9541 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
9542 size -= step1;
9543 }
9544 mips_for_each_saved_acc (size, mips_save_reg);
9545 mips_for_each_saved_gpr_and_fpr (size, mips_save_reg);
9546 }
9547 }
9548
9549 /* Allocate the rest of the frame. */
9550 if (size > 0)
9551 {
9552 if (SMALL_OPERAND (-size))
9553 RTX_FRAME_RELATED_P (emit_insn (gen_add3_insn (stack_pointer_rtx,
9554 stack_pointer_rtx,
9555 GEN_INT (-size)))) = 1;
9556 else
9557 {
9558 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (size));
9559 if (TARGET_MIPS16)
9560 {
9561 /* There are no instructions to add or subtract registers
9562 from the stack pointer, so use the frame pointer as a
9563 temporary. We should always be using a frame pointer
9564 in this case anyway. */
9565 gcc_assert (frame_pointer_needed);
9566 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
9567 emit_insn (gen_sub3_insn (hard_frame_pointer_rtx,
9568 hard_frame_pointer_rtx,
9569 MIPS_PROLOGUE_TEMP (Pmode)));
9570 mips_emit_move (stack_pointer_rtx, hard_frame_pointer_rtx);
9571 }
9572 else
9573 emit_insn (gen_sub3_insn (stack_pointer_rtx,
9574 stack_pointer_rtx,
9575 MIPS_PROLOGUE_TEMP (Pmode)));
9576
9577 /* Describe the combined effect of the previous instructions. */
9578 mips_set_frame_expr
9579 (gen_rtx_SET (VOIDmode, stack_pointer_rtx,
9580 plus_constant (stack_pointer_rtx, -size)));
9581 }
9582 }
9583
9584 /* Set up the frame pointer, if we're using one. */
9585 if (frame_pointer_needed)
9586 {
9587 HOST_WIDE_INT offset;
9588
9589 offset = frame->hard_frame_pointer_offset;
9590 if (offset == 0)
9591 {
9592 insn = mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
9593 RTX_FRAME_RELATED_P (insn) = 1;
9594 }
9595 else if (SMALL_OPERAND (offset))
9596 {
9597 insn = gen_add3_insn (hard_frame_pointer_rtx,
9598 stack_pointer_rtx, GEN_INT (offset));
9599 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
9600 }
9601 else
9602 {
9603 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (offset));
9604 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
9605 emit_insn (gen_add3_insn (hard_frame_pointer_rtx,
9606 hard_frame_pointer_rtx,
9607 MIPS_PROLOGUE_TEMP (Pmode)));
9608 mips_set_frame_expr
9609 (gen_rtx_SET (VOIDmode, hard_frame_pointer_rtx,
9610 plus_constant (stack_pointer_rtx, offset)));
9611 }
9612 }
9613
9614 mips_emit_loadgp ();
9615
9616 /* Initialize the $gp save slot. */
9617 if (frame->cprestore_size > 0
9618 && cfun->machine->global_pointer != INVALID_REGNUM)
9619 {
9620 if (TARGET_MIPS16)
9621 mips_emit_move (mips_cprestore_slot (MIPS_PROLOGUE_TEMP (Pmode)),
9622 MIPS16_PIC_TEMP);
9623 else if (TARGET_ABICALLS_PIC2)
9624 emit_insn (gen_cprestore (GEN_INT (frame->args_size)));
9625 else
9626 emit_move_insn (mips_cprestore_slot (MIPS_PROLOGUE_TEMP (Pmode)),
9627 pic_offset_table_rtx);
9628 }
9629
9630 /* We need to search back to the last use of K0 or K1. */
9631 if (cfun->machine->interrupt_handler_p)
9632 {
9633 for (insn = get_last_insn (); insn != NULL_RTX; insn = PREV_INSN (insn))
9634 if (INSN_P (insn)
9635 && for_each_rtx (&PATTERN (insn), mips_kernel_reg_p, NULL))
9636 break;
9637 /* Emit a move from K1 to COP0 Status after insn. */
9638 gcc_assert (insn != NULL_RTX);
9639 emit_insn_after (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
9640 gen_rtx_REG (SImode, K1_REG_NUM)),
9641 insn);
9642 }
9643
9644 /* If we are profiling, make sure no instructions are scheduled before
9645 the call to mcount. */
9646 if (crtl->profile)
9647 emit_insn (gen_blockage ());
9648 }
9649 \f
9650 /* Emit instructions to restore register REG from slot MEM. */
9651
9652 static void
9653 mips_restore_reg (rtx reg, rtx mem)
9654 {
9655 /* There's no MIPS16 instruction to load $31 directly. Load into
9656 $7 instead and adjust the return insn appropriately. */
9657 if (TARGET_MIPS16 && REGNO (reg) == GP_REG_FIRST + 31)
9658 reg = gen_rtx_REG (GET_MODE (reg), GP_REG_FIRST + 7);
9659
9660 if (REGNO (reg) == HI_REGNUM)
9661 {
9662 mips_emit_move (MIPS_EPILOGUE_TEMP (GET_MODE (reg)), mem);
9663 if (TARGET_64BIT)
9664 emit_insn (gen_mthisi_di (gen_rtx_REG (TImode, MD_REG_FIRST),
9665 MIPS_EPILOGUE_TEMP (DImode),
9666 gen_rtx_REG (DImode, LO_REGNUM)));
9667 else
9668 emit_insn (gen_mthisi_di (gen_rtx_REG (DImode, MD_REG_FIRST),
9669 MIPS_EPILOGUE_TEMP (SImode),
9670 gen_rtx_REG (SImode, LO_REGNUM)));
9671 }
9672 else if ((TARGET_MIPS16 && !M16_REG_P (REGNO (reg)))
9673 || ACC_REG_P (REGNO (reg)))
9674 {
9675 /* Can't restore directly; move through a temporary. */
9676 mips_emit_move (MIPS_EPILOGUE_TEMP (GET_MODE (reg)), mem);
9677 mips_emit_move (reg, MIPS_EPILOGUE_TEMP (GET_MODE (reg)));
9678 }
9679 else
9680 mips_emit_move (reg, mem);
9681 }
9682
9683 /* Emit any instructions needed before a return. */
9684
9685 void
9686 mips_expand_before_return (void)
9687 {
9688 /* When using a call-clobbered gp, we start out with unified call
9689 insns that include instructions to restore the gp. We then split
9690 these unified calls after reload. These split calls explicitly
9691 clobber gp, so there is no need to define
9692 PIC_OFFSET_TABLE_REG_CALL_CLOBBERED.
9693
9694 For consistency, we should also insert an explicit clobber of $28
9695 before return insns, so that the post-reload optimizers know that
9696 the register is not live on exit. */
9697 if (TARGET_CALL_CLOBBERED_GP)
9698 emit_clobber (pic_offset_table_rtx);
9699 }
9700
9701 /* Expand an "epilogue" or "sibcall_epilogue" pattern; SIBCALL_P
9702 says which. */
9703
9704 void
9705 mips_expand_epilogue (bool sibcall_p)
9706 {
9707 const struct mips_frame_info *frame;
9708 HOST_WIDE_INT step1, step2;
9709 rtx base, target, insn;
9710
9711 if (!sibcall_p && mips_can_use_return_insn ())
9712 {
9713 emit_jump_insn (gen_return ());
9714 return;
9715 }
9716
9717 /* In MIPS16 mode, if the return value should go into a floating-point
9718 register, we need to call a helper routine to copy it over. */
9719 if (mips16_cfun_returns_in_fpr_p ())
9720 mips16_copy_fpr_return_value ();
9721
9722 /* Split the frame into two. STEP1 is the amount of stack we should
9723 deallocate before restoring the registers. STEP2 is the amount we
9724 should deallocate afterwards.
9725
9726 Start off by assuming that no registers need to be restored. */
9727 frame = &cfun->machine->frame;
9728 step1 = frame->total_size;
9729 step2 = 0;
9730
9731 /* Work out which register holds the frame address. */
9732 if (!frame_pointer_needed)
9733 base = stack_pointer_rtx;
9734 else
9735 {
9736 base = hard_frame_pointer_rtx;
9737 step1 -= frame->hard_frame_pointer_offset;
9738 }
9739
9740 /* If we need to restore registers, deallocate as much stack as
9741 possible in the second step without going out of range. */
9742 if ((frame->mask | frame->fmask | frame->acc_mask) != 0
9743 || frame->num_cop0_regs > 0)
9744 {
9745 step2 = MIN (step1, MIPS_MAX_FIRST_STACK_STEP);
9746 step1 -= step2;
9747 }
9748
9749 /* Set TARGET to BASE + STEP1. */
9750 target = base;
9751 if (step1 > 0)
9752 {
9753 rtx adjust;
9754
9755 /* Get an rtx for STEP1 that we can add to BASE. */
9756 adjust = GEN_INT (step1);
9757 if (!SMALL_OPERAND (step1))
9758 {
9759 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), adjust);
9760 adjust = MIPS_EPILOGUE_TEMP (Pmode);
9761 }
9762
9763 /* Normal mode code can copy the result straight into $sp. */
9764 if (!TARGET_MIPS16)
9765 target = stack_pointer_rtx;
9766
9767 emit_insn (gen_add3_insn (target, base, adjust));
9768 }
9769
9770 /* Copy TARGET into the stack pointer. */
9771 if (target != stack_pointer_rtx)
9772 mips_emit_move (stack_pointer_rtx, target);
9773
9774 /* If we're using addressing macros, $gp is implicitly used by all
9775 SYMBOL_REFs. We must emit a blockage insn before restoring $gp
9776 from the stack. */
9777 if (TARGET_CALL_SAVED_GP && !TARGET_EXPLICIT_RELOCS)
9778 emit_insn (gen_blockage ());
9779
9780 if (GENERATE_MIPS16E_SAVE_RESTORE && frame->mask != 0)
9781 {
9782 unsigned int regno, mask;
9783 HOST_WIDE_INT offset;
9784 rtx restore;
9785
9786 /* Generate the restore instruction. */
9787 mask = frame->mask;
9788 restore = mips16e_build_save_restore (true, &mask, &offset, 0, step2);
9789
9790 /* Restore any other registers manually. */
9791 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
9792 if (BITSET_P (mask, regno - GP_REG_FIRST))
9793 {
9794 offset -= UNITS_PER_WORD;
9795 mips_save_restore_reg (word_mode, regno, offset, mips_restore_reg);
9796 }
9797
9798 /* Restore the remaining registers and deallocate the final bit
9799 of the frame. */
9800 emit_insn (restore);
9801 }
9802 else
9803 {
9804 /* Restore the registers. */
9805 mips_for_each_saved_acc (frame->total_size - step2, mips_restore_reg);
9806 mips_for_each_saved_gpr_and_fpr (frame->total_size - step2,
9807 mips_restore_reg);
9808
9809 if (cfun->machine->interrupt_handler_p)
9810 {
9811 HOST_WIDE_INT offset;
9812 rtx mem;
9813
9814 offset = frame->cop0_sp_offset - (frame->total_size - step2);
9815 if (!cfun->machine->keep_interrupts_masked_p)
9816 {
9817 /* Restore the original EPC. */
9818 mem = gen_frame_mem (word_mode,
9819 plus_constant (stack_pointer_rtx, offset));
9820 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
9821 offset -= UNITS_PER_WORD;
9822
9823 /* Move to COP0 EPC. */
9824 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_EPC_REG_NUM),
9825 gen_rtx_REG (SImode, K0_REG_NUM)));
9826 }
9827
9828 /* Restore the original Status. */
9829 mem = gen_frame_mem (word_mode,
9830 plus_constant (stack_pointer_rtx, offset));
9831 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
9832 offset -= UNITS_PER_WORD;
9833
9834 /* If we don't use shoadow register set, we need to update SP. */
9835 if (!cfun->machine->use_shadow_register_set_p && step2 > 0)
9836 emit_insn (gen_add3_insn (stack_pointer_rtx,
9837 stack_pointer_rtx,
9838 GEN_INT (step2)));
9839
9840 /* Move to COP0 Status. */
9841 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
9842 gen_rtx_REG (SImode, K0_REG_NUM)));
9843 }
9844 else
9845 {
9846 /* Deallocate the final bit of the frame. */
9847 if (step2 > 0)
9848 emit_insn (gen_add3_insn (stack_pointer_rtx,
9849 stack_pointer_rtx,
9850 GEN_INT (step2)));
9851 }
9852 }
9853
9854 /* Add in the __builtin_eh_return stack adjustment. We need to
9855 use a temporary in MIPS16 code. */
9856 if (crtl->calls_eh_return)
9857 {
9858 if (TARGET_MIPS16)
9859 {
9860 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), stack_pointer_rtx);
9861 emit_insn (gen_add3_insn (MIPS_EPILOGUE_TEMP (Pmode),
9862 MIPS_EPILOGUE_TEMP (Pmode),
9863 EH_RETURN_STACKADJ_RTX));
9864 mips_emit_move (stack_pointer_rtx, MIPS_EPILOGUE_TEMP (Pmode));
9865 }
9866 else
9867 emit_insn (gen_add3_insn (stack_pointer_rtx,
9868 stack_pointer_rtx,
9869 EH_RETURN_STACKADJ_RTX));
9870 }
9871
9872 if (!sibcall_p)
9873 {
9874 mips_expand_before_return ();
9875 if (cfun->machine->interrupt_handler_p)
9876 {
9877 /* Interrupt handlers generate eret or deret. */
9878 if (cfun->machine->use_debug_exception_return_p)
9879 emit_jump_insn (gen_mips_deret ());
9880 else
9881 emit_jump_insn (gen_mips_eret ());
9882 }
9883 else
9884 {
9885 unsigned int regno;
9886
9887 /* When generating MIPS16 code, the normal
9888 mips_for_each_saved_gpr_and_fpr path will restore the return
9889 address into $7 rather than $31. */
9890 if (TARGET_MIPS16
9891 && !GENERATE_MIPS16E_SAVE_RESTORE
9892 && BITSET_P (frame->mask, 31))
9893 regno = GP_REG_FIRST + 7;
9894 else
9895 regno = GP_REG_FIRST + 31;
9896 emit_jump_insn (gen_return_internal (gen_rtx_REG (Pmode, regno)));
9897 }
9898 }
9899
9900 /* Search from the beginning to the first use of K0 or K1. */
9901 if (cfun->machine->interrupt_handler_p
9902 && !cfun->machine->keep_interrupts_masked_p)
9903 {
9904 for (insn = get_insns (); insn != NULL_RTX; insn = NEXT_INSN (insn))
9905 if (INSN_P (insn)
9906 && for_each_rtx (&PATTERN(insn), mips_kernel_reg_p, NULL))
9907 break;
9908 gcc_assert (insn != NULL_RTX);
9909 /* Insert disable interrupts before the first use of K0 or K1. */
9910 emit_insn_before (gen_mips_di (), insn);
9911 emit_insn_before (gen_mips_ehb (), insn);
9912 }
9913 }
9914 \f
9915 /* Return nonzero if this function is known to have a null epilogue.
9916 This allows the optimizer to omit jumps to jumps if no stack
9917 was created. */
9918
9919 bool
9920 mips_can_use_return_insn (void)
9921 {
9922 /* Interrupt handlers need to go through the epilogue. */
9923 if (cfun->machine->interrupt_handler_p)
9924 return false;
9925
9926 if (!reload_completed)
9927 return false;
9928
9929 if (crtl->profile)
9930 return false;
9931
9932 /* In MIPS16 mode, a function that returns a floating-point value
9933 needs to arrange to copy the return value into the floating-point
9934 registers. */
9935 if (mips16_cfun_returns_in_fpr_p ())
9936 return false;
9937
9938 return cfun->machine->frame.total_size == 0;
9939 }
9940 \f
9941 /* Return true if register REGNO can store a value of mode MODE.
9942 The result of this function is cached in mips_hard_regno_mode_ok. */
9943
9944 static bool
9945 mips_hard_regno_mode_ok_p (unsigned int regno, enum machine_mode mode)
9946 {
9947 unsigned int size;
9948 enum mode_class mclass;
9949
9950 if (mode == CCV2mode)
9951 return (ISA_HAS_8CC
9952 && ST_REG_P (regno)
9953 && (regno - ST_REG_FIRST) % 2 == 0);
9954
9955 if (mode == CCV4mode)
9956 return (ISA_HAS_8CC
9957 && ST_REG_P (regno)
9958 && (regno - ST_REG_FIRST) % 4 == 0);
9959
9960 if (mode == CCmode)
9961 {
9962 if (!ISA_HAS_8CC)
9963 return regno == FPSW_REGNUM;
9964
9965 return (ST_REG_P (regno)
9966 || GP_REG_P (regno)
9967 || FP_REG_P (regno));
9968 }
9969
9970 size = GET_MODE_SIZE (mode);
9971 mclass = GET_MODE_CLASS (mode);
9972
9973 if (GP_REG_P (regno))
9974 return ((regno - GP_REG_FIRST) & 1) == 0 || size <= UNITS_PER_WORD;
9975
9976 if (FP_REG_P (regno)
9977 && (((regno - FP_REG_FIRST) % MAX_FPRS_PER_FMT) == 0
9978 || (MIN_FPRS_PER_FMT == 1 && size <= UNITS_PER_FPREG)))
9979 {
9980 /* Allow TFmode for CCmode reloads. */
9981 if (mode == TFmode && ISA_HAS_8CC)
9982 return true;
9983
9984 /* Allow 64-bit vector modes for Loongson-2E/2F. */
9985 if (TARGET_LOONGSON_VECTORS
9986 && (mode == V2SImode
9987 || mode == V4HImode
9988 || mode == V8QImode
9989 || mode == DImode))
9990 return true;
9991
9992 if (mclass == MODE_FLOAT
9993 || mclass == MODE_COMPLEX_FLOAT
9994 || mclass == MODE_VECTOR_FLOAT)
9995 return size <= UNITS_PER_FPVALUE;
9996
9997 /* Allow integer modes that fit into a single register. We need
9998 to put integers into FPRs when using instructions like CVT
9999 and TRUNC. There's no point allowing sizes smaller than a word,
10000 because the FPU has no appropriate load/store instructions. */
10001 if (mclass == MODE_INT)
10002 return size >= MIN_UNITS_PER_WORD && size <= UNITS_PER_FPREG;
10003 }
10004
10005 if (ACC_REG_P (regno)
10006 && (INTEGRAL_MODE_P (mode) || ALL_FIXED_POINT_MODE_P (mode)))
10007 {
10008 if (MD_REG_P (regno))
10009 {
10010 /* After a multiplication or division, clobbering HI makes
10011 the value of LO unpredictable, and vice versa. This means
10012 that, for all interesting cases, HI and LO are effectively
10013 a single register.
10014
10015 We model this by requiring that any value that uses HI
10016 also uses LO. */
10017 if (size <= UNITS_PER_WORD * 2)
10018 return regno == (size <= UNITS_PER_WORD ? LO_REGNUM : MD_REG_FIRST);
10019 }
10020 else
10021 {
10022 /* DSP accumulators do not have the same restrictions as
10023 HI and LO, so we can treat them as normal doubleword
10024 registers. */
10025 if (size <= UNITS_PER_WORD)
10026 return true;
10027
10028 if (size <= UNITS_PER_WORD * 2
10029 && ((regno - DSP_ACC_REG_FIRST) & 1) == 0)
10030 return true;
10031 }
10032 }
10033
10034 if (ALL_COP_REG_P (regno))
10035 return mclass == MODE_INT && size <= UNITS_PER_WORD;
10036
10037 if (regno == GOT_VERSION_REGNUM)
10038 return mode == SImode;
10039
10040 return false;
10041 }
10042
10043 /* Implement HARD_REGNO_NREGS. */
10044
10045 unsigned int
10046 mips_hard_regno_nregs (int regno, enum machine_mode mode)
10047 {
10048 if (ST_REG_P (regno))
10049 /* The size of FP status registers is always 4, because they only hold
10050 CCmode values, and CCmode is always considered to be 4 bytes wide. */
10051 return (GET_MODE_SIZE (mode) + 3) / 4;
10052
10053 if (FP_REG_P (regno))
10054 return (GET_MODE_SIZE (mode) + UNITS_PER_FPREG - 1) / UNITS_PER_FPREG;
10055
10056 /* All other registers are word-sized. */
10057 return (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
10058 }
10059
10060 /* Implement CLASS_MAX_NREGS, taking the maximum of the cases
10061 in mips_hard_regno_nregs. */
10062
10063 int
10064 mips_class_max_nregs (enum reg_class rclass, enum machine_mode mode)
10065 {
10066 int size;
10067 HARD_REG_SET left;
10068
10069 size = 0x8000;
10070 COPY_HARD_REG_SET (left, reg_class_contents[(int) rclass]);
10071 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) ST_REGS]))
10072 {
10073 size = MIN (size, 4);
10074 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) ST_REGS]);
10075 }
10076 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) FP_REGS]))
10077 {
10078 size = MIN (size, UNITS_PER_FPREG);
10079 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) FP_REGS]);
10080 }
10081 if (!hard_reg_set_empty_p (left))
10082 size = MIN (size, UNITS_PER_WORD);
10083 return (GET_MODE_SIZE (mode) + size - 1) / size;
10084 }
10085
10086 /* Implement CANNOT_CHANGE_MODE_CLASS. */
10087
10088 bool
10089 mips_cannot_change_mode_class (enum machine_mode from ATTRIBUTE_UNUSED,
10090 enum machine_mode to ATTRIBUTE_UNUSED,
10091 enum reg_class rclass)
10092 {
10093 /* There are several problems with changing the modes of values
10094 in floating-point registers:
10095
10096 - When a multi-word value is stored in paired floating-point
10097 registers, the first register always holds the low word.
10098 We therefore can't allow FPRs to change between single-word
10099 and multi-word modes on big-endian targets.
10100
10101 - GCC assumes that each word of a multiword register can be accessed
10102 individually using SUBREGs. This is not true for floating-point
10103 registers if they are bigger than a word.
10104
10105 - Loading a 32-bit value into a 64-bit floating-point register
10106 will not sign-extend the value, despite what LOAD_EXTEND_OP says.
10107 We can't allow FPRs to change from SImode to to a wider mode on
10108 64-bit targets.
10109
10110 - If the FPU has already interpreted a value in one format, we must
10111 not ask it to treat the value as having a different format.
10112
10113 We therefore disallow all mode changes involving FPRs. */
10114 return reg_classes_intersect_p (FP_REGS, rclass);
10115 }
10116
10117 /* Return true if moves in mode MODE can use the FPU's mov.fmt instruction. */
10118
10119 static bool
10120 mips_mode_ok_for_mov_fmt_p (enum machine_mode mode)
10121 {
10122 switch (mode)
10123 {
10124 case SFmode:
10125 return TARGET_HARD_FLOAT;
10126
10127 case DFmode:
10128 return TARGET_HARD_FLOAT && TARGET_DOUBLE_FLOAT;
10129
10130 case V2SFmode:
10131 return TARGET_HARD_FLOAT && TARGET_PAIRED_SINGLE_FLOAT;
10132
10133 default:
10134 return false;
10135 }
10136 }
10137
10138 /* Implement MODES_TIEABLE_P. */
10139
10140 bool
10141 mips_modes_tieable_p (enum machine_mode mode1, enum machine_mode mode2)
10142 {
10143 /* FPRs allow no mode punning, so it's not worth tying modes if we'd
10144 prefer to put one of them in FPRs. */
10145 return (mode1 == mode2
10146 || (!mips_mode_ok_for_mov_fmt_p (mode1)
10147 && !mips_mode_ok_for_mov_fmt_p (mode2)));
10148 }
10149
10150 /* Implement PREFERRED_RELOAD_CLASS. */
10151
10152 enum reg_class
10153 mips_preferred_reload_class (rtx x, enum reg_class rclass)
10154 {
10155 if (mips_dangerous_for_la25_p (x) && reg_class_subset_p (LEA_REGS, rclass))
10156 return LEA_REGS;
10157
10158 if (reg_class_subset_p (FP_REGS, rclass)
10159 && mips_mode_ok_for_mov_fmt_p (GET_MODE (x)))
10160 return FP_REGS;
10161
10162 if (reg_class_subset_p (GR_REGS, rclass))
10163 rclass = GR_REGS;
10164
10165 if (TARGET_MIPS16 && reg_class_subset_p (M16_REGS, rclass))
10166 rclass = M16_REGS;
10167
10168 return rclass;
10169 }
10170
10171 /* RCLASS is a class involved in a REGISTER_MOVE_COST calculation.
10172 Return a "canonical" class to represent it in later calculations. */
10173
10174 static enum reg_class
10175 mips_canonicalize_move_class (enum reg_class rclass)
10176 {
10177 /* All moves involving accumulator registers have the same cost. */
10178 if (reg_class_subset_p (rclass, ACC_REGS))
10179 rclass = ACC_REGS;
10180
10181 /* Likewise promote subclasses of general registers to the most
10182 interesting containing class. */
10183 if (TARGET_MIPS16 && reg_class_subset_p (rclass, M16_REGS))
10184 rclass = M16_REGS;
10185 else if (reg_class_subset_p (rclass, GENERAL_REGS))
10186 rclass = GENERAL_REGS;
10187
10188 return rclass;
10189 }
10190
10191 /* Return the cost of moving a value of mode MODE from a register of
10192 class FROM to a GPR. Return 0 for classes that are unions of other
10193 classes handled by this function. */
10194
10195 static int
10196 mips_move_to_gpr_cost (enum machine_mode mode ATTRIBUTE_UNUSED,
10197 enum reg_class from)
10198 {
10199 switch (from)
10200 {
10201 case GENERAL_REGS:
10202 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
10203 return 2;
10204
10205 case ACC_REGS:
10206 /* MFLO and MFHI. */
10207 return 6;
10208
10209 case FP_REGS:
10210 /* MFC1, etc. */
10211 return 4;
10212
10213 case ST_REGS:
10214 /* LUI followed by MOVF. */
10215 return 4;
10216
10217 case COP0_REGS:
10218 case COP2_REGS:
10219 case COP3_REGS:
10220 /* This choice of value is historical. */
10221 return 5;
10222
10223 default:
10224 return 0;
10225 }
10226 }
10227
10228 /* Return the cost of moving a value of mode MODE from a GPR to a
10229 register of class TO. Return 0 for classes that are unions of
10230 other classes handled by this function. */
10231
10232 static int
10233 mips_move_from_gpr_cost (enum machine_mode mode, enum reg_class to)
10234 {
10235 switch (to)
10236 {
10237 case GENERAL_REGS:
10238 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
10239 return 2;
10240
10241 case ACC_REGS:
10242 /* MTLO and MTHI. */
10243 return 6;
10244
10245 case FP_REGS:
10246 /* MTC1, etc. */
10247 return 4;
10248
10249 case ST_REGS:
10250 /* A secondary reload through an FPR scratch. */
10251 return (mips_register_move_cost (mode, GENERAL_REGS, FP_REGS)
10252 + mips_register_move_cost (mode, FP_REGS, ST_REGS));
10253
10254 case COP0_REGS:
10255 case COP2_REGS:
10256 case COP3_REGS:
10257 /* This choice of value is historical. */
10258 return 5;
10259
10260 default:
10261 return 0;
10262 }
10263 }
10264
10265 /* Implement REGISTER_MOVE_COST. Return 0 for classes that are the
10266 maximum of the move costs for subclasses; regclass will work out
10267 the maximum for us. */
10268
10269 int
10270 mips_register_move_cost (enum machine_mode mode,
10271 enum reg_class from, enum reg_class to)
10272 {
10273 enum reg_class dregs;
10274 int cost1, cost2;
10275
10276 from = mips_canonicalize_move_class (from);
10277 to = mips_canonicalize_move_class (to);
10278
10279 /* Handle moves that can be done without using general-purpose registers. */
10280 if (from == FP_REGS)
10281 {
10282 if (to == FP_REGS && mips_mode_ok_for_mov_fmt_p (mode))
10283 /* MOV.FMT. */
10284 return 4;
10285 if (to == ST_REGS)
10286 /* The sequence generated by mips_expand_fcc_reload. */
10287 return 8;
10288 }
10289
10290 /* Handle cases in which only one class deviates from the ideal. */
10291 dregs = TARGET_MIPS16 ? M16_REGS : GENERAL_REGS;
10292 if (from == dregs)
10293 return mips_move_from_gpr_cost (mode, to);
10294 if (to == dregs)
10295 return mips_move_to_gpr_cost (mode, from);
10296
10297 /* Handles cases that require a GPR temporary. */
10298 cost1 = mips_move_to_gpr_cost (mode, from);
10299 if (cost1 != 0)
10300 {
10301 cost2 = mips_move_from_gpr_cost (mode, to);
10302 if (cost2 != 0)
10303 return cost1 + cost2;
10304 }
10305
10306 return 0;
10307 }
10308
10309 /* Implement TARGET_IRA_COVER_CLASSES. */
10310
10311 static const enum reg_class *
10312 mips_ira_cover_classes (void)
10313 {
10314 static const enum reg_class acc_classes[] = {
10315 GR_AND_ACC_REGS, FP_REGS, COP0_REGS, COP2_REGS, COP3_REGS,
10316 ST_REGS, LIM_REG_CLASSES
10317 };
10318 static const enum reg_class no_acc_classes[] = {
10319 GR_REGS, FP_REGS, COP0_REGS, COP2_REGS, COP3_REGS,
10320 ST_REGS, LIM_REG_CLASSES
10321 };
10322
10323 /* Don't allow the register allocators to use LO and HI in MIPS16 mode,
10324 which has no MTLO or MTHI instructions. Also, using GR_AND_ACC_REGS
10325 as a cover class only works well when we keep per-register costs.
10326 Using it when not optimizing can cause us to think accumulators
10327 have the same cost as GPRs in cases where GPRs are actually much
10328 cheaper. */
10329 return TARGET_MIPS16 || !optimize ? no_acc_classes : acc_classes;
10330 }
10331
10332 /* Return the register class required for a secondary register when
10333 copying between one of the registers in RCLASS and value X, which
10334 has mode MODE. X is the source of the move if IN_P, otherwise it
10335 is the destination. Return NO_REGS if no secondary register is
10336 needed. */
10337
10338 enum reg_class
10339 mips_secondary_reload_class (enum reg_class rclass,
10340 enum machine_mode mode, rtx x, bool in_p)
10341 {
10342 int regno;
10343
10344 /* If X is a constant that cannot be loaded into $25, it must be loaded
10345 into some other GPR. No other register class allows a direct move. */
10346 if (mips_dangerous_for_la25_p (x))
10347 return reg_class_subset_p (rclass, LEA_REGS) ? NO_REGS : LEA_REGS;
10348
10349 regno = true_regnum (x);
10350 if (TARGET_MIPS16)
10351 {
10352 /* In MIPS16 mode, every move must involve a member of M16_REGS. */
10353 if (!reg_class_subset_p (rclass, M16_REGS) && !M16_REG_P (regno))
10354 return M16_REGS;
10355
10356 return NO_REGS;
10357 }
10358
10359 /* Copying from accumulator registers to anywhere other than a general
10360 register requires a temporary general register. */
10361 if (reg_class_subset_p (rclass, ACC_REGS))
10362 return GP_REG_P (regno) ? NO_REGS : GR_REGS;
10363 if (ACC_REG_P (regno))
10364 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
10365
10366 /* We can only copy a value to a condition code register from a
10367 floating-point register, and even then we require a scratch
10368 floating-point register. We can only copy a value out of a
10369 condition-code register into a general register. */
10370 if (reg_class_subset_p (rclass, ST_REGS))
10371 {
10372 if (in_p)
10373 return FP_REGS;
10374 return GP_REG_P (regno) ? NO_REGS : GR_REGS;
10375 }
10376 if (ST_REG_P (regno))
10377 {
10378 if (!in_p)
10379 return FP_REGS;
10380 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
10381 }
10382
10383 if (reg_class_subset_p (rclass, FP_REGS))
10384 {
10385 if (MEM_P (x)
10386 && (GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8))
10387 /* In this case we can use lwc1, swc1, ldc1 or sdc1. We'll use
10388 pairs of lwc1s and swc1s if ldc1 and sdc1 are not supported. */
10389 return NO_REGS;
10390
10391 if (GP_REG_P (regno) || x == CONST0_RTX (mode))
10392 /* In this case we can use mtc1, mfc1, dmtc1 or dmfc1. */
10393 return NO_REGS;
10394
10395 if (CONSTANT_P (x) && !targetm.cannot_force_const_mem (x))
10396 /* We can force the constant to memory and use lwc1
10397 and ldc1. As above, we will use pairs of lwc1s if
10398 ldc1 is not supported. */
10399 return NO_REGS;
10400
10401 if (FP_REG_P (regno) && mips_mode_ok_for_mov_fmt_p (mode))
10402 /* In this case we can use mov.fmt. */
10403 return NO_REGS;
10404
10405 /* Otherwise, we need to reload through an integer register. */
10406 return GR_REGS;
10407 }
10408 if (FP_REG_P (regno))
10409 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
10410
10411 return NO_REGS;
10412 }
10413
10414 /* Implement TARGET_MODE_REP_EXTENDED. */
10415
10416 static int
10417 mips_mode_rep_extended (enum machine_mode mode, enum machine_mode mode_rep)
10418 {
10419 /* On 64-bit targets, SImode register values are sign-extended to DImode. */
10420 if (TARGET_64BIT && mode == SImode && mode_rep == DImode)
10421 return SIGN_EXTEND;
10422
10423 return UNKNOWN;
10424 }
10425 \f
10426 /* Implement TARGET_VALID_POINTER_MODE. */
10427
10428 static bool
10429 mips_valid_pointer_mode (enum machine_mode mode)
10430 {
10431 return mode == SImode || (TARGET_64BIT && mode == DImode);
10432 }
10433
10434 /* Implement TARGET_VECTOR_MODE_SUPPORTED_P. */
10435
10436 static bool
10437 mips_vector_mode_supported_p (enum machine_mode mode)
10438 {
10439 switch (mode)
10440 {
10441 case V2SFmode:
10442 return TARGET_PAIRED_SINGLE_FLOAT;
10443
10444 case V2HImode:
10445 case V4QImode:
10446 case V2HQmode:
10447 case V2UHQmode:
10448 case V2HAmode:
10449 case V2UHAmode:
10450 case V4QQmode:
10451 case V4UQQmode:
10452 return TARGET_DSP;
10453
10454 case V2SImode:
10455 case V4HImode:
10456 case V8QImode:
10457 return TARGET_LOONGSON_VECTORS;
10458
10459 default:
10460 return false;
10461 }
10462 }
10463
10464 /* Implement TARGET_SCALAR_MODE_SUPPORTED_P. */
10465
10466 static bool
10467 mips_scalar_mode_supported_p (enum machine_mode mode)
10468 {
10469 if (ALL_FIXED_POINT_MODE_P (mode)
10470 && GET_MODE_PRECISION (mode) <= 2 * BITS_PER_WORD)
10471 return true;
10472
10473 return default_scalar_mode_supported_p (mode);
10474 }
10475 \f
10476 /* Implement TARGET_INIT_LIBFUNCS. */
10477
10478 #include "config/gofast.h"
10479
10480 static void
10481 mips_init_libfuncs (void)
10482 {
10483 if (TARGET_FIX_VR4120)
10484 {
10485 /* Register the special divsi3 and modsi3 functions needed to work
10486 around VR4120 division errata. */
10487 set_optab_libfunc (sdiv_optab, SImode, "__vr4120_divsi3");
10488 set_optab_libfunc (smod_optab, SImode, "__vr4120_modsi3");
10489 }
10490
10491 if (TARGET_MIPS16 && TARGET_HARD_FLOAT_ABI)
10492 {
10493 /* Register the MIPS16 -mhard-float stubs. */
10494 set_optab_libfunc (add_optab, SFmode, "__mips16_addsf3");
10495 set_optab_libfunc (sub_optab, SFmode, "__mips16_subsf3");
10496 set_optab_libfunc (smul_optab, SFmode, "__mips16_mulsf3");
10497 set_optab_libfunc (sdiv_optab, SFmode, "__mips16_divsf3");
10498
10499 set_optab_libfunc (eq_optab, SFmode, "__mips16_eqsf2");
10500 set_optab_libfunc (ne_optab, SFmode, "__mips16_nesf2");
10501 set_optab_libfunc (gt_optab, SFmode, "__mips16_gtsf2");
10502 set_optab_libfunc (ge_optab, SFmode, "__mips16_gesf2");
10503 set_optab_libfunc (lt_optab, SFmode, "__mips16_ltsf2");
10504 set_optab_libfunc (le_optab, SFmode, "__mips16_lesf2");
10505 set_optab_libfunc (unord_optab, SFmode, "__mips16_unordsf2");
10506
10507 set_conv_libfunc (sfix_optab, SImode, SFmode, "__mips16_fix_truncsfsi");
10508 set_conv_libfunc (sfloat_optab, SFmode, SImode, "__mips16_floatsisf");
10509 set_conv_libfunc (ufloat_optab, SFmode, SImode, "__mips16_floatunsisf");
10510
10511 if (TARGET_DOUBLE_FLOAT)
10512 {
10513 set_optab_libfunc (add_optab, DFmode, "__mips16_adddf3");
10514 set_optab_libfunc (sub_optab, DFmode, "__mips16_subdf3");
10515 set_optab_libfunc (smul_optab, DFmode, "__mips16_muldf3");
10516 set_optab_libfunc (sdiv_optab, DFmode, "__mips16_divdf3");
10517
10518 set_optab_libfunc (eq_optab, DFmode, "__mips16_eqdf2");
10519 set_optab_libfunc (ne_optab, DFmode, "__mips16_nedf2");
10520 set_optab_libfunc (gt_optab, DFmode, "__mips16_gtdf2");
10521 set_optab_libfunc (ge_optab, DFmode, "__mips16_gedf2");
10522 set_optab_libfunc (lt_optab, DFmode, "__mips16_ltdf2");
10523 set_optab_libfunc (le_optab, DFmode, "__mips16_ledf2");
10524 set_optab_libfunc (unord_optab, DFmode, "__mips16_unorddf2");
10525
10526 set_conv_libfunc (sext_optab, DFmode, SFmode,
10527 "__mips16_extendsfdf2");
10528 set_conv_libfunc (trunc_optab, SFmode, DFmode,
10529 "__mips16_truncdfsf2");
10530 set_conv_libfunc (sfix_optab, SImode, DFmode,
10531 "__mips16_fix_truncdfsi");
10532 set_conv_libfunc (sfloat_optab, DFmode, SImode,
10533 "__mips16_floatsidf");
10534 set_conv_libfunc (ufloat_optab, DFmode, SImode,
10535 "__mips16_floatunsidf");
10536 }
10537 }
10538 else
10539 /* Register the gofast functions if selected using --enable-gofast. */
10540 gofast_maybe_init_libfuncs ();
10541
10542 /* The MIPS16 ISA does not have an encoding for "sync", so we rely
10543 on an external non-MIPS16 routine to implement __sync_synchronize. */
10544 if (TARGET_MIPS16)
10545 synchronize_libfunc = init_one_libfunc ("__sync_synchronize");
10546 }
10547
10548 /* Return the length of INSN. LENGTH is the initial length computed by
10549 attributes in the machine-description file. */
10550
10551 int
10552 mips_adjust_insn_length (rtx insn, int length)
10553 {
10554 /* A unconditional jump has an unfilled delay slot if it is not part
10555 of a sequence. A conditional jump normally has a delay slot, but
10556 does not on MIPS16. */
10557 if (CALL_P (insn) || (TARGET_MIPS16 ? simplejump_p (insn) : JUMP_P (insn)))
10558 length += 4;
10559
10560 /* See how many nops might be needed to avoid hardware hazards. */
10561 if (!cfun->machine->ignore_hazard_length_p && INSN_CODE (insn) >= 0)
10562 switch (get_attr_hazard (insn))
10563 {
10564 case HAZARD_NONE:
10565 break;
10566
10567 case HAZARD_DELAY:
10568 length += 4;
10569 break;
10570
10571 case HAZARD_HILO:
10572 length += 8;
10573 break;
10574 }
10575
10576 /* In order to make it easier to share MIPS16 and non-MIPS16 patterns,
10577 the .md file length attributes are 4-based for both modes.
10578 Adjust the MIPS16 ones here. */
10579 if (TARGET_MIPS16)
10580 length /= 2;
10581
10582 return length;
10583 }
10584
10585 /* Return an asm sequence to start a noat block and load the address
10586 of a label into $1. */
10587
10588 const char *
10589 mips_output_load_label (void)
10590 {
10591 if (TARGET_EXPLICIT_RELOCS)
10592 switch (mips_abi)
10593 {
10594 case ABI_N32:
10595 return "%[lw\t%@,%%got_page(%0)(%+)\n\taddiu\t%@,%@,%%got_ofst(%0)";
10596
10597 case ABI_64:
10598 return "%[ld\t%@,%%got_page(%0)(%+)\n\tdaddiu\t%@,%@,%%got_ofst(%0)";
10599
10600 default:
10601 if (ISA_HAS_LOAD_DELAY)
10602 return "%[lw\t%@,%%got(%0)(%+)%#\n\taddiu\t%@,%@,%%lo(%0)";
10603 return "%[lw\t%@,%%got(%0)(%+)\n\taddiu\t%@,%@,%%lo(%0)";
10604 }
10605 else
10606 {
10607 if (Pmode == DImode)
10608 return "%[dla\t%@,%0";
10609 else
10610 return "%[la\t%@,%0";
10611 }
10612 }
10613
10614 /* Return the assembly code for INSN, which has the operands given by
10615 OPERANDS, and which branches to OPERANDS[1] if some condition is true.
10616 BRANCH_IF_TRUE is the asm template that should be used if OPERANDS[1]
10617 is in range of a direct branch. BRANCH_IF_FALSE is an inverted
10618 version of BRANCH_IF_TRUE. */
10619
10620 const char *
10621 mips_output_conditional_branch (rtx insn, rtx *operands,
10622 const char *branch_if_true,
10623 const char *branch_if_false)
10624 {
10625 unsigned int length;
10626 rtx taken, not_taken;
10627
10628 gcc_assert (LABEL_P (operands[1]));
10629
10630 length = get_attr_length (insn);
10631 if (length <= 8)
10632 {
10633 /* Just a simple conditional branch. */
10634 mips_branch_likely = (final_sequence && INSN_ANNULLED_BRANCH_P (insn));
10635 return branch_if_true;
10636 }
10637
10638 /* Generate a reversed branch around a direct jump. This fallback does
10639 not use branch-likely instructions. */
10640 mips_branch_likely = false;
10641 not_taken = gen_label_rtx ();
10642 taken = operands[1];
10643
10644 /* Generate the reversed branch to NOT_TAKEN. */
10645 operands[1] = not_taken;
10646 output_asm_insn (branch_if_false, operands);
10647
10648 /* If INSN has a delay slot, we must provide delay slots for both the
10649 branch to NOT_TAKEN and the conditional jump. We must also ensure
10650 that INSN's delay slot is executed in the appropriate cases. */
10651 if (final_sequence)
10652 {
10653 /* This first delay slot will always be executed, so use INSN's
10654 delay slot if is not annulled. */
10655 if (!INSN_ANNULLED_BRANCH_P (insn))
10656 {
10657 final_scan_insn (XVECEXP (final_sequence, 0, 1),
10658 asm_out_file, optimize, 1, NULL);
10659 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
10660 }
10661 else
10662 output_asm_insn ("nop", 0);
10663 fprintf (asm_out_file, "\n");
10664 }
10665
10666 /* Output the unconditional branch to TAKEN. */
10667 if (length <= 16)
10668 output_asm_insn ("j\t%0%/", &taken);
10669 else
10670 {
10671 output_asm_insn (mips_output_load_label (), &taken);
10672 output_asm_insn ("jr\t%@%]%/", 0);
10673 }
10674
10675 /* Now deal with its delay slot; see above. */
10676 if (final_sequence)
10677 {
10678 /* This delay slot will only be executed if the branch is taken.
10679 Use INSN's delay slot if is annulled. */
10680 if (INSN_ANNULLED_BRANCH_P (insn))
10681 {
10682 final_scan_insn (XVECEXP (final_sequence, 0, 1),
10683 asm_out_file, optimize, 1, NULL);
10684 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
10685 }
10686 else
10687 output_asm_insn ("nop", 0);
10688 fprintf (asm_out_file, "\n");
10689 }
10690
10691 /* Output NOT_TAKEN. */
10692 targetm.asm_out.internal_label (asm_out_file, "L",
10693 CODE_LABEL_NUMBER (not_taken));
10694 return "";
10695 }
10696
10697 /* Return the assembly code for INSN, which branches to OPERANDS[1]
10698 if some ordering condition is true. The condition is given by
10699 OPERANDS[0] if !INVERTED_P, otherwise it is the inverse of
10700 OPERANDS[0]. OPERANDS[2] is the comparison's first operand;
10701 its second is always zero. */
10702
10703 const char *
10704 mips_output_order_conditional_branch (rtx insn, rtx *operands, bool inverted_p)
10705 {
10706 const char *branch[2];
10707
10708 /* Make BRANCH[1] branch to OPERANDS[1] when the condition is true.
10709 Make BRANCH[0] branch on the inverse condition. */
10710 switch (GET_CODE (operands[0]))
10711 {
10712 /* These cases are equivalent to comparisons against zero. */
10713 case LEU:
10714 inverted_p = !inverted_p;
10715 /* Fall through. */
10716 case GTU:
10717 branch[!inverted_p] = MIPS_BRANCH ("bne", "%2,%.,%1");
10718 branch[inverted_p] = MIPS_BRANCH ("beq", "%2,%.,%1");
10719 break;
10720
10721 /* These cases are always true or always false. */
10722 case LTU:
10723 inverted_p = !inverted_p;
10724 /* Fall through. */
10725 case GEU:
10726 branch[!inverted_p] = MIPS_BRANCH ("beq", "%.,%.,%1");
10727 branch[inverted_p] = MIPS_BRANCH ("bne", "%.,%.,%1");
10728 break;
10729
10730 default:
10731 branch[!inverted_p] = MIPS_BRANCH ("b%C0z", "%2,%1");
10732 branch[inverted_p] = MIPS_BRANCH ("b%N0z", "%2,%1");
10733 break;
10734 }
10735 return mips_output_conditional_branch (insn, operands, branch[1], branch[0]);
10736 }
10737 \f
10738 /* Return the assembly code for __sync_*() loop LOOP. The loop should support
10739 both normal and likely branches, using %? and %~ where appropriate. */
10740
10741 const char *
10742 mips_output_sync_loop (const char *loop)
10743 {
10744 /* Use branch-likely instructions to work around the LL/SC R10000 errata. */
10745 mips_branch_likely = TARGET_FIX_R10000;
10746 return loop;
10747 }
10748 \f
10749 /* Return the assembly code for DIV or DDIV instruction DIVISION, which has
10750 the operands given by OPERANDS. Add in a divide-by-zero check if needed.
10751
10752 When working around R4000 and R4400 errata, we need to make sure that
10753 the division is not immediately followed by a shift[1][2]. We also
10754 need to stop the division from being put into a branch delay slot[3].
10755 The easiest way to avoid both problems is to add a nop after the
10756 division. When a divide-by-zero check is needed, this nop can be
10757 used to fill the branch delay slot.
10758
10759 [1] If a double-word or a variable shift executes immediately
10760 after starting an integer division, the shift may give an
10761 incorrect result. See quotations of errata #16 and #28 from
10762 "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
10763 in mips.md for details.
10764
10765 [2] A similar bug to [1] exists for all revisions of the
10766 R4000 and the R4400 when run in an MC configuration.
10767 From "MIPS R4000MC Errata, Processor Revision 2.2 and 3.0":
10768
10769 "19. In this following sequence:
10770
10771 ddiv (or ddivu or div or divu)
10772 dsll32 (or dsrl32, dsra32)
10773
10774 if an MPT stall occurs, while the divide is slipping the cpu
10775 pipeline, then the following double shift would end up with an
10776 incorrect result.
10777
10778 Workaround: The compiler needs to avoid generating any
10779 sequence with divide followed by extended double shift."
10780
10781 This erratum is also present in "MIPS R4400MC Errata, Processor
10782 Revision 1.0" and "MIPS R4400MC Errata, Processor Revision 2.0
10783 & 3.0" as errata #10 and #4, respectively.
10784
10785 [3] From "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
10786 (also valid for MIPS R4000MC processors):
10787
10788 "52. R4000SC: This bug does not apply for the R4000PC.
10789
10790 There are two flavors of this bug:
10791
10792 1) If the instruction just after divide takes an RF exception
10793 (tlb-refill, tlb-invalid) and gets an instruction cache
10794 miss (both primary and secondary) and the line which is
10795 currently in secondary cache at this index had the first
10796 data word, where the bits 5..2 are set, then R4000 would
10797 get a wrong result for the div.
10798
10799 ##1
10800 nop
10801 div r8, r9
10802 ------------------- # end-of page. -tlb-refill
10803 nop
10804 ##2
10805 nop
10806 div r8, r9
10807 ------------------- # end-of page. -tlb-invalid
10808 nop
10809
10810 2) If the divide is in the taken branch delay slot, where the
10811 target takes RF exception and gets an I-cache miss for the
10812 exception vector or where I-cache miss occurs for the
10813 target address, under the above mentioned scenarios, the
10814 div would get wrong results.
10815
10816 ##1
10817 j r2 # to next page mapped or unmapped
10818 div r8,r9 # this bug would be there as long
10819 # as there is an ICache miss and
10820 nop # the "data pattern" is present
10821
10822 ##2
10823 beq r0, r0, NextPage # to Next page
10824 div r8,r9
10825 nop
10826
10827 This bug is present for div, divu, ddiv, and ddivu
10828 instructions.
10829
10830 Workaround: For item 1), OS could make sure that the next page
10831 after the divide instruction is also mapped. For item 2), the
10832 compiler could make sure that the divide instruction is not in
10833 the branch delay slot."
10834
10835 These processors have PRId values of 0x00004220 and 0x00004300 for
10836 the R4000 and 0x00004400, 0x00004500 and 0x00004600 for the R4400. */
10837
10838 const char *
10839 mips_output_division (const char *division, rtx *operands)
10840 {
10841 const char *s;
10842
10843 s = division;
10844 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
10845 {
10846 output_asm_insn (s, operands);
10847 s = "nop";
10848 }
10849 if (TARGET_CHECK_ZERO_DIV)
10850 {
10851 if (TARGET_MIPS16)
10852 {
10853 output_asm_insn (s, operands);
10854 s = "bnez\t%2,1f\n\tbreak\t7\n1:";
10855 }
10856 else if (GENERATE_DIVIDE_TRAPS)
10857 {
10858 output_asm_insn (s, operands);
10859 s = "teq\t%2,%.,7";
10860 }
10861 else
10862 {
10863 output_asm_insn ("%(bne\t%2,%.,1f", operands);
10864 output_asm_insn (s, operands);
10865 s = "break\t7%)\n1:";
10866 }
10867 }
10868 return s;
10869 }
10870 \f
10871 /* Return true if IN_INSN is a multiply-add or multiply-subtract
10872 instruction and if OUT_INSN assigns to the accumulator operand. */
10873
10874 bool
10875 mips_linked_madd_p (rtx out_insn, rtx in_insn)
10876 {
10877 rtx x;
10878
10879 x = single_set (in_insn);
10880 if (x == 0)
10881 return false;
10882
10883 x = SET_SRC (x);
10884
10885 if (GET_CODE (x) == PLUS
10886 && GET_CODE (XEXP (x, 0)) == MULT
10887 && reg_set_p (XEXP (x, 1), out_insn))
10888 return true;
10889
10890 if (GET_CODE (x) == MINUS
10891 && GET_CODE (XEXP (x, 1)) == MULT
10892 && reg_set_p (XEXP (x, 0), out_insn))
10893 return true;
10894
10895 return false;
10896 }
10897
10898 /* True if the dependency between OUT_INSN and IN_INSN is on the store
10899 data rather than the address. We need this because the cprestore
10900 pattern is type "store", but is defined using an UNSPEC_VOLATILE,
10901 which causes the default routine to abort. We just return false
10902 for that case. */
10903
10904 bool
10905 mips_store_data_bypass_p (rtx out_insn, rtx in_insn)
10906 {
10907 if (GET_CODE (PATTERN (in_insn)) == UNSPEC_VOLATILE)
10908 return false;
10909
10910 return !store_data_bypass_p (out_insn, in_insn);
10911 }
10912 \f
10913
10914 /* Variables and flags used in scheduler hooks when tuning for
10915 Loongson 2E/2F. */
10916 static struct
10917 {
10918 /* Variables to support Loongson 2E/2F round-robin [F]ALU1/2 dispatch
10919 strategy. */
10920
10921 /* If true, then next ALU1/2 instruction will go to ALU1. */
10922 bool alu1_turn_p;
10923
10924 /* If true, then next FALU1/2 unstruction will go to FALU1. */
10925 bool falu1_turn_p;
10926
10927 /* Codes to query if [f]alu{1,2}_core units are subscribed or not. */
10928 int alu1_core_unit_code;
10929 int alu2_core_unit_code;
10930 int falu1_core_unit_code;
10931 int falu2_core_unit_code;
10932
10933 /* True if current cycle has a multi instruction.
10934 This flag is used in mips_ls2_dfa_post_advance_cycle. */
10935 bool cycle_has_multi_p;
10936
10937 /* Instructions to subscribe ls2_[f]alu{1,2}_turn_enabled units.
10938 These are used in mips_ls2_dfa_post_advance_cycle to initialize
10939 DFA state.
10940 E.g., when alu1_turn_enabled_insn is issued it makes next ALU1/2
10941 instruction to go ALU1. */
10942 rtx alu1_turn_enabled_insn;
10943 rtx alu2_turn_enabled_insn;
10944 rtx falu1_turn_enabled_insn;
10945 rtx falu2_turn_enabled_insn;
10946 } mips_ls2;
10947
10948 /* Implement TARGET_SCHED_ADJUST_COST. We assume that anti and output
10949 dependencies have no cost, except on the 20Kc where output-dependence
10950 is treated like input-dependence. */
10951
10952 static int
10953 mips_adjust_cost (rtx insn ATTRIBUTE_UNUSED, rtx link,
10954 rtx dep ATTRIBUTE_UNUSED, int cost)
10955 {
10956 if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT
10957 && TUNE_20KC)
10958 return cost;
10959 if (REG_NOTE_KIND (link) != 0)
10960 return 0;
10961 return cost;
10962 }
10963
10964 /* Return the number of instructions that can be issued per cycle. */
10965
10966 static int
10967 mips_issue_rate (void)
10968 {
10969 switch (mips_tune)
10970 {
10971 case PROCESSOR_74KC:
10972 case PROCESSOR_74KF2_1:
10973 case PROCESSOR_74KF1_1:
10974 case PROCESSOR_74KF3_2:
10975 /* The 74k is not strictly quad-issue cpu, but can be seen as one
10976 by the scheduler. It can issue 1 ALU, 1 AGEN and 2 FPU insns,
10977 but in reality only a maximum of 3 insns can be issued as
10978 floating-point loads and stores also require a slot in the
10979 AGEN pipe. */
10980 case PROCESSOR_R10000:
10981 /* All R10K Processors are quad-issue (being the first MIPS
10982 processors to support this feature). */
10983 return 4;
10984
10985 case PROCESSOR_20KC:
10986 case PROCESSOR_R4130:
10987 case PROCESSOR_R5400:
10988 case PROCESSOR_R5500:
10989 case PROCESSOR_R7000:
10990 case PROCESSOR_R9000:
10991 case PROCESSOR_OCTEON:
10992 return 2;
10993
10994 case PROCESSOR_SB1:
10995 case PROCESSOR_SB1A:
10996 /* This is actually 4, but we get better performance if we claim 3.
10997 This is partly because of unwanted speculative code motion with the
10998 larger number, and partly because in most common cases we can't
10999 reach the theoretical max of 4. */
11000 return 3;
11001
11002 case PROCESSOR_LOONGSON_2E:
11003 case PROCESSOR_LOONGSON_2F:
11004 return 4;
11005
11006 default:
11007 return 1;
11008 }
11009 }
11010
11011 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook for Loongson2. */
11012
11013 static void
11014 mips_ls2_init_dfa_post_cycle_insn (void)
11015 {
11016 start_sequence ();
11017 emit_insn (gen_ls2_alu1_turn_enabled_insn ());
11018 mips_ls2.alu1_turn_enabled_insn = get_insns ();
11019 end_sequence ();
11020
11021 start_sequence ();
11022 emit_insn (gen_ls2_alu2_turn_enabled_insn ());
11023 mips_ls2.alu2_turn_enabled_insn = get_insns ();
11024 end_sequence ();
11025
11026 start_sequence ();
11027 emit_insn (gen_ls2_falu1_turn_enabled_insn ());
11028 mips_ls2.falu1_turn_enabled_insn = get_insns ();
11029 end_sequence ();
11030
11031 start_sequence ();
11032 emit_insn (gen_ls2_falu2_turn_enabled_insn ());
11033 mips_ls2.falu2_turn_enabled_insn = get_insns ();
11034 end_sequence ();
11035
11036 mips_ls2.alu1_core_unit_code = get_cpu_unit_code ("ls2_alu1_core");
11037 mips_ls2.alu2_core_unit_code = get_cpu_unit_code ("ls2_alu2_core");
11038 mips_ls2.falu1_core_unit_code = get_cpu_unit_code ("ls2_falu1_core");
11039 mips_ls2.falu2_core_unit_code = get_cpu_unit_code ("ls2_falu2_core");
11040 }
11041
11042 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook.
11043 Init data used in mips_dfa_post_advance_cycle. */
11044
11045 static void
11046 mips_init_dfa_post_cycle_insn (void)
11047 {
11048 if (TUNE_LOONGSON_2EF)
11049 mips_ls2_init_dfa_post_cycle_insn ();
11050 }
11051
11052 /* Initialize STATE when scheduling for Loongson 2E/2F.
11053 Support round-robin dispatch scheme by enabling only one of
11054 ALU1/ALU2 and one of FALU1/FALU2 units for ALU1/2 and FALU1/2 instructions
11055 respectively. */
11056
11057 static void
11058 mips_ls2_dfa_post_advance_cycle (state_t state)
11059 {
11060 if (cpu_unit_reservation_p (state, mips_ls2.alu1_core_unit_code))
11061 {
11062 /* Though there are no non-pipelined ALU1 insns,
11063 we can get an instruction of type 'multi' before reload. */
11064 gcc_assert (mips_ls2.cycle_has_multi_p);
11065 mips_ls2.alu1_turn_p = false;
11066 }
11067
11068 mips_ls2.cycle_has_multi_p = false;
11069
11070 if (cpu_unit_reservation_p (state, mips_ls2.alu2_core_unit_code))
11071 /* We have a non-pipelined alu instruction in the core,
11072 adjust round-robin counter. */
11073 mips_ls2.alu1_turn_p = true;
11074
11075 if (mips_ls2.alu1_turn_p)
11076 {
11077 if (state_transition (state, mips_ls2.alu1_turn_enabled_insn) >= 0)
11078 gcc_unreachable ();
11079 }
11080 else
11081 {
11082 if (state_transition (state, mips_ls2.alu2_turn_enabled_insn) >= 0)
11083 gcc_unreachable ();
11084 }
11085
11086 if (cpu_unit_reservation_p (state, mips_ls2.falu1_core_unit_code))
11087 {
11088 /* There are no non-pipelined FALU1 insns. */
11089 gcc_unreachable ();
11090 mips_ls2.falu1_turn_p = false;
11091 }
11092
11093 if (cpu_unit_reservation_p (state, mips_ls2.falu2_core_unit_code))
11094 /* We have a non-pipelined falu instruction in the core,
11095 adjust round-robin counter. */
11096 mips_ls2.falu1_turn_p = true;
11097
11098 if (mips_ls2.falu1_turn_p)
11099 {
11100 if (state_transition (state, mips_ls2.falu1_turn_enabled_insn) >= 0)
11101 gcc_unreachable ();
11102 }
11103 else
11104 {
11105 if (state_transition (state, mips_ls2.falu2_turn_enabled_insn) >= 0)
11106 gcc_unreachable ();
11107 }
11108 }
11109
11110 /* Implement TARGET_SCHED_DFA_POST_ADVANCE_CYCLE.
11111 This hook is being called at the start of each cycle. */
11112
11113 static void
11114 mips_dfa_post_advance_cycle (void)
11115 {
11116 if (TUNE_LOONGSON_2EF)
11117 mips_ls2_dfa_post_advance_cycle (curr_state);
11118 }
11119
11120 /* Implement TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD. This should
11121 be as wide as the scheduling freedom in the DFA. */
11122
11123 static int
11124 mips_multipass_dfa_lookahead (void)
11125 {
11126 /* Can schedule up to 4 of the 6 function units in any one cycle. */
11127 if (TUNE_SB1)
11128 return 4;
11129
11130 if (TUNE_LOONGSON_2EF)
11131 return 4;
11132
11133 if (TUNE_OCTEON)
11134 return 2;
11135
11136 return 0;
11137 }
11138 \f
11139 /* Remove the instruction at index LOWER from ready queue READY and
11140 reinsert it in front of the instruction at index HIGHER. LOWER must
11141 be <= HIGHER. */
11142
11143 static void
11144 mips_promote_ready (rtx *ready, int lower, int higher)
11145 {
11146 rtx new_head;
11147 int i;
11148
11149 new_head = ready[lower];
11150 for (i = lower; i < higher; i++)
11151 ready[i] = ready[i + 1];
11152 ready[i] = new_head;
11153 }
11154
11155 /* If the priority of the instruction at POS2 in the ready queue READY
11156 is within LIMIT units of that of the instruction at POS1, swap the
11157 instructions if POS2 is not already less than POS1. */
11158
11159 static void
11160 mips_maybe_swap_ready (rtx *ready, int pos1, int pos2, int limit)
11161 {
11162 if (pos1 < pos2
11163 && INSN_PRIORITY (ready[pos1]) + limit >= INSN_PRIORITY (ready[pos2]))
11164 {
11165 rtx temp;
11166
11167 temp = ready[pos1];
11168 ready[pos1] = ready[pos2];
11169 ready[pos2] = temp;
11170 }
11171 }
11172 \f
11173 /* Used by TUNE_MACC_CHAINS to record the last scheduled instruction
11174 that may clobber hi or lo. */
11175 static rtx mips_macc_chains_last_hilo;
11176
11177 /* A TUNE_MACC_CHAINS helper function. Record that instruction INSN has
11178 been scheduled, updating mips_macc_chains_last_hilo appropriately. */
11179
11180 static void
11181 mips_macc_chains_record (rtx insn)
11182 {
11183 if (get_attr_may_clobber_hilo (insn))
11184 mips_macc_chains_last_hilo = insn;
11185 }
11186
11187 /* A TUNE_MACC_CHAINS helper function. Search ready queue READY, which
11188 has NREADY elements, looking for a multiply-add or multiply-subtract
11189 instruction that is cumulative with mips_macc_chains_last_hilo.
11190 If there is one, promote it ahead of anything else that might
11191 clobber hi or lo. */
11192
11193 static void
11194 mips_macc_chains_reorder (rtx *ready, int nready)
11195 {
11196 int i, j;
11197
11198 if (mips_macc_chains_last_hilo != 0)
11199 for (i = nready - 1; i >= 0; i--)
11200 if (mips_linked_madd_p (mips_macc_chains_last_hilo, ready[i]))
11201 {
11202 for (j = nready - 1; j > i; j--)
11203 if (recog_memoized (ready[j]) >= 0
11204 && get_attr_may_clobber_hilo (ready[j]))
11205 {
11206 mips_promote_ready (ready, i, j);
11207 break;
11208 }
11209 break;
11210 }
11211 }
11212 \f
11213 /* The last instruction to be scheduled. */
11214 static rtx vr4130_last_insn;
11215
11216 /* A note_stores callback used by vr4130_true_reg_dependence_p. DATA
11217 points to an rtx that is initially an instruction. Nullify the rtx
11218 if the instruction uses the value of register X. */
11219
11220 static void
11221 vr4130_true_reg_dependence_p_1 (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
11222 void *data)
11223 {
11224 rtx *insn_ptr;
11225
11226 insn_ptr = (rtx *) data;
11227 if (REG_P (x)
11228 && *insn_ptr != 0
11229 && reg_referenced_p (x, PATTERN (*insn_ptr)))
11230 *insn_ptr = 0;
11231 }
11232
11233 /* Return true if there is true register dependence between vr4130_last_insn
11234 and INSN. */
11235
11236 static bool
11237 vr4130_true_reg_dependence_p (rtx insn)
11238 {
11239 note_stores (PATTERN (vr4130_last_insn),
11240 vr4130_true_reg_dependence_p_1, &insn);
11241 return insn == 0;
11242 }
11243
11244 /* A TUNE_MIPS4130 helper function. Given that INSN1 is at the head of
11245 the ready queue and that INSN2 is the instruction after it, return
11246 true if it is worth promoting INSN2 ahead of INSN1. Look for cases
11247 in which INSN1 and INSN2 can probably issue in parallel, but for
11248 which (INSN2, INSN1) should be less sensitive to instruction
11249 alignment than (INSN1, INSN2). See 4130.md for more details. */
11250
11251 static bool
11252 vr4130_swap_insns_p (rtx insn1, rtx insn2)
11253 {
11254 sd_iterator_def sd_it;
11255 dep_t dep;
11256
11257 /* Check for the following case:
11258
11259 1) there is some other instruction X with an anti dependence on INSN1;
11260 2) X has a higher priority than INSN2; and
11261 3) X is an arithmetic instruction (and thus has no unit restrictions).
11262
11263 If INSN1 is the last instruction blocking X, it would better to
11264 choose (INSN1, X) over (INSN2, INSN1). */
11265 FOR_EACH_DEP (insn1, SD_LIST_FORW, sd_it, dep)
11266 if (DEP_TYPE (dep) == REG_DEP_ANTI
11267 && INSN_PRIORITY (DEP_CON (dep)) > INSN_PRIORITY (insn2)
11268 && recog_memoized (DEP_CON (dep)) >= 0
11269 && get_attr_vr4130_class (DEP_CON (dep)) == VR4130_CLASS_ALU)
11270 return false;
11271
11272 if (vr4130_last_insn != 0
11273 && recog_memoized (insn1) >= 0
11274 && recog_memoized (insn2) >= 0)
11275 {
11276 /* See whether INSN1 and INSN2 use different execution units,
11277 or if they are both ALU-type instructions. If so, they can
11278 probably execute in parallel. */
11279 enum attr_vr4130_class class1 = get_attr_vr4130_class (insn1);
11280 enum attr_vr4130_class class2 = get_attr_vr4130_class (insn2);
11281 if (class1 != class2 || class1 == VR4130_CLASS_ALU)
11282 {
11283 /* If only one of the instructions has a dependence on
11284 vr4130_last_insn, prefer to schedule the other one first. */
11285 bool dep1_p = vr4130_true_reg_dependence_p (insn1);
11286 bool dep2_p = vr4130_true_reg_dependence_p (insn2);
11287 if (dep1_p != dep2_p)
11288 return dep1_p;
11289
11290 /* Prefer to schedule INSN2 ahead of INSN1 if vr4130_last_insn
11291 is not an ALU-type instruction and if INSN1 uses the same
11292 execution unit. (Note that if this condition holds, we already
11293 know that INSN2 uses a different execution unit.) */
11294 if (class1 != VR4130_CLASS_ALU
11295 && recog_memoized (vr4130_last_insn) >= 0
11296 && class1 == get_attr_vr4130_class (vr4130_last_insn))
11297 return true;
11298 }
11299 }
11300 return false;
11301 }
11302
11303 /* A TUNE_MIPS4130 helper function. (READY, NREADY) describes a ready
11304 queue with at least two instructions. Swap the first two if
11305 vr4130_swap_insns_p says that it could be worthwhile. */
11306
11307 static void
11308 vr4130_reorder (rtx *ready, int nready)
11309 {
11310 if (vr4130_swap_insns_p (ready[nready - 1], ready[nready - 2]))
11311 mips_promote_ready (ready, nready - 2, nready - 1);
11312 }
11313 \f
11314 /* Record whether last 74k AGEN instruction was a load or store. */
11315 static enum attr_type mips_last_74k_agen_insn = TYPE_UNKNOWN;
11316
11317 /* Initialize mips_last_74k_agen_insn from INSN. A null argument
11318 resets to TYPE_UNKNOWN state. */
11319
11320 static void
11321 mips_74k_agen_init (rtx insn)
11322 {
11323 if (!insn || !NONJUMP_INSN_P (insn))
11324 mips_last_74k_agen_insn = TYPE_UNKNOWN;
11325 else
11326 {
11327 enum attr_type type = get_attr_type (insn);
11328 if (type == TYPE_LOAD || type == TYPE_STORE)
11329 mips_last_74k_agen_insn = type;
11330 }
11331 }
11332
11333 /* A TUNE_74K helper function. The 74K AGEN pipeline likes multiple
11334 loads to be grouped together, and multiple stores to be grouped
11335 together. Swap things around in the ready queue to make this happen. */
11336
11337 static void
11338 mips_74k_agen_reorder (rtx *ready, int nready)
11339 {
11340 int i;
11341 int store_pos, load_pos;
11342
11343 store_pos = -1;
11344 load_pos = -1;
11345
11346 for (i = nready - 1; i >= 0; i--)
11347 {
11348 rtx insn = ready[i];
11349 if (USEFUL_INSN_P (insn))
11350 switch (get_attr_type (insn))
11351 {
11352 case TYPE_STORE:
11353 if (store_pos == -1)
11354 store_pos = i;
11355 break;
11356
11357 case TYPE_LOAD:
11358 if (load_pos == -1)
11359 load_pos = i;
11360 break;
11361
11362 default:
11363 break;
11364 }
11365 }
11366
11367 if (load_pos == -1 || store_pos == -1)
11368 return;
11369
11370 switch (mips_last_74k_agen_insn)
11371 {
11372 case TYPE_UNKNOWN:
11373 /* Prefer to schedule loads since they have a higher latency. */
11374 case TYPE_LOAD:
11375 /* Swap loads to the front of the queue. */
11376 mips_maybe_swap_ready (ready, load_pos, store_pos, 4);
11377 break;
11378 case TYPE_STORE:
11379 /* Swap stores to the front of the queue. */
11380 mips_maybe_swap_ready (ready, store_pos, load_pos, 4);
11381 break;
11382 default:
11383 break;
11384 }
11385 }
11386 \f
11387 /* Implement TARGET_SCHED_INIT. */
11388
11389 static void
11390 mips_sched_init (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
11391 int max_ready ATTRIBUTE_UNUSED)
11392 {
11393 mips_macc_chains_last_hilo = 0;
11394 vr4130_last_insn = 0;
11395 mips_74k_agen_init (NULL_RTX);
11396
11397 /* When scheduling for Loongson2, branch instructions go to ALU1,
11398 therefore basic block is most likely to start with round-robin counter
11399 pointed to ALU2. */
11400 mips_ls2.alu1_turn_p = false;
11401 mips_ls2.falu1_turn_p = true;
11402 }
11403
11404 /* Implement TARGET_SCHED_REORDER and TARGET_SCHED_REORDER2. */
11405
11406 static int
11407 mips_sched_reorder (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
11408 rtx *ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
11409 {
11410 if (!reload_completed
11411 && TUNE_MACC_CHAINS
11412 && *nreadyp > 0)
11413 mips_macc_chains_reorder (ready, *nreadyp);
11414
11415 if (reload_completed
11416 && TUNE_MIPS4130
11417 && !TARGET_VR4130_ALIGN
11418 && *nreadyp > 1)
11419 vr4130_reorder (ready, *nreadyp);
11420
11421 if (TUNE_74K)
11422 mips_74k_agen_reorder (ready, *nreadyp);
11423
11424 return mips_issue_rate ();
11425 }
11426
11427 /* Update round-robin counters for ALU1/2 and FALU1/2. */
11428
11429 static void
11430 mips_ls2_variable_issue (rtx insn)
11431 {
11432 if (mips_ls2.alu1_turn_p)
11433 {
11434 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu1_core_unit_code))
11435 mips_ls2.alu1_turn_p = false;
11436 }
11437 else
11438 {
11439 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu2_core_unit_code))
11440 mips_ls2.alu1_turn_p = true;
11441 }
11442
11443 if (mips_ls2.falu1_turn_p)
11444 {
11445 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu1_core_unit_code))
11446 mips_ls2.falu1_turn_p = false;
11447 }
11448 else
11449 {
11450 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu2_core_unit_code))
11451 mips_ls2.falu1_turn_p = true;
11452 }
11453
11454 if (recog_memoized (insn) >= 0)
11455 mips_ls2.cycle_has_multi_p |= (get_attr_type (insn) == TYPE_MULTI);
11456 }
11457
11458 /* Implement TARGET_SCHED_VARIABLE_ISSUE. */
11459
11460 static int
11461 mips_variable_issue (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
11462 rtx insn, int more)
11463 {
11464 /* Ignore USEs and CLOBBERs; don't count them against the issue rate. */
11465 if (USEFUL_INSN_P (insn))
11466 {
11467 more--;
11468 if (!reload_completed && TUNE_MACC_CHAINS)
11469 mips_macc_chains_record (insn);
11470 vr4130_last_insn = insn;
11471 if (TUNE_74K)
11472 mips_74k_agen_init (insn);
11473 else if (TUNE_LOONGSON_2EF)
11474 mips_ls2_variable_issue (insn);
11475 }
11476
11477 /* Instructions of type 'multi' should all be split before
11478 the second scheduling pass. */
11479 gcc_assert (!reload_completed
11480 || recog_memoized (insn) < 0
11481 || get_attr_type (insn) != TYPE_MULTI);
11482
11483 return more;
11484 }
11485 \f
11486 /* Given that we have an rtx of the form (prefetch ... WRITE LOCALITY),
11487 return the first operand of the associated PREF or PREFX insn. */
11488
11489 rtx
11490 mips_prefetch_cookie (rtx write, rtx locality)
11491 {
11492 /* store_streamed / load_streamed. */
11493 if (INTVAL (locality) <= 0)
11494 return GEN_INT (INTVAL (write) + 4);
11495
11496 /* store / load. */
11497 if (INTVAL (locality) <= 2)
11498 return write;
11499
11500 /* store_retained / load_retained. */
11501 return GEN_INT (INTVAL (write) + 6);
11502 }
11503 \f
11504 /* Flags that indicate when a built-in function is available.
11505
11506 BUILTIN_AVAIL_NON_MIPS16
11507 The function is available on the current target, but only
11508 in non-MIPS16 mode. */
11509 #define BUILTIN_AVAIL_NON_MIPS16 1
11510
11511 /* Declare an availability predicate for built-in functions that
11512 require non-MIPS16 mode and also require COND to be true.
11513 NAME is the main part of the predicate's name. */
11514 #define AVAIL_NON_MIPS16(NAME, COND) \
11515 static unsigned int \
11516 mips_builtin_avail_##NAME (void) \
11517 { \
11518 return (COND) ? BUILTIN_AVAIL_NON_MIPS16 : 0; \
11519 }
11520
11521 /* This structure describes a single built-in function. */
11522 struct mips_builtin_description {
11523 /* The code of the main .md file instruction. See mips_builtin_type
11524 for more information. */
11525 enum insn_code icode;
11526
11527 /* The floating-point comparison code to use with ICODE, if any. */
11528 enum mips_fp_condition cond;
11529
11530 /* The name of the built-in function. */
11531 const char *name;
11532
11533 /* Specifies how the function should be expanded. */
11534 enum mips_builtin_type builtin_type;
11535
11536 /* The function's prototype. */
11537 enum mips_function_type function_type;
11538
11539 /* Whether the function is available. */
11540 unsigned int (*avail) (void);
11541 };
11542
11543 AVAIL_NON_MIPS16 (paired_single, TARGET_PAIRED_SINGLE_FLOAT)
11544 AVAIL_NON_MIPS16 (sb1_paired_single, TARGET_SB1 && TARGET_PAIRED_SINGLE_FLOAT)
11545 AVAIL_NON_MIPS16 (mips3d, TARGET_MIPS3D)
11546 AVAIL_NON_MIPS16 (dsp, TARGET_DSP)
11547 AVAIL_NON_MIPS16 (dspr2, TARGET_DSPR2)
11548 AVAIL_NON_MIPS16 (dsp_32, !TARGET_64BIT && TARGET_DSP)
11549 AVAIL_NON_MIPS16 (dspr2_32, !TARGET_64BIT && TARGET_DSPR2)
11550 AVAIL_NON_MIPS16 (loongson, TARGET_LOONGSON_VECTORS)
11551 AVAIL_NON_MIPS16 (cache, TARGET_CACHE_BUILTIN)
11552
11553 /* Construct a mips_builtin_description from the given arguments.
11554
11555 INSN is the name of the associated instruction pattern, without the
11556 leading CODE_FOR_mips_.
11557
11558 CODE is the floating-point condition code associated with the
11559 function. It can be 'f' if the field is not applicable.
11560
11561 NAME is the name of the function itself, without the leading
11562 "__builtin_mips_".
11563
11564 BUILTIN_TYPE and FUNCTION_TYPE are mips_builtin_description fields.
11565
11566 AVAIL is the name of the availability predicate, without the leading
11567 mips_builtin_avail_. */
11568 #define MIPS_BUILTIN(INSN, COND, NAME, BUILTIN_TYPE, \
11569 FUNCTION_TYPE, AVAIL) \
11570 { CODE_FOR_mips_ ## INSN, MIPS_FP_COND_ ## COND, \
11571 "__builtin_mips_" NAME, BUILTIN_TYPE, FUNCTION_TYPE, \
11572 mips_builtin_avail_ ## AVAIL }
11573
11574 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT function
11575 mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE and AVAIL
11576 are as for MIPS_BUILTIN. */
11577 #define DIRECT_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
11578 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT, FUNCTION_TYPE, AVAIL)
11579
11580 /* Define __builtin_mips_<INSN>_<COND>_{s,d} functions, both of which
11581 are subject to mips_builtin_avail_<AVAIL>. */
11582 #define CMP_SCALAR_BUILTINS(INSN, COND, AVAIL) \
11583 MIPS_BUILTIN (INSN ## _cond_s, COND, #INSN "_" #COND "_s", \
11584 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_SF_SF, AVAIL), \
11585 MIPS_BUILTIN (INSN ## _cond_d, COND, #INSN "_" #COND "_d", \
11586 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_DF_DF, AVAIL)
11587
11588 /* Define __builtin_mips_{any,all,upper,lower}_<INSN>_<COND>_ps.
11589 The lower and upper forms are subject to mips_builtin_avail_<AVAIL>
11590 while the any and all forms are subject to mips_builtin_avail_mips3d. */
11591 #define CMP_PS_BUILTINS(INSN, COND, AVAIL) \
11592 MIPS_BUILTIN (INSN ## _cond_ps, COND, "any_" #INSN "_" #COND "_ps", \
11593 MIPS_BUILTIN_CMP_ANY, MIPS_INT_FTYPE_V2SF_V2SF, \
11594 mips3d), \
11595 MIPS_BUILTIN (INSN ## _cond_ps, COND, "all_" #INSN "_" #COND "_ps", \
11596 MIPS_BUILTIN_CMP_ALL, MIPS_INT_FTYPE_V2SF_V2SF, \
11597 mips3d), \
11598 MIPS_BUILTIN (INSN ## _cond_ps, COND, "lower_" #INSN "_" #COND "_ps", \
11599 MIPS_BUILTIN_CMP_LOWER, MIPS_INT_FTYPE_V2SF_V2SF, \
11600 AVAIL), \
11601 MIPS_BUILTIN (INSN ## _cond_ps, COND, "upper_" #INSN "_" #COND "_ps", \
11602 MIPS_BUILTIN_CMP_UPPER, MIPS_INT_FTYPE_V2SF_V2SF, \
11603 AVAIL)
11604
11605 /* Define __builtin_mips_{any,all}_<INSN>_<COND>_4s. The functions
11606 are subject to mips_builtin_avail_mips3d. */
11607 #define CMP_4S_BUILTINS(INSN, COND) \
11608 MIPS_BUILTIN (INSN ## _cond_4s, COND, "any_" #INSN "_" #COND "_4s", \
11609 MIPS_BUILTIN_CMP_ANY, \
11610 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d), \
11611 MIPS_BUILTIN (INSN ## _cond_4s, COND, "all_" #INSN "_" #COND "_4s", \
11612 MIPS_BUILTIN_CMP_ALL, \
11613 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d)
11614
11615 /* Define __builtin_mips_mov{t,f}_<INSN>_<COND>_ps. The comparison
11616 instruction requires mips_builtin_avail_<AVAIL>. */
11617 #define MOVTF_BUILTINS(INSN, COND, AVAIL) \
11618 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movt_" #INSN "_" #COND "_ps", \
11619 MIPS_BUILTIN_MOVT, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
11620 AVAIL), \
11621 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movf_" #INSN "_" #COND "_ps", \
11622 MIPS_BUILTIN_MOVF, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
11623 AVAIL)
11624
11625 /* Define all the built-in functions related to C.cond.fmt condition COND. */
11626 #define CMP_BUILTINS(COND) \
11627 MOVTF_BUILTINS (c, COND, paired_single), \
11628 MOVTF_BUILTINS (cabs, COND, mips3d), \
11629 CMP_SCALAR_BUILTINS (cabs, COND, mips3d), \
11630 CMP_PS_BUILTINS (c, COND, paired_single), \
11631 CMP_PS_BUILTINS (cabs, COND, mips3d), \
11632 CMP_4S_BUILTINS (c, COND), \
11633 CMP_4S_BUILTINS (cabs, COND)
11634
11635 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT_NO_TARGET
11636 function mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE
11637 and AVAIL are as for MIPS_BUILTIN. */
11638 #define DIRECT_NO_TARGET_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
11639 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT_NO_TARGET, \
11640 FUNCTION_TYPE, AVAIL)
11641
11642 /* Define __builtin_mips_bposge<VALUE>. <VALUE> is 32 for the MIPS32 DSP
11643 branch instruction. AVAIL is as for MIPS_BUILTIN. */
11644 #define BPOSGE_BUILTIN(VALUE, AVAIL) \
11645 MIPS_BUILTIN (bposge, f, "bposge" #VALUE, \
11646 MIPS_BUILTIN_BPOSGE ## VALUE, MIPS_SI_FTYPE_VOID, AVAIL)
11647
11648 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<FN_NAME>
11649 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
11650 builtin_description field. */
11651 #define LOONGSON_BUILTIN_ALIAS(INSN, FN_NAME, FUNCTION_TYPE) \
11652 { CODE_FOR_loongson_ ## INSN, MIPS_FP_COND_f, \
11653 "__builtin_loongson_" #FN_NAME, MIPS_BUILTIN_DIRECT, \
11654 FUNCTION_TYPE, mips_builtin_avail_loongson }
11655
11656 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<INSN>
11657 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
11658 builtin_description field. */
11659 #define LOONGSON_BUILTIN(INSN, FUNCTION_TYPE) \
11660 LOONGSON_BUILTIN_ALIAS (INSN, INSN, FUNCTION_TYPE)
11661
11662 /* Like LOONGSON_BUILTIN, but add _<SUFFIX> to the end of the function name.
11663 We use functions of this form when the same insn can be usefully applied
11664 to more than one datatype. */
11665 #define LOONGSON_BUILTIN_SUFFIX(INSN, SUFFIX, FUNCTION_TYPE) \
11666 LOONGSON_BUILTIN_ALIAS (INSN, INSN ## _ ## SUFFIX, FUNCTION_TYPE)
11667
11668 #define CODE_FOR_mips_sqrt_ps CODE_FOR_sqrtv2sf2
11669 #define CODE_FOR_mips_addq_ph CODE_FOR_addv2hi3
11670 #define CODE_FOR_mips_addu_qb CODE_FOR_addv4qi3
11671 #define CODE_FOR_mips_subq_ph CODE_FOR_subv2hi3
11672 #define CODE_FOR_mips_subu_qb CODE_FOR_subv4qi3
11673 #define CODE_FOR_mips_mul_ph CODE_FOR_mulv2hi3
11674
11675 #define CODE_FOR_loongson_packsswh CODE_FOR_vec_pack_ssat_v2si
11676 #define CODE_FOR_loongson_packsshb CODE_FOR_vec_pack_ssat_v4hi
11677 #define CODE_FOR_loongson_packushb CODE_FOR_vec_pack_usat_v4hi
11678 #define CODE_FOR_loongson_paddw CODE_FOR_addv2si3
11679 #define CODE_FOR_loongson_paddh CODE_FOR_addv4hi3
11680 #define CODE_FOR_loongson_paddb CODE_FOR_addv8qi3
11681 #define CODE_FOR_loongson_paddsh CODE_FOR_ssaddv4hi3
11682 #define CODE_FOR_loongson_paddsb CODE_FOR_ssaddv8qi3
11683 #define CODE_FOR_loongson_paddush CODE_FOR_usaddv4hi3
11684 #define CODE_FOR_loongson_paddusb CODE_FOR_usaddv8qi3
11685 #define CODE_FOR_loongson_pmaxsh CODE_FOR_smaxv4hi3
11686 #define CODE_FOR_loongson_pmaxub CODE_FOR_umaxv8qi3
11687 #define CODE_FOR_loongson_pminsh CODE_FOR_sminv4hi3
11688 #define CODE_FOR_loongson_pminub CODE_FOR_uminv8qi3
11689 #define CODE_FOR_loongson_pmulhuh CODE_FOR_umulv4hi3_highpart
11690 #define CODE_FOR_loongson_pmulhh CODE_FOR_smulv4hi3_highpart
11691 #define CODE_FOR_loongson_psubw CODE_FOR_subv2si3
11692 #define CODE_FOR_loongson_psubh CODE_FOR_subv4hi3
11693 #define CODE_FOR_loongson_psubb CODE_FOR_subv8qi3
11694 #define CODE_FOR_loongson_psubsh CODE_FOR_sssubv4hi3
11695 #define CODE_FOR_loongson_psubsb CODE_FOR_sssubv8qi3
11696 #define CODE_FOR_loongson_psubush CODE_FOR_ussubv4hi3
11697 #define CODE_FOR_loongson_psubusb CODE_FOR_ussubv8qi3
11698 #define CODE_FOR_loongson_punpckhbh CODE_FOR_vec_interleave_highv8qi
11699 #define CODE_FOR_loongson_punpckhhw CODE_FOR_vec_interleave_highv4hi
11700 #define CODE_FOR_loongson_punpckhwd CODE_FOR_vec_interleave_highv2si
11701 #define CODE_FOR_loongson_punpcklbh CODE_FOR_vec_interleave_lowv8qi
11702 #define CODE_FOR_loongson_punpcklhw CODE_FOR_vec_interleave_lowv4hi
11703 #define CODE_FOR_loongson_punpcklwd CODE_FOR_vec_interleave_lowv2si
11704
11705 static const struct mips_builtin_description mips_builtins[] = {
11706 DIRECT_BUILTIN (pll_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
11707 DIRECT_BUILTIN (pul_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
11708 DIRECT_BUILTIN (plu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
11709 DIRECT_BUILTIN (puu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
11710 DIRECT_BUILTIN (cvt_ps_s, MIPS_V2SF_FTYPE_SF_SF, paired_single),
11711 DIRECT_BUILTIN (cvt_s_pl, MIPS_SF_FTYPE_V2SF, paired_single),
11712 DIRECT_BUILTIN (cvt_s_pu, MIPS_SF_FTYPE_V2SF, paired_single),
11713 DIRECT_BUILTIN (abs_ps, MIPS_V2SF_FTYPE_V2SF, paired_single),
11714
11715 DIRECT_BUILTIN (alnv_ps, MIPS_V2SF_FTYPE_V2SF_V2SF_INT, paired_single),
11716 DIRECT_BUILTIN (addr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
11717 DIRECT_BUILTIN (mulr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
11718 DIRECT_BUILTIN (cvt_pw_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
11719 DIRECT_BUILTIN (cvt_ps_pw, MIPS_V2SF_FTYPE_V2SF, mips3d),
11720
11721 DIRECT_BUILTIN (recip1_s, MIPS_SF_FTYPE_SF, mips3d),
11722 DIRECT_BUILTIN (recip1_d, MIPS_DF_FTYPE_DF, mips3d),
11723 DIRECT_BUILTIN (recip1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
11724 DIRECT_BUILTIN (recip2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
11725 DIRECT_BUILTIN (recip2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
11726 DIRECT_BUILTIN (recip2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
11727
11728 DIRECT_BUILTIN (rsqrt1_s, MIPS_SF_FTYPE_SF, mips3d),
11729 DIRECT_BUILTIN (rsqrt1_d, MIPS_DF_FTYPE_DF, mips3d),
11730 DIRECT_BUILTIN (rsqrt1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
11731 DIRECT_BUILTIN (rsqrt2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
11732 DIRECT_BUILTIN (rsqrt2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
11733 DIRECT_BUILTIN (rsqrt2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
11734
11735 MIPS_FP_CONDITIONS (CMP_BUILTINS),
11736
11737 /* Built-in functions for the SB-1 processor. */
11738 DIRECT_BUILTIN (sqrt_ps, MIPS_V2SF_FTYPE_V2SF, sb1_paired_single),
11739
11740 /* Built-in functions for the DSP ASE (32-bit and 64-bit). */
11741 DIRECT_BUILTIN (addq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11742 DIRECT_BUILTIN (addq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11743 DIRECT_BUILTIN (addq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
11744 DIRECT_BUILTIN (addu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
11745 DIRECT_BUILTIN (addu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
11746 DIRECT_BUILTIN (subq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11747 DIRECT_BUILTIN (subq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11748 DIRECT_BUILTIN (subq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
11749 DIRECT_BUILTIN (subu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
11750 DIRECT_BUILTIN (subu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
11751 DIRECT_BUILTIN (addsc, MIPS_SI_FTYPE_SI_SI, dsp),
11752 DIRECT_BUILTIN (addwc, MIPS_SI_FTYPE_SI_SI, dsp),
11753 DIRECT_BUILTIN (modsub, MIPS_SI_FTYPE_SI_SI, dsp),
11754 DIRECT_BUILTIN (raddu_w_qb, MIPS_SI_FTYPE_V4QI, dsp),
11755 DIRECT_BUILTIN (absq_s_ph, MIPS_V2HI_FTYPE_V2HI, dsp),
11756 DIRECT_BUILTIN (absq_s_w, MIPS_SI_FTYPE_SI, dsp),
11757 DIRECT_BUILTIN (precrq_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
11758 DIRECT_BUILTIN (precrq_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
11759 DIRECT_BUILTIN (precrq_rs_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
11760 DIRECT_BUILTIN (precrqu_s_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
11761 DIRECT_BUILTIN (preceq_w_phl, MIPS_SI_FTYPE_V2HI, dsp),
11762 DIRECT_BUILTIN (preceq_w_phr, MIPS_SI_FTYPE_V2HI, dsp),
11763 DIRECT_BUILTIN (precequ_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
11764 DIRECT_BUILTIN (precequ_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
11765 DIRECT_BUILTIN (precequ_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
11766 DIRECT_BUILTIN (precequ_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
11767 DIRECT_BUILTIN (preceu_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
11768 DIRECT_BUILTIN (preceu_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
11769 DIRECT_BUILTIN (preceu_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
11770 DIRECT_BUILTIN (preceu_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
11771 DIRECT_BUILTIN (shll_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
11772 DIRECT_BUILTIN (shll_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
11773 DIRECT_BUILTIN (shll_s_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
11774 DIRECT_BUILTIN (shll_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
11775 DIRECT_BUILTIN (shrl_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
11776 DIRECT_BUILTIN (shra_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
11777 DIRECT_BUILTIN (shra_r_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
11778 DIRECT_BUILTIN (shra_r_w, MIPS_SI_FTYPE_SI_SI, dsp),
11779 DIRECT_BUILTIN (muleu_s_ph_qbl, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
11780 DIRECT_BUILTIN (muleu_s_ph_qbr, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
11781 DIRECT_BUILTIN (mulq_rs_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11782 DIRECT_BUILTIN (muleq_s_w_phl, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
11783 DIRECT_BUILTIN (muleq_s_w_phr, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
11784 DIRECT_BUILTIN (bitrev, MIPS_SI_FTYPE_SI, dsp),
11785 DIRECT_BUILTIN (insv, MIPS_SI_FTYPE_SI_SI, dsp),
11786 DIRECT_BUILTIN (repl_qb, MIPS_V4QI_FTYPE_SI, dsp),
11787 DIRECT_BUILTIN (repl_ph, MIPS_V2HI_FTYPE_SI, dsp),
11788 DIRECT_NO_TARGET_BUILTIN (cmpu_eq_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
11789 DIRECT_NO_TARGET_BUILTIN (cmpu_lt_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
11790 DIRECT_NO_TARGET_BUILTIN (cmpu_le_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
11791 DIRECT_BUILTIN (cmpgu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
11792 DIRECT_BUILTIN (cmpgu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
11793 DIRECT_BUILTIN (cmpgu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
11794 DIRECT_NO_TARGET_BUILTIN (cmp_eq_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
11795 DIRECT_NO_TARGET_BUILTIN (cmp_lt_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
11796 DIRECT_NO_TARGET_BUILTIN (cmp_le_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
11797 DIRECT_BUILTIN (pick_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
11798 DIRECT_BUILTIN (pick_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11799 DIRECT_BUILTIN (packrl_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
11800 DIRECT_NO_TARGET_BUILTIN (wrdsp, MIPS_VOID_FTYPE_SI_SI, dsp),
11801 DIRECT_BUILTIN (rddsp, MIPS_SI_FTYPE_SI, dsp),
11802 DIRECT_BUILTIN (lbux, MIPS_SI_FTYPE_POINTER_SI, dsp),
11803 DIRECT_BUILTIN (lhx, MIPS_SI_FTYPE_POINTER_SI, dsp),
11804 DIRECT_BUILTIN (lwx, MIPS_SI_FTYPE_POINTER_SI, dsp),
11805 BPOSGE_BUILTIN (32, dsp),
11806
11807 /* The following are for the MIPS DSP ASE REV 2 (32-bit and 64-bit). */
11808 DIRECT_BUILTIN (absq_s_qb, MIPS_V4QI_FTYPE_V4QI, dspr2),
11809 DIRECT_BUILTIN (addu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11810 DIRECT_BUILTIN (addu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11811 DIRECT_BUILTIN (adduh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
11812 DIRECT_BUILTIN (adduh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
11813 DIRECT_BUILTIN (append, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
11814 DIRECT_BUILTIN (balign, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
11815 DIRECT_BUILTIN (cmpgdu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
11816 DIRECT_BUILTIN (cmpgdu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
11817 DIRECT_BUILTIN (cmpgdu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
11818 DIRECT_BUILTIN (mul_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11819 DIRECT_BUILTIN (mul_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11820 DIRECT_BUILTIN (mulq_rs_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11821 DIRECT_BUILTIN (mulq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11822 DIRECT_BUILTIN (mulq_s_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11823 DIRECT_BUILTIN (precr_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dspr2),
11824 DIRECT_BUILTIN (precr_sra_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
11825 DIRECT_BUILTIN (precr_sra_r_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
11826 DIRECT_BUILTIN (prepend, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
11827 DIRECT_BUILTIN (shra_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
11828 DIRECT_BUILTIN (shra_r_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
11829 DIRECT_BUILTIN (shrl_ph, MIPS_V2HI_FTYPE_V2HI_SI, dspr2),
11830 DIRECT_BUILTIN (subu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11831 DIRECT_BUILTIN (subu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11832 DIRECT_BUILTIN (subuh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
11833 DIRECT_BUILTIN (subuh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
11834 DIRECT_BUILTIN (addqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11835 DIRECT_BUILTIN (addqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11836 DIRECT_BUILTIN (addqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11837 DIRECT_BUILTIN (addqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11838 DIRECT_BUILTIN (subqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11839 DIRECT_BUILTIN (subqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
11840 DIRECT_BUILTIN (subqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11841 DIRECT_BUILTIN (subqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
11842
11843 /* Built-in functions for the DSP ASE (32-bit only). */
11844 DIRECT_BUILTIN (dpau_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
11845 DIRECT_BUILTIN (dpau_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
11846 DIRECT_BUILTIN (dpsu_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
11847 DIRECT_BUILTIN (dpsu_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
11848 DIRECT_BUILTIN (dpaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11849 DIRECT_BUILTIN (dpsq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11850 DIRECT_BUILTIN (mulsaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11851 DIRECT_BUILTIN (dpaq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
11852 DIRECT_BUILTIN (dpsq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
11853 DIRECT_BUILTIN (maq_s_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11854 DIRECT_BUILTIN (maq_s_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11855 DIRECT_BUILTIN (maq_sa_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11856 DIRECT_BUILTIN (maq_sa_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
11857 DIRECT_BUILTIN (extr_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
11858 DIRECT_BUILTIN (extr_r_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
11859 DIRECT_BUILTIN (extr_rs_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
11860 DIRECT_BUILTIN (extr_s_h, MIPS_SI_FTYPE_DI_SI, dsp_32),
11861 DIRECT_BUILTIN (extp, MIPS_SI_FTYPE_DI_SI, dsp_32),
11862 DIRECT_BUILTIN (extpdp, MIPS_SI_FTYPE_DI_SI, dsp_32),
11863 DIRECT_BUILTIN (shilo, MIPS_DI_FTYPE_DI_SI, dsp_32),
11864 DIRECT_BUILTIN (mthlip, MIPS_DI_FTYPE_DI_SI, dsp_32),
11865
11866 /* The following are for the MIPS DSP ASE REV 2 (32-bit only). */
11867 DIRECT_BUILTIN (dpa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11868 DIRECT_BUILTIN (dps_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11869 DIRECT_BUILTIN (madd, MIPS_DI_FTYPE_DI_SI_SI, dspr2_32),
11870 DIRECT_BUILTIN (maddu, MIPS_DI_FTYPE_DI_USI_USI, dspr2_32),
11871 DIRECT_BUILTIN (msub, MIPS_DI_FTYPE_DI_SI_SI, dspr2_32),
11872 DIRECT_BUILTIN (msubu, MIPS_DI_FTYPE_DI_USI_USI, dspr2_32),
11873 DIRECT_BUILTIN (mulsa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11874 DIRECT_BUILTIN (mult, MIPS_DI_FTYPE_SI_SI, dspr2_32),
11875 DIRECT_BUILTIN (multu, MIPS_DI_FTYPE_USI_USI, dspr2_32),
11876 DIRECT_BUILTIN (dpax_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11877 DIRECT_BUILTIN (dpsx_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11878 DIRECT_BUILTIN (dpaqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11879 DIRECT_BUILTIN (dpaqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11880 DIRECT_BUILTIN (dpsqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11881 DIRECT_BUILTIN (dpsqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
11882
11883 /* Builtin functions for ST Microelectronics Loongson-2E/2F cores. */
11884 LOONGSON_BUILTIN (packsswh, MIPS_V4HI_FTYPE_V2SI_V2SI),
11885 LOONGSON_BUILTIN (packsshb, MIPS_V8QI_FTYPE_V4HI_V4HI),
11886 LOONGSON_BUILTIN (packushb, MIPS_UV8QI_FTYPE_UV4HI_UV4HI),
11887 LOONGSON_BUILTIN_SUFFIX (paddw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11888 LOONGSON_BUILTIN_SUFFIX (paddh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11889 LOONGSON_BUILTIN_SUFFIX (paddb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11890 LOONGSON_BUILTIN_SUFFIX (paddw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11891 LOONGSON_BUILTIN_SUFFIX (paddh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11892 LOONGSON_BUILTIN_SUFFIX (paddb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11893 LOONGSON_BUILTIN_SUFFIX (paddd, u, MIPS_UDI_FTYPE_UDI_UDI),
11894 LOONGSON_BUILTIN_SUFFIX (paddd, s, MIPS_DI_FTYPE_DI_DI),
11895 LOONGSON_BUILTIN (paddsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11896 LOONGSON_BUILTIN (paddsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
11897 LOONGSON_BUILTIN (paddush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11898 LOONGSON_BUILTIN (paddusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11899 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_ud, MIPS_UDI_FTYPE_UDI_UDI),
11900 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_uw, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11901 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_uh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11902 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_ub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11903 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_sd, MIPS_DI_FTYPE_DI_DI),
11904 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_sw, MIPS_V2SI_FTYPE_V2SI_V2SI),
11905 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_sh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11906 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_sb, MIPS_V8QI_FTYPE_V8QI_V8QI),
11907 LOONGSON_BUILTIN (pavgh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11908 LOONGSON_BUILTIN (pavgb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11909 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11910 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11911 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11912 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11913 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11914 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11915 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11916 LOONGSON_BUILTIN_SUFFIX (pcmpgth, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11917 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11918 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11919 LOONGSON_BUILTIN_SUFFIX (pcmpgth, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11920 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11921 LOONGSON_BUILTIN_SUFFIX (pextrh, u, MIPS_UV4HI_FTYPE_UV4HI_USI),
11922 LOONGSON_BUILTIN_SUFFIX (pextrh, s, MIPS_V4HI_FTYPE_V4HI_USI),
11923 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11924 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11925 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11926 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11927 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11928 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11929 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11930 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11931 LOONGSON_BUILTIN (pmaddhw, MIPS_V2SI_FTYPE_V4HI_V4HI),
11932 LOONGSON_BUILTIN (pmaxsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11933 LOONGSON_BUILTIN (pmaxub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11934 LOONGSON_BUILTIN (pminsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11935 LOONGSON_BUILTIN (pminub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11936 LOONGSON_BUILTIN_SUFFIX (pmovmskb, u, MIPS_UV8QI_FTYPE_UV8QI),
11937 LOONGSON_BUILTIN_SUFFIX (pmovmskb, s, MIPS_V8QI_FTYPE_V8QI),
11938 LOONGSON_BUILTIN (pmulhuh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11939 LOONGSON_BUILTIN (pmulhh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11940 LOONGSON_BUILTIN (pmullh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11941 LOONGSON_BUILTIN (pmuluw, MIPS_UDI_FTYPE_UV2SI_UV2SI),
11942 LOONGSON_BUILTIN (pasubub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11943 LOONGSON_BUILTIN (biadd, MIPS_UV4HI_FTYPE_UV8QI),
11944 LOONGSON_BUILTIN (psadbh, MIPS_UV4HI_FTYPE_UV8QI_UV8QI),
11945 LOONGSON_BUILTIN_SUFFIX (pshufh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI_UQI),
11946 LOONGSON_BUILTIN_SUFFIX (pshufh, s, MIPS_V4HI_FTYPE_V4HI_V4HI_UQI),
11947 LOONGSON_BUILTIN_SUFFIX (psllh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
11948 LOONGSON_BUILTIN_SUFFIX (psllh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
11949 LOONGSON_BUILTIN_SUFFIX (psllw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
11950 LOONGSON_BUILTIN_SUFFIX (psllw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
11951 LOONGSON_BUILTIN_SUFFIX (psrah, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
11952 LOONGSON_BUILTIN_SUFFIX (psrah, s, MIPS_V4HI_FTYPE_V4HI_UQI),
11953 LOONGSON_BUILTIN_SUFFIX (psraw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
11954 LOONGSON_BUILTIN_SUFFIX (psraw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
11955 LOONGSON_BUILTIN_SUFFIX (psrlh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
11956 LOONGSON_BUILTIN_SUFFIX (psrlh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
11957 LOONGSON_BUILTIN_SUFFIX (psrlw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
11958 LOONGSON_BUILTIN_SUFFIX (psrlw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
11959 LOONGSON_BUILTIN_SUFFIX (psubw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11960 LOONGSON_BUILTIN_SUFFIX (psubh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11961 LOONGSON_BUILTIN_SUFFIX (psubb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11962 LOONGSON_BUILTIN_SUFFIX (psubw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11963 LOONGSON_BUILTIN_SUFFIX (psubh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11964 LOONGSON_BUILTIN_SUFFIX (psubb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11965 LOONGSON_BUILTIN_SUFFIX (psubd, u, MIPS_UDI_FTYPE_UDI_UDI),
11966 LOONGSON_BUILTIN_SUFFIX (psubd, s, MIPS_DI_FTYPE_DI_DI),
11967 LOONGSON_BUILTIN (psubsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
11968 LOONGSON_BUILTIN (psubsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
11969 LOONGSON_BUILTIN (psubush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11970 LOONGSON_BUILTIN (psubusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11971 LOONGSON_BUILTIN_SUFFIX (punpckhbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11972 LOONGSON_BUILTIN_SUFFIX (punpckhhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11973 LOONGSON_BUILTIN_SUFFIX (punpckhwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11974 LOONGSON_BUILTIN_SUFFIX (punpckhbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11975 LOONGSON_BUILTIN_SUFFIX (punpckhhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11976 LOONGSON_BUILTIN_SUFFIX (punpckhwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11977 LOONGSON_BUILTIN_SUFFIX (punpcklbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
11978 LOONGSON_BUILTIN_SUFFIX (punpcklhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
11979 LOONGSON_BUILTIN_SUFFIX (punpcklwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
11980 LOONGSON_BUILTIN_SUFFIX (punpcklbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
11981 LOONGSON_BUILTIN_SUFFIX (punpcklhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
11982 LOONGSON_BUILTIN_SUFFIX (punpcklwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
11983
11984 /* Sundry other built-in functions. */
11985 DIRECT_NO_TARGET_BUILTIN (cache, MIPS_VOID_FTYPE_SI_CVPOINTER, cache)
11986 };
11987
11988 /* MODE is a vector mode whose elements have type TYPE. Return the type
11989 of the vector itself. */
11990
11991 static tree
11992 mips_builtin_vector_type (tree type, enum machine_mode mode)
11993 {
11994 static tree types[2 * (int) MAX_MACHINE_MODE];
11995 int mode_index;
11996
11997 mode_index = (int) mode;
11998
11999 if (TREE_CODE (type) == INTEGER_TYPE && TYPE_UNSIGNED (type))
12000 mode_index += MAX_MACHINE_MODE;
12001
12002 if (types[mode_index] == NULL_TREE)
12003 types[mode_index] = build_vector_type_for_mode (type, mode);
12004 return types[mode_index];
12005 }
12006
12007 /* Return a type for 'const volatile void *'. */
12008
12009 static tree
12010 mips_build_cvpointer_type (void)
12011 {
12012 static tree cache;
12013
12014 if (cache == NULL_TREE)
12015 cache = build_pointer_type (build_qualified_type
12016 (void_type_node,
12017 TYPE_QUAL_CONST | TYPE_QUAL_VOLATILE));
12018 return cache;
12019 }
12020
12021 /* Source-level argument types. */
12022 #define MIPS_ATYPE_VOID void_type_node
12023 #define MIPS_ATYPE_INT integer_type_node
12024 #define MIPS_ATYPE_POINTER ptr_type_node
12025 #define MIPS_ATYPE_CVPOINTER mips_build_cvpointer_type ()
12026
12027 /* Standard mode-based argument types. */
12028 #define MIPS_ATYPE_UQI unsigned_intQI_type_node
12029 #define MIPS_ATYPE_SI intSI_type_node
12030 #define MIPS_ATYPE_USI unsigned_intSI_type_node
12031 #define MIPS_ATYPE_DI intDI_type_node
12032 #define MIPS_ATYPE_UDI unsigned_intDI_type_node
12033 #define MIPS_ATYPE_SF float_type_node
12034 #define MIPS_ATYPE_DF double_type_node
12035
12036 /* Vector argument types. */
12037 #define MIPS_ATYPE_V2SF mips_builtin_vector_type (float_type_node, V2SFmode)
12038 #define MIPS_ATYPE_V2HI mips_builtin_vector_type (intHI_type_node, V2HImode)
12039 #define MIPS_ATYPE_V2SI mips_builtin_vector_type (intSI_type_node, V2SImode)
12040 #define MIPS_ATYPE_V4QI mips_builtin_vector_type (intQI_type_node, V4QImode)
12041 #define MIPS_ATYPE_V4HI mips_builtin_vector_type (intHI_type_node, V4HImode)
12042 #define MIPS_ATYPE_V8QI mips_builtin_vector_type (intQI_type_node, V8QImode)
12043 #define MIPS_ATYPE_UV2SI \
12044 mips_builtin_vector_type (unsigned_intSI_type_node, V2SImode)
12045 #define MIPS_ATYPE_UV4HI \
12046 mips_builtin_vector_type (unsigned_intHI_type_node, V4HImode)
12047 #define MIPS_ATYPE_UV8QI \
12048 mips_builtin_vector_type (unsigned_intQI_type_node, V8QImode)
12049
12050 /* MIPS_FTYPE_ATYPESN takes N MIPS_FTYPES-like type codes and lists
12051 their associated MIPS_ATYPEs. */
12052 #define MIPS_FTYPE_ATYPES1(A, B) \
12053 MIPS_ATYPE_##A, MIPS_ATYPE_##B
12054
12055 #define MIPS_FTYPE_ATYPES2(A, B, C) \
12056 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C
12057
12058 #define MIPS_FTYPE_ATYPES3(A, B, C, D) \
12059 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D
12060
12061 #define MIPS_FTYPE_ATYPES4(A, B, C, D, E) \
12062 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D, \
12063 MIPS_ATYPE_##E
12064
12065 /* Return the function type associated with function prototype TYPE. */
12066
12067 static tree
12068 mips_build_function_type (enum mips_function_type type)
12069 {
12070 static tree types[(int) MIPS_MAX_FTYPE_MAX];
12071
12072 if (types[(int) type] == NULL_TREE)
12073 switch (type)
12074 {
12075 #define DEF_MIPS_FTYPE(NUM, ARGS) \
12076 case MIPS_FTYPE_NAME##NUM ARGS: \
12077 types[(int) type] \
12078 = build_function_type_list (MIPS_FTYPE_ATYPES##NUM ARGS, \
12079 NULL_TREE); \
12080 break;
12081 #include "config/mips/mips-ftypes.def"
12082 #undef DEF_MIPS_FTYPE
12083 default:
12084 gcc_unreachable ();
12085 }
12086
12087 return types[(int) type];
12088 }
12089
12090 /* Implement TARGET_INIT_BUILTINS. */
12091
12092 static void
12093 mips_init_builtins (void)
12094 {
12095 const struct mips_builtin_description *d;
12096 unsigned int i;
12097
12098 /* Iterate through all of the bdesc arrays, initializing all of the
12099 builtin functions. */
12100 for (i = 0; i < ARRAY_SIZE (mips_builtins); i++)
12101 {
12102 d = &mips_builtins[i];
12103 if (d->avail ())
12104 add_builtin_function (d->name,
12105 mips_build_function_type (d->function_type),
12106 i, BUILT_IN_MD, NULL, NULL);
12107 }
12108 }
12109
12110 /* Take argument ARGNO from EXP's argument list and convert it into a
12111 form suitable for input operand OPNO of instruction ICODE. Return the
12112 value. */
12113
12114 static rtx
12115 mips_prepare_builtin_arg (enum insn_code icode,
12116 unsigned int opno, tree exp, unsigned int argno)
12117 {
12118 tree arg;
12119 rtx value;
12120 enum machine_mode mode;
12121
12122 arg = CALL_EXPR_ARG (exp, argno);
12123 value = expand_normal (arg);
12124 mode = insn_data[icode].operand[opno].mode;
12125 if (!insn_data[icode].operand[opno].predicate (value, mode))
12126 {
12127 /* We need to get the mode from ARG for two reasons:
12128
12129 - to cope with address operands, where MODE is the mode of the
12130 memory, rather than of VALUE itself.
12131
12132 - to cope with special predicates like pmode_register_operand,
12133 where MODE is VOIDmode. */
12134 value = copy_to_mode_reg (TYPE_MODE (TREE_TYPE (arg)), value);
12135
12136 /* Check the predicate again. */
12137 if (!insn_data[icode].operand[opno].predicate (value, mode))
12138 {
12139 error ("invalid argument to built-in function");
12140 return const0_rtx;
12141 }
12142 }
12143
12144 return value;
12145 }
12146
12147 /* Return an rtx suitable for output operand OP of instruction ICODE.
12148 If TARGET is non-null, try to use it where possible. */
12149
12150 static rtx
12151 mips_prepare_builtin_target (enum insn_code icode, unsigned int op, rtx target)
12152 {
12153 enum machine_mode mode;
12154
12155 mode = insn_data[icode].operand[op].mode;
12156 if (target == 0 || !insn_data[icode].operand[op].predicate (target, mode))
12157 target = gen_reg_rtx (mode);
12158
12159 return target;
12160 }
12161
12162 /* Expand a MIPS_BUILTIN_DIRECT or MIPS_BUILTIN_DIRECT_NO_TARGET function;
12163 HAS_TARGET_P says which. EXP is the CALL_EXPR that calls the function
12164 and ICODE is the code of the associated .md pattern. TARGET, if nonnull,
12165 suggests a good place to put the result. */
12166
12167 static rtx
12168 mips_expand_builtin_direct (enum insn_code icode, rtx target, tree exp,
12169 bool has_target_p)
12170 {
12171 rtx ops[MAX_RECOG_OPERANDS];
12172 int opno, argno;
12173
12174 /* Map any target to operand 0. */
12175 opno = 0;
12176 if (has_target_p)
12177 {
12178 target = mips_prepare_builtin_target (icode, opno, target);
12179 ops[opno] = target;
12180 opno++;
12181 }
12182
12183 /* Map the arguments to the other operands. The n_operands value
12184 for an expander includes match_dups and match_scratches as well as
12185 match_operands, so n_operands is only an upper bound on the number
12186 of arguments to the expander function. */
12187 gcc_assert (opno + call_expr_nargs (exp) <= insn_data[icode].n_operands);
12188 for (argno = 0; argno < call_expr_nargs (exp); argno++, opno++)
12189 ops[opno] = mips_prepare_builtin_arg (icode, opno, exp, argno);
12190
12191 switch (opno)
12192 {
12193 case 2:
12194 emit_insn (GEN_FCN (icode) (ops[0], ops[1]));
12195 break;
12196
12197 case 3:
12198 emit_insn (GEN_FCN (icode) (ops[0], ops[1], ops[2]));
12199 break;
12200
12201 case 4:
12202 emit_insn (GEN_FCN (icode) (ops[0], ops[1], ops[2], ops[3]));
12203 break;
12204
12205 default:
12206 gcc_unreachable ();
12207 }
12208 return target;
12209 }
12210
12211 /* Expand a __builtin_mips_movt_*_ps or __builtin_mips_movf_*_ps
12212 function; TYPE says which. EXP is the CALL_EXPR that calls the
12213 function, ICODE is the instruction that should be used to compare
12214 the first two arguments, and COND is the condition it should test.
12215 TARGET, if nonnull, suggests a good place to put the result. */
12216
12217 static rtx
12218 mips_expand_builtin_movtf (enum mips_builtin_type type,
12219 enum insn_code icode, enum mips_fp_condition cond,
12220 rtx target, tree exp)
12221 {
12222 rtx cmp_result, op0, op1;
12223
12224 cmp_result = mips_prepare_builtin_target (icode, 0, 0);
12225 op0 = mips_prepare_builtin_arg (icode, 1, exp, 0);
12226 op1 = mips_prepare_builtin_arg (icode, 2, exp, 1);
12227 emit_insn (GEN_FCN (icode) (cmp_result, op0, op1, GEN_INT (cond)));
12228
12229 icode = CODE_FOR_mips_cond_move_tf_ps;
12230 target = mips_prepare_builtin_target (icode, 0, target);
12231 if (type == MIPS_BUILTIN_MOVT)
12232 {
12233 op1 = mips_prepare_builtin_arg (icode, 2, exp, 2);
12234 op0 = mips_prepare_builtin_arg (icode, 1, exp, 3);
12235 }
12236 else
12237 {
12238 op0 = mips_prepare_builtin_arg (icode, 1, exp, 2);
12239 op1 = mips_prepare_builtin_arg (icode, 2, exp, 3);
12240 }
12241 emit_insn (gen_mips_cond_move_tf_ps (target, op0, op1, cmp_result));
12242 return target;
12243 }
12244
12245 /* Move VALUE_IF_TRUE into TARGET if CONDITION is true; move VALUE_IF_FALSE
12246 into TARGET otherwise. Return TARGET. */
12247
12248 static rtx
12249 mips_builtin_branch_and_move (rtx condition, rtx target,
12250 rtx value_if_true, rtx value_if_false)
12251 {
12252 rtx true_label, done_label;
12253
12254 true_label = gen_label_rtx ();
12255 done_label = gen_label_rtx ();
12256
12257 /* First assume that CONDITION is false. */
12258 mips_emit_move (target, value_if_false);
12259
12260 /* Branch to TRUE_LABEL if CONDITION is true and DONE_LABEL otherwise. */
12261 emit_jump_insn (gen_condjump (condition, true_label));
12262 emit_jump_insn (gen_jump (done_label));
12263 emit_barrier ();
12264
12265 /* Fix TARGET if CONDITION is true. */
12266 emit_label (true_label);
12267 mips_emit_move (target, value_if_true);
12268
12269 emit_label (done_label);
12270 return target;
12271 }
12272
12273 /* Expand a comparison built-in function of type BUILTIN_TYPE. EXP is
12274 the CALL_EXPR that calls the function, ICODE is the code of the
12275 comparison instruction, and COND is the condition it should test.
12276 TARGET, if nonnull, suggests a good place to put the boolean result. */
12277
12278 static rtx
12279 mips_expand_builtin_compare (enum mips_builtin_type builtin_type,
12280 enum insn_code icode, enum mips_fp_condition cond,
12281 rtx target, tree exp)
12282 {
12283 rtx offset, condition, cmp_result, args[MAX_RECOG_OPERANDS];
12284 int argno;
12285
12286 if (target == 0 || GET_MODE (target) != SImode)
12287 target = gen_reg_rtx (SImode);
12288
12289 /* The instruction should have a target operand, an operand for each
12290 argument, and an operand for COND. */
12291 gcc_assert (call_expr_nargs (exp) + 2 == insn_data[icode].n_operands);
12292
12293 /* Prepare the operands to the comparison. */
12294 cmp_result = mips_prepare_builtin_target (icode, 0, 0);
12295 for (argno = 0; argno < call_expr_nargs (exp); argno++)
12296 args[argno] = mips_prepare_builtin_arg (icode, argno + 1, exp, argno);
12297
12298 switch (insn_data[icode].n_operands)
12299 {
12300 case 4:
12301 emit_insn (GEN_FCN (icode) (cmp_result, args[0], args[1],
12302 GEN_INT (cond)));
12303 break;
12304
12305 case 6:
12306 emit_insn (GEN_FCN (icode) (cmp_result, args[0], args[1],
12307 args[2], args[3], GEN_INT (cond)));
12308 break;
12309
12310 default:
12311 gcc_unreachable ();
12312 }
12313
12314 /* If the comparison sets more than one register, we define the result
12315 to be 0 if all registers are false and -1 if all registers are true.
12316 The value of the complete result is indeterminate otherwise. */
12317 switch (builtin_type)
12318 {
12319 case MIPS_BUILTIN_CMP_ALL:
12320 condition = gen_rtx_NE (VOIDmode, cmp_result, constm1_rtx);
12321 return mips_builtin_branch_and_move (condition, target,
12322 const0_rtx, const1_rtx);
12323
12324 case MIPS_BUILTIN_CMP_UPPER:
12325 case MIPS_BUILTIN_CMP_LOWER:
12326 offset = GEN_INT (builtin_type == MIPS_BUILTIN_CMP_UPPER);
12327 condition = gen_single_cc (cmp_result, offset);
12328 return mips_builtin_branch_and_move (condition, target,
12329 const1_rtx, const0_rtx);
12330
12331 default:
12332 condition = gen_rtx_NE (VOIDmode, cmp_result, const0_rtx);
12333 return mips_builtin_branch_and_move (condition, target,
12334 const1_rtx, const0_rtx);
12335 }
12336 }
12337
12338 /* Expand a bposge built-in function of type BUILTIN_TYPE. TARGET,
12339 if nonnull, suggests a good place to put the boolean result. */
12340
12341 static rtx
12342 mips_expand_builtin_bposge (enum mips_builtin_type builtin_type, rtx target)
12343 {
12344 rtx condition, cmp_result;
12345 int cmp_value;
12346
12347 if (target == 0 || GET_MODE (target) != SImode)
12348 target = gen_reg_rtx (SImode);
12349
12350 cmp_result = gen_rtx_REG (CCDSPmode, CCDSP_PO_REGNUM);
12351
12352 if (builtin_type == MIPS_BUILTIN_BPOSGE32)
12353 cmp_value = 32;
12354 else
12355 gcc_assert (0);
12356
12357 condition = gen_rtx_GE (VOIDmode, cmp_result, GEN_INT (cmp_value));
12358 return mips_builtin_branch_and_move (condition, target,
12359 const1_rtx, const0_rtx);
12360 }
12361
12362 /* Implement TARGET_EXPAND_BUILTIN. */
12363
12364 static rtx
12365 mips_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED,
12366 enum machine_mode mode, int ignore)
12367 {
12368 tree fndecl;
12369 unsigned int fcode, avail;
12370 const struct mips_builtin_description *d;
12371
12372 fndecl = TREE_OPERAND (CALL_EXPR_FN (exp), 0);
12373 fcode = DECL_FUNCTION_CODE (fndecl);
12374 gcc_assert (fcode < ARRAY_SIZE (mips_builtins));
12375 d = &mips_builtins[fcode];
12376 avail = d->avail ();
12377 gcc_assert (avail != 0);
12378 if (TARGET_MIPS16)
12379 {
12380 error ("built-in function %qE not supported for MIPS16",
12381 DECL_NAME (fndecl));
12382 return ignore ? const0_rtx : CONST0_RTX (mode);
12383 }
12384 switch (d->builtin_type)
12385 {
12386 case MIPS_BUILTIN_DIRECT:
12387 return mips_expand_builtin_direct (d->icode, target, exp, true);
12388
12389 case MIPS_BUILTIN_DIRECT_NO_TARGET:
12390 return mips_expand_builtin_direct (d->icode, target, exp, false);
12391
12392 case MIPS_BUILTIN_MOVT:
12393 case MIPS_BUILTIN_MOVF:
12394 return mips_expand_builtin_movtf (d->builtin_type, d->icode,
12395 d->cond, target, exp);
12396
12397 case MIPS_BUILTIN_CMP_ANY:
12398 case MIPS_BUILTIN_CMP_ALL:
12399 case MIPS_BUILTIN_CMP_UPPER:
12400 case MIPS_BUILTIN_CMP_LOWER:
12401 case MIPS_BUILTIN_CMP_SINGLE:
12402 return mips_expand_builtin_compare (d->builtin_type, d->icode,
12403 d->cond, target, exp);
12404
12405 case MIPS_BUILTIN_BPOSGE32:
12406 return mips_expand_builtin_bposge (d->builtin_type, target);
12407 }
12408 gcc_unreachable ();
12409 }
12410 \f
12411 /* An entry in the MIPS16 constant pool. VALUE is the pool constant,
12412 MODE is its mode, and LABEL is the CODE_LABEL associated with it. */
12413 struct mips16_constant {
12414 struct mips16_constant *next;
12415 rtx value;
12416 rtx label;
12417 enum machine_mode mode;
12418 };
12419
12420 /* Information about an incomplete MIPS16 constant pool. FIRST is the
12421 first constant, HIGHEST_ADDRESS is the highest address that the first
12422 byte of the pool can have, and INSN_ADDRESS is the current instruction
12423 address. */
12424 struct mips16_constant_pool {
12425 struct mips16_constant *first;
12426 int highest_address;
12427 int insn_address;
12428 };
12429
12430 /* Add constant VALUE to POOL and return its label. MODE is the
12431 value's mode (used for CONST_INTs, etc.). */
12432
12433 static rtx
12434 mips16_add_constant (struct mips16_constant_pool *pool,
12435 rtx value, enum machine_mode mode)
12436 {
12437 struct mips16_constant **p, *c;
12438 bool first_of_size_p;
12439
12440 /* See whether the constant is already in the pool. If so, return the
12441 existing label, otherwise leave P pointing to the place where the
12442 constant should be added.
12443
12444 Keep the pool sorted in increasing order of mode size so that we can
12445 reduce the number of alignments needed. */
12446 first_of_size_p = true;
12447 for (p = &pool->first; *p != 0; p = &(*p)->next)
12448 {
12449 if (mode == (*p)->mode && rtx_equal_p (value, (*p)->value))
12450 return (*p)->label;
12451 if (GET_MODE_SIZE (mode) < GET_MODE_SIZE ((*p)->mode))
12452 break;
12453 if (GET_MODE_SIZE (mode) == GET_MODE_SIZE ((*p)->mode))
12454 first_of_size_p = false;
12455 }
12456
12457 /* In the worst case, the constant needed by the earliest instruction
12458 will end up at the end of the pool. The entire pool must then be
12459 accessible from that instruction.
12460
12461 When adding the first constant, set the pool's highest address to
12462 the address of the first out-of-range byte. Adjust this address
12463 downwards each time a new constant is added. */
12464 if (pool->first == 0)
12465 /* For LWPC, ADDIUPC and DADDIUPC, the base PC value is the address
12466 of the instruction with the lowest two bits clear. The base PC
12467 value for LDPC has the lowest three bits clear. Assume the worst
12468 case here; namely that the PC-relative instruction occupies the
12469 last 2 bytes in an aligned word. */
12470 pool->highest_address = pool->insn_address - (UNITS_PER_WORD - 2) + 0x8000;
12471 pool->highest_address -= GET_MODE_SIZE (mode);
12472 if (first_of_size_p)
12473 /* Take into account the worst possible padding due to alignment. */
12474 pool->highest_address -= GET_MODE_SIZE (mode) - 1;
12475
12476 /* Create a new entry. */
12477 c = XNEW (struct mips16_constant);
12478 c->value = value;
12479 c->mode = mode;
12480 c->label = gen_label_rtx ();
12481 c->next = *p;
12482 *p = c;
12483
12484 return c->label;
12485 }
12486
12487 /* Output constant VALUE after instruction INSN and return the last
12488 instruction emitted. MODE is the mode of the constant. */
12489
12490 static rtx
12491 mips16_emit_constants_1 (enum machine_mode mode, rtx value, rtx insn)
12492 {
12493 if (SCALAR_INT_MODE_P (mode) || ALL_SCALAR_FIXED_POINT_MODE_P (mode))
12494 {
12495 rtx size = GEN_INT (GET_MODE_SIZE (mode));
12496 return emit_insn_after (gen_consttable_int (value, size), insn);
12497 }
12498
12499 if (SCALAR_FLOAT_MODE_P (mode))
12500 return emit_insn_after (gen_consttable_float (value), insn);
12501
12502 if (VECTOR_MODE_P (mode))
12503 {
12504 int i;
12505
12506 for (i = 0; i < CONST_VECTOR_NUNITS (value); i++)
12507 insn = mips16_emit_constants_1 (GET_MODE_INNER (mode),
12508 CONST_VECTOR_ELT (value, i), insn);
12509 return insn;
12510 }
12511
12512 gcc_unreachable ();
12513 }
12514
12515 /* Dump out the constants in CONSTANTS after INSN. */
12516
12517 static void
12518 mips16_emit_constants (struct mips16_constant *constants, rtx insn)
12519 {
12520 struct mips16_constant *c, *next;
12521 int align;
12522
12523 align = 0;
12524 for (c = constants; c != NULL; c = next)
12525 {
12526 /* If necessary, increase the alignment of PC. */
12527 if (align < GET_MODE_SIZE (c->mode))
12528 {
12529 int align_log = floor_log2 (GET_MODE_SIZE (c->mode));
12530 insn = emit_insn_after (gen_align (GEN_INT (align_log)), insn);
12531 }
12532 align = GET_MODE_SIZE (c->mode);
12533
12534 insn = emit_label_after (c->label, insn);
12535 insn = mips16_emit_constants_1 (c->mode, c->value, insn);
12536
12537 next = c->next;
12538 free (c);
12539 }
12540
12541 emit_barrier_after (insn);
12542 }
12543
12544 /* Return the length of instruction INSN. */
12545
12546 static int
12547 mips16_insn_length (rtx insn)
12548 {
12549 if (JUMP_P (insn))
12550 {
12551 rtx body = PATTERN (insn);
12552 if (GET_CODE (body) == ADDR_VEC)
12553 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 0);
12554 if (GET_CODE (body) == ADDR_DIFF_VEC)
12555 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 1);
12556 }
12557 return get_attr_length (insn);
12558 }
12559
12560 /* If *X is a symbolic constant that refers to the constant pool, add
12561 the constant to POOL and rewrite *X to use the constant's label. */
12562
12563 static void
12564 mips16_rewrite_pool_constant (struct mips16_constant_pool *pool, rtx *x)
12565 {
12566 rtx base, offset, label;
12567
12568 split_const (*x, &base, &offset);
12569 if (GET_CODE (base) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (base))
12570 {
12571 label = mips16_add_constant (pool, get_pool_constant (base),
12572 get_pool_mode (base));
12573 base = gen_rtx_LABEL_REF (Pmode, label);
12574 *x = mips_unspec_address_offset (base, offset, SYMBOL_PC_RELATIVE);
12575 }
12576 }
12577
12578 /* This structure is used to communicate with mips16_rewrite_pool_refs.
12579 INSN is the instruction we're rewriting and POOL points to the current
12580 constant pool. */
12581 struct mips16_rewrite_pool_refs_info {
12582 rtx insn;
12583 struct mips16_constant_pool *pool;
12584 };
12585
12586 /* Rewrite *X so that constant pool references refer to the constant's
12587 label instead. DATA points to a mips16_rewrite_pool_refs_info
12588 structure. */
12589
12590 static int
12591 mips16_rewrite_pool_refs (rtx *x, void *data)
12592 {
12593 struct mips16_rewrite_pool_refs_info *info =
12594 (struct mips16_rewrite_pool_refs_info *) data;
12595
12596 if (force_to_mem_operand (*x, Pmode))
12597 {
12598 rtx mem = force_const_mem (GET_MODE (*x), *x);
12599 validate_change (info->insn, x, mem, false);
12600 }
12601
12602 if (MEM_P (*x))
12603 {
12604 mips16_rewrite_pool_constant (info->pool, &XEXP (*x, 0));
12605 return -1;
12606 }
12607
12608 if (TARGET_MIPS16_TEXT_LOADS)
12609 mips16_rewrite_pool_constant (info->pool, x);
12610
12611 return GET_CODE (*x) == CONST ? -1 : 0;
12612 }
12613
12614 /* Build MIPS16 constant pools. */
12615
12616 static void
12617 mips16_lay_out_constants (void)
12618 {
12619 struct mips16_constant_pool pool;
12620 struct mips16_rewrite_pool_refs_info info;
12621 rtx insn, barrier;
12622
12623 if (!TARGET_MIPS16_PCREL_LOADS)
12624 return;
12625
12626 split_all_insns_noflow ();
12627 barrier = 0;
12628 memset (&pool, 0, sizeof (pool));
12629 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
12630 {
12631 /* Rewrite constant pool references in INSN. */
12632 if (INSN_P (insn))
12633 {
12634 info.insn = insn;
12635 info.pool = &pool;
12636 for_each_rtx (&PATTERN (insn), mips16_rewrite_pool_refs, &info);
12637 }
12638
12639 pool.insn_address += mips16_insn_length (insn);
12640
12641 if (pool.first != NULL)
12642 {
12643 /* If there are no natural barriers between the first user of
12644 the pool and the highest acceptable address, we'll need to
12645 create a new instruction to jump around the constant pool.
12646 In the worst case, this instruction will be 4 bytes long.
12647
12648 If it's too late to do this transformation after INSN,
12649 do it immediately before INSN. */
12650 if (barrier == 0 && pool.insn_address + 4 > pool.highest_address)
12651 {
12652 rtx label, jump;
12653
12654 label = gen_label_rtx ();
12655
12656 jump = emit_jump_insn_before (gen_jump (label), insn);
12657 JUMP_LABEL (jump) = label;
12658 LABEL_NUSES (label) = 1;
12659 barrier = emit_barrier_after (jump);
12660
12661 emit_label_after (label, barrier);
12662 pool.insn_address += 4;
12663 }
12664
12665 /* See whether the constant pool is now out of range of the first
12666 user. If so, output the constants after the previous barrier.
12667 Note that any instructions between BARRIER and INSN (inclusive)
12668 will use negative offsets to refer to the pool. */
12669 if (pool.insn_address > pool.highest_address)
12670 {
12671 mips16_emit_constants (pool.first, barrier);
12672 pool.first = NULL;
12673 barrier = 0;
12674 }
12675 else if (BARRIER_P (insn))
12676 barrier = insn;
12677 }
12678 }
12679 mips16_emit_constants (pool.first, get_last_insn ());
12680 }
12681 \f
12682 /* Return true if it is worth r10k_simplify_address's while replacing
12683 an address with X. We are looking for constants, and for addresses
12684 at a known offset from the incoming stack pointer. */
12685
12686 static bool
12687 r10k_simplified_address_p (rtx x)
12688 {
12689 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1)))
12690 x = XEXP (x, 0);
12691 return x == virtual_incoming_args_rtx || CONSTANT_P (x);
12692 }
12693
12694 /* X is an expression that appears in INSN. Try to use the UD chains
12695 to simplify it, returning the simplified form on success and the
12696 original form otherwise. Replace the incoming value of $sp with
12697 virtual_incoming_args_rtx (which should never occur in X otherwise). */
12698
12699 static rtx
12700 r10k_simplify_address (rtx x, rtx insn)
12701 {
12702 rtx newx, op0, op1, set, def_insn, note;
12703 df_ref use, def;
12704 struct df_link *defs;
12705
12706 newx = NULL_RTX;
12707 if (UNARY_P (x))
12708 {
12709 op0 = r10k_simplify_address (XEXP (x, 0), insn);
12710 if (op0 != XEXP (x, 0))
12711 newx = simplify_gen_unary (GET_CODE (x), GET_MODE (x),
12712 op0, GET_MODE (XEXP (x, 0)));
12713 }
12714 else if (BINARY_P (x))
12715 {
12716 op0 = r10k_simplify_address (XEXP (x, 0), insn);
12717 op1 = r10k_simplify_address (XEXP (x, 1), insn);
12718 if (op0 != XEXP (x, 0) || op1 != XEXP (x, 1))
12719 newx = simplify_gen_binary (GET_CODE (x), GET_MODE (x), op0, op1);
12720 }
12721 else if (GET_CODE (x) == LO_SUM)
12722 {
12723 /* LO_SUMs can be offset from HIGHs, if we know they won't
12724 overflow. See mips_classify_address for the rationale behind
12725 the lax check. */
12726 op0 = r10k_simplify_address (XEXP (x, 0), insn);
12727 if (GET_CODE (op0) == HIGH)
12728 newx = XEXP (x, 1);
12729 }
12730 else if (REG_P (x))
12731 {
12732 /* Uses are recorded by regno_reg_rtx, not X itself. */
12733 use = df_find_use (insn, regno_reg_rtx[REGNO (x)]);
12734 gcc_assert (use);
12735 defs = DF_REF_CHAIN (use);
12736
12737 /* Require a single definition. */
12738 if (defs && defs->next == NULL)
12739 {
12740 def = defs->ref;
12741 if (DF_REF_IS_ARTIFICIAL (def))
12742 {
12743 /* Replace the incoming value of $sp with
12744 virtual_incoming_args_rtx. */
12745 if (x == stack_pointer_rtx
12746 && DF_REF_BB (def) == ENTRY_BLOCK_PTR)
12747 newx = virtual_incoming_args_rtx;
12748 }
12749 else if (dominated_by_p (CDI_DOMINATORS, DF_REF_BB (use),
12750 DF_REF_BB (def)))
12751 {
12752 /* Make sure that DEF_INSN is a single set of REG. */
12753 def_insn = DF_REF_INSN (def);
12754 if (NONJUMP_INSN_P (def_insn))
12755 {
12756 set = single_set (def_insn);
12757 if (set && rtx_equal_p (SET_DEST (set), x))
12758 {
12759 /* Prefer to use notes, since the def-use chains
12760 are often shorter. */
12761 note = find_reg_equal_equiv_note (def_insn);
12762 if (note)
12763 newx = XEXP (note, 0);
12764 else
12765 newx = SET_SRC (set);
12766 newx = r10k_simplify_address (newx, def_insn);
12767 }
12768 }
12769 }
12770 }
12771 }
12772 if (newx && r10k_simplified_address_p (newx))
12773 return newx;
12774 return x;
12775 }
12776
12777 /* Return true if ADDRESS is known to be an uncached address
12778 on R10K systems. */
12779
12780 static bool
12781 r10k_uncached_address_p (unsigned HOST_WIDE_INT address)
12782 {
12783 unsigned HOST_WIDE_INT upper;
12784
12785 /* Check for KSEG1. */
12786 if (address + 0x60000000 < 0x20000000)
12787 return true;
12788
12789 /* Check for uncached XKPHYS addresses. */
12790 if (Pmode == DImode)
12791 {
12792 upper = (address >> 40) & 0xf9ffff;
12793 if (upper == 0x900000 || upper == 0xb80000)
12794 return true;
12795 }
12796 return false;
12797 }
12798
12799 /* Return true if we can prove that an access to address X in instruction
12800 INSN would be safe from R10K speculation. This X is a general
12801 expression; it might not be a legitimate address. */
12802
12803 static bool
12804 r10k_safe_address_p (rtx x, rtx insn)
12805 {
12806 rtx base, offset;
12807 HOST_WIDE_INT offset_val;
12808
12809 x = r10k_simplify_address (x, insn);
12810
12811 /* Check for references to the stack frame. It doesn't really matter
12812 how much of the frame has been allocated at INSN; -mr10k-cache-barrier
12813 allows us to assume that accesses to any part of the eventual frame
12814 is safe from speculation at any point in the function. */
12815 mips_split_plus (x, &base, &offset_val);
12816 if (base == virtual_incoming_args_rtx
12817 && offset_val >= -cfun->machine->frame.total_size
12818 && offset_val < cfun->machine->frame.args_size)
12819 return true;
12820
12821 /* Check for uncached addresses. */
12822 if (CONST_INT_P (x))
12823 return r10k_uncached_address_p (INTVAL (x));
12824
12825 /* Check for accesses to a static object. */
12826 split_const (x, &base, &offset);
12827 return offset_within_block_p (base, INTVAL (offset));
12828 }
12829
12830 /* Return true if a MEM with MEM_EXPR EXPR and MEM_OFFSET OFFSET is
12831 an in-range access to an automatic variable, or to an object with
12832 a link-time-constant address. */
12833
12834 static bool
12835 r10k_safe_mem_expr_p (tree expr, rtx offset)
12836 {
12837 if (expr == NULL_TREE
12838 || offset == NULL_RTX
12839 || !CONST_INT_P (offset)
12840 || INTVAL (offset) < 0
12841 || INTVAL (offset) >= int_size_in_bytes (TREE_TYPE (expr)))
12842 return false;
12843
12844 while (TREE_CODE (expr) == COMPONENT_REF)
12845 {
12846 expr = TREE_OPERAND (expr, 0);
12847 if (expr == NULL_TREE)
12848 return false;
12849 }
12850
12851 return DECL_P (expr);
12852 }
12853
12854 /* A for_each_rtx callback for which DATA points to the instruction
12855 containing *X. Stop the search if we find a MEM that is not safe
12856 from R10K speculation. */
12857
12858 static int
12859 r10k_needs_protection_p_1 (rtx *loc, void *data)
12860 {
12861 rtx mem;
12862
12863 mem = *loc;
12864 if (!MEM_P (mem))
12865 return 0;
12866
12867 if (r10k_safe_mem_expr_p (MEM_EXPR (mem), MEM_OFFSET (mem)))
12868 return -1;
12869
12870 if (r10k_safe_address_p (XEXP (mem, 0), (rtx) data))
12871 return -1;
12872
12873 return 1;
12874 }
12875
12876 /* A note_stores callback for which DATA points to an instruction pointer.
12877 If *DATA is nonnull, make it null if it X contains a MEM that is not
12878 safe from R10K speculation. */
12879
12880 static void
12881 r10k_needs_protection_p_store (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
12882 void *data)
12883 {
12884 rtx *insn_ptr;
12885
12886 insn_ptr = (rtx *) data;
12887 if (*insn_ptr && for_each_rtx (&x, r10k_needs_protection_p_1, *insn_ptr))
12888 *insn_ptr = NULL_RTX;
12889 }
12890
12891 /* A for_each_rtx callback that iterates over the pattern of a CALL_INSN.
12892 Return nonzero if the call is not to a declared function. */
12893
12894 static int
12895 r10k_needs_protection_p_call (rtx *loc, void *data ATTRIBUTE_UNUSED)
12896 {
12897 rtx x;
12898
12899 x = *loc;
12900 if (!MEM_P (x))
12901 return 0;
12902
12903 x = XEXP (x, 0);
12904 if (GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_DECL (x))
12905 return -1;
12906
12907 return 1;
12908 }
12909
12910 /* Return true if instruction INSN needs to be protected by an R10K
12911 cache barrier. */
12912
12913 static bool
12914 r10k_needs_protection_p (rtx insn)
12915 {
12916 if (CALL_P (insn))
12917 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_call, NULL);
12918
12919 if (mips_r10k_cache_barrier == R10K_CACHE_BARRIER_STORE)
12920 {
12921 note_stores (PATTERN (insn), r10k_needs_protection_p_store, &insn);
12922 return insn == NULL_RTX;
12923 }
12924
12925 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_1, insn);
12926 }
12927
12928 /* Return true if BB is only reached by blocks in PROTECTED_BBS and if every
12929 edge is unconditional. */
12930
12931 static bool
12932 r10k_protected_bb_p (basic_block bb, sbitmap protected_bbs)
12933 {
12934 edge_iterator ei;
12935 edge e;
12936
12937 FOR_EACH_EDGE (e, ei, bb->preds)
12938 if (!single_succ_p (e->src)
12939 || !TEST_BIT (protected_bbs, e->src->index)
12940 || (e->flags & EDGE_COMPLEX) != 0)
12941 return false;
12942 return true;
12943 }
12944
12945 /* Implement -mr10k-cache-barrier= for the current function. */
12946
12947 static void
12948 r10k_insert_cache_barriers (void)
12949 {
12950 int *rev_post_order;
12951 unsigned int i, n;
12952 basic_block bb;
12953 sbitmap protected_bbs;
12954 rtx insn, end, unprotected_region;
12955
12956 if (TARGET_MIPS16)
12957 {
12958 sorry ("%qs does not support MIPS16 code", "-mr10k-cache-barrier");
12959 return;
12960 }
12961
12962 /* Restore the BLOCK_FOR_INSN pointers, which are needed by DF. */
12963 compute_bb_for_insn ();
12964
12965 /* Create def-use chains. */
12966 df_set_flags (DF_EQ_NOTES);
12967 df_chain_add_problem (DF_UD_CHAIN);
12968 df_analyze ();
12969
12970 /* Calculate dominators. */
12971 calculate_dominance_info (CDI_DOMINATORS);
12972
12973 /* Bit X of PROTECTED_BBS is set if the last operation in basic block
12974 X is protected by a cache barrier. */
12975 protected_bbs = sbitmap_alloc (last_basic_block);
12976 sbitmap_zero (protected_bbs);
12977
12978 /* Iterate over the basic blocks in reverse post-order. */
12979 rev_post_order = XNEWVEC (int, last_basic_block);
12980 n = pre_and_rev_post_order_compute (NULL, rev_post_order, false);
12981 for (i = 0; i < n; i++)
12982 {
12983 bb = BASIC_BLOCK (rev_post_order[i]);
12984
12985 /* If this block is only reached by unconditional edges, and if the
12986 source of every edge is protected, the beginning of the block is
12987 also protected. */
12988 if (r10k_protected_bb_p (bb, protected_bbs))
12989 unprotected_region = NULL_RTX;
12990 else
12991 unprotected_region = pc_rtx;
12992 end = NEXT_INSN (BB_END (bb));
12993
12994 /* UNPROTECTED_REGION is:
12995
12996 - null if we are processing a protected region,
12997 - pc_rtx if we are processing an unprotected region but have
12998 not yet found the first instruction in it
12999 - the first instruction in an unprotected region otherwise. */
13000 for (insn = BB_HEAD (bb); insn != end; insn = NEXT_INSN (insn))
13001 {
13002 if (unprotected_region && INSN_P (insn))
13003 {
13004 if (recog_memoized (insn) == CODE_FOR_mips_cache)
13005 /* This CACHE instruction protects the following code. */
13006 unprotected_region = NULL_RTX;
13007 else
13008 {
13009 /* See if INSN is the first instruction in this
13010 unprotected region. */
13011 if (unprotected_region == pc_rtx)
13012 unprotected_region = insn;
13013
13014 /* See if INSN needs to be protected. If so,
13015 we must insert a cache barrier somewhere between
13016 PREV_INSN (UNPROTECTED_REGION) and INSN. It isn't
13017 clear which position is better performance-wise,
13018 but as a tie-breaker, we assume that it is better
13019 to allow delay slots to be back-filled where
13020 possible, and that it is better not to insert
13021 barriers in the middle of already-scheduled code.
13022 We therefore insert the barrier at the beginning
13023 of the region. */
13024 if (r10k_needs_protection_p (insn))
13025 {
13026 emit_insn_before (gen_r10k_cache_barrier (),
13027 unprotected_region);
13028 unprotected_region = NULL_RTX;
13029 }
13030 }
13031 }
13032
13033 if (CALL_P (insn))
13034 /* The called function is not required to protect the exit path.
13035 The code that follows a call is therefore unprotected. */
13036 unprotected_region = pc_rtx;
13037 }
13038
13039 /* Record whether the end of this block is protected. */
13040 if (unprotected_region == NULL_RTX)
13041 SET_BIT (protected_bbs, bb->index);
13042 }
13043 XDELETEVEC (rev_post_order);
13044
13045 sbitmap_free (protected_bbs);
13046
13047 free_dominance_info (CDI_DOMINATORS);
13048
13049 df_finish_pass (false);
13050
13051 free_bb_for_insn ();
13052 }
13053 \f
13054 /* A temporary variable used by for_each_rtx callbacks, etc. */
13055 static rtx mips_sim_insn;
13056
13057 /* A structure representing the state of the processor pipeline.
13058 Used by the mips_sim_* family of functions. */
13059 struct mips_sim {
13060 /* The maximum number of instructions that can be issued in a cycle.
13061 (Caches mips_issue_rate.) */
13062 unsigned int issue_rate;
13063
13064 /* The current simulation time. */
13065 unsigned int time;
13066
13067 /* How many more instructions can be issued in the current cycle. */
13068 unsigned int insns_left;
13069
13070 /* LAST_SET[X].INSN is the last instruction to set register X.
13071 LAST_SET[X].TIME is the time at which that instruction was issued.
13072 INSN is null if no instruction has yet set register X. */
13073 struct {
13074 rtx insn;
13075 unsigned int time;
13076 } last_set[FIRST_PSEUDO_REGISTER];
13077
13078 /* The pipeline's current DFA state. */
13079 state_t dfa_state;
13080 };
13081
13082 /* Reset STATE to the initial simulation state. */
13083
13084 static void
13085 mips_sim_reset (struct mips_sim *state)
13086 {
13087 state->time = 0;
13088 state->insns_left = state->issue_rate;
13089 memset (&state->last_set, 0, sizeof (state->last_set));
13090 state_reset (state->dfa_state);
13091 }
13092
13093 /* Initialize STATE before its first use. DFA_STATE points to an
13094 allocated but uninitialized DFA state. */
13095
13096 static void
13097 mips_sim_init (struct mips_sim *state, state_t dfa_state)
13098 {
13099 state->issue_rate = mips_issue_rate ();
13100 state->dfa_state = dfa_state;
13101 mips_sim_reset (state);
13102 }
13103
13104 /* Advance STATE by one clock cycle. */
13105
13106 static void
13107 mips_sim_next_cycle (struct mips_sim *state)
13108 {
13109 state->time++;
13110 state->insns_left = state->issue_rate;
13111 state_transition (state->dfa_state, 0);
13112 }
13113
13114 /* Advance simulation state STATE until instruction INSN can read
13115 register REG. */
13116
13117 static void
13118 mips_sim_wait_reg (struct mips_sim *state, rtx insn, rtx reg)
13119 {
13120 unsigned int regno, end_regno;
13121
13122 end_regno = END_REGNO (reg);
13123 for (regno = REGNO (reg); regno < end_regno; regno++)
13124 if (state->last_set[regno].insn != 0)
13125 {
13126 unsigned int t;
13127
13128 t = (state->last_set[regno].time
13129 + insn_latency (state->last_set[regno].insn, insn));
13130 while (state->time < t)
13131 mips_sim_next_cycle (state);
13132 }
13133 }
13134
13135 /* A for_each_rtx callback. If *X is a register, advance simulation state
13136 DATA until mips_sim_insn can read the register's value. */
13137
13138 static int
13139 mips_sim_wait_regs_2 (rtx *x, void *data)
13140 {
13141 if (REG_P (*x))
13142 mips_sim_wait_reg ((struct mips_sim *) data, mips_sim_insn, *x);
13143 return 0;
13144 }
13145
13146 /* Call mips_sim_wait_regs_2 (R, DATA) for each register R mentioned in *X. */
13147
13148 static void
13149 mips_sim_wait_regs_1 (rtx *x, void *data)
13150 {
13151 for_each_rtx (x, mips_sim_wait_regs_2, data);
13152 }
13153
13154 /* Advance simulation state STATE until all of INSN's register
13155 dependencies are satisfied. */
13156
13157 static void
13158 mips_sim_wait_regs (struct mips_sim *state, rtx insn)
13159 {
13160 mips_sim_insn = insn;
13161 note_uses (&PATTERN (insn), mips_sim_wait_regs_1, state);
13162 }
13163
13164 /* Advance simulation state STATE until the units required by
13165 instruction INSN are available. */
13166
13167 static void
13168 mips_sim_wait_units (struct mips_sim *state, rtx insn)
13169 {
13170 state_t tmp_state;
13171
13172 tmp_state = alloca (state_size ());
13173 while (state->insns_left == 0
13174 || (memcpy (tmp_state, state->dfa_state, state_size ()),
13175 state_transition (tmp_state, insn) >= 0))
13176 mips_sim_next_cycle (state);
13177 }
13178
13179 /* Advance simulation state STATE until INSN is ready to issue. */
13180
13181 static void
13182 mips_sim_wait_insn (struct mips_sim *state, rtx insn)
13183 {
13184 mips_sim_wait_regs (state, insn);
13185 mips_sim_wait_units (state, insn);
13186 }
13187
13188 /* mips_sim_insn has just set X. Update the LAST_SET array
13189 in simulation state DATA. */
13190
13191 static void
13192 mips_sim_record_set (rtx x, const_rtx pat ATTRIBUTE_UNUSED, void *data)
13193 {
13194 struct mips_sim *state;
13195
13196 state = (struct mips_sim *) data;
13197 if (REG_P (x))
13198 {
13199 unsigned int regno, end_regno;
13200
13201 end_regno = END_REGNO (x);
13202 for (regno = REGNO (x); regno < end_regno; regno++)
13203 {
13204 state->last_set[regno].insn = mips_sim_insn;
13205 state->last_set[regno].time = state->time;
13206 }
13207 }
13208 }
13209
13210 /* Issue instruction INSN in scheduler state STATE. Assume that INSN
13211 can issue immediately (i.e., that mips_sim_wait_insn has already
13212 been called). */
13213
13214 static void
13215 mips_sim_issue_insn (struct mips_sim *state, rtx insn)
13216 {
13217 state_transition (state->dfa_state, insn);
13218 state->insns_left--;
13219
13220 mips_sim_insn = insn;
13221 note_stores (PATTERN (insn), mips_sim_record_set, state);
13222 }
13223
13224 /* Simulate issuing a NOP in state STATE. */
13225
13226 static void
13227 mips_sim_issue_nop (struct mips_sim *state)
13228 {
13229 if (state->insns_left == 0)
13230 mips_sim_next_cycle (state);
13231 state->insns_left--;
13232 }
13233
13234 /* Update simulation state STATE so that it's ready to accept the instruction
13235 after INSN. INSN should be part of the main rtl chain, not a member of a
13236 SEQUENCE. */
13237
13238 static void
13239 mips_sim_finish_insn (struct mips_sim *state, rtx insn)
13240 {
13241 /* If INSN is a jump with an implicit delay slot, simulate a nop. */
13242 if (JUMP_P (insn))
13243 mips_sim_issue_nop (state);
13244
13245 switch (GET_CODE (SEQ_BEGIN (insn)))
13246 {
13247 case CODE_LABEL:
13248 case CALL_INSN:
13249 /* We can't predict the processor state after a call or label. */
13250 mips_sim_reset (state);
13251 break;
13252
13253 case JUMP_INSN:
13254 /* The delay slots of branch likely instructions are only executed
13255 when the branch is taken. Therefore, if the caller has simulated
13256 the delay slot instruction, STATE does not really reflect the state
13257 of the pipeline for the instruction after the delay slot. Also,
13258 branch likely instructions tend to incur a penalty when not taken,
13259 so there will probably be an extra delay between the branch and
13260 the instruction after the delay slot. */
13261 if (INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (insn)))
13262 mips_sim_reset (state);
13263 break;
13264
13265 default:
13266 break;
13267 }
13268 }
13269 \f
13270 /* The VR4130 pipeline issues aligned pairs of instructions together,
13271 but it stalls the second instruction if it depends on the first.
13272 In order to cut down the amount of logic required, this dependence
13273 check is not based on a full instruction decode. Instead, any non-SPECIAL
13274 instruction is assumed to modify the register specified by bits 20-16
13275 (which is usually the "rt" field).
13276
13277 In BEQ, BEQL, BNE and BNEL instructions, the rt field is actually an
13278 input, so we can end up with a false dependence between the branch
13279 and its delay slot. If this situation occurs in instruction INSN,
13280 try to avoid it by swapping rs and rt. */
13281
13282 static void
13283 vr4130_avoid_branch_rt_conflict (rtx insn)
13284 {
13285 rtx first, second;
13286
13287 first = SEQ_BEGIN (insn);
13288 second = SEQ_END (insn);
13289 if (JUMP_P (first)
13290 && NONJUMP_INSN_P (second)
13291 && GET_CODE (PATTERN (first)) == SET
13292 && GET_CODE (SET_DEST (PATTERN (first))) == PC
13293 && GET_CODE (SET_SRC (PATTERN (first))) == IF_THEN_ELSE)
13294 {
13295 /* Check for the right kind of condition. */
13296 rtx cond = XEXP (SET_SRC (PATTERN (first)), 0);
13297 if ((GET_CODE (cond) == EQ || GET_CODE (cond) == NE)
13298 && REG_P (XEXP (cond, 0))
13299 && REG_P (XEXP (cond, 1))
13300 && reg_referenced_p (XEXP (cond, 1), PATTERN (second))
13301 && !reg_referenced_p (XEXP (cond, 0), PATTERN (second)))
13302 {
13303 /* SECOND mentions the rt register but not the rs register. */
13304 rtx tmp = XEXP (cond, 0);
13305 XEXP (cond, 0) = XEXP (cond, 1);
13306 XEXP (cond, 1) = tmp;
13307 }
13308 }
13309 }
13310
13311 /* Implement -mvr4130-align. Go through each basic block and simulate the
13312 processor pipeline. If we find that a pair of instructions could execute
13313 in parallel, and the first of those instructions is not 8-byte aligned,
13314 insert a nop to make it aligned. */
13315
13316 static void
13317 vr4130_align_insns (void)
13318 {
13319 struct mips_sim state;
13320 rtx insn, subinsn, last, last2, next;
13321 bool aligned_p;
13322
13323 dfa_start ();
13324
13325 /* LAST is the last instruction before INSN to have a nonzero length.
13326 LAST2 is the last such instruction before LAST. */
13327 last = 0;
13328 last2 = 0;
13329
13330 /* ALIGNED_P is true if INSN is known to be at an aligned address. */
13331 aligned_p = true;
13332
13333 mips_sim_init (&state, alloca (state_size ()));
13334 for (insn = get_insns (); insn != 0; insn = next)
13335 {
13336 unsigned int length;
13337
13338 next = NEXT_INSN (insn);
13339
13340 /* See the comment above vr4130_avoid_branch_rt_conflict for details.
13341 This isn't really related to the alignment pass, but we do it on
13342 the fly to avoid a separate instruction walk. */
13343 vr4130_avoid_branch_rt_conflict (insn);
13344
13345 if (USEFUL_INSN_P (insn))
13346 FOR_EACH_SUBINSN (subinsn, insn)
13347 {
13348 mips_sim_wait_insn (&state, subinsn);
13349
13350 /* If we want this instruction to issue in parallel with the
13351 previous one, make sure that the previous instruction is
13352 aligned. There are several reasons why this isn't worthwhile
13353 when the second instruction is a call:
13354
13355 - Calls are less likely to be performance critical,
13356 - There's a good chance that the delay slot can execute
13357 in parallel with the call.
13358 - The return address would then be unaligned.
13359
13360 In general, if we're going to insert a nop between instructions
13361 X and Y, it's better to insert it immediately after X. That
13362 way, if the nop makes Y aligned, it will also align any labels
13363 between X and Y. */
13364 if (state.insns_left != state.issue_rate
13365 && !CALL_P (subinsn))
13366 {
13367 if (subinsn == SEQ_BEGIN (insn) && aligned_p)
13368 {
13369 /* SUBINSN is the first instruction in INSN and INSN is
13370 aligned. We want to align the previous instruction
13371 instead, so insert a nop between LAST2 and LAST.
13372
13373 Note that LAST could be either a single instruction
13374 or a branch with a delay slot. In the latter case,
13375 LAST, like INSN, is already aligned, but the delay
13376 slot must have some extra delay that stops it from
13377 issuing at the same time as the branch. We therefore
13378 insert a nop before the branch in order to align its
13379 delay slot. */
13380 emit_insn_after (gen_nop (), last2);
13381 aligned_p = false;
13382 }
13383 else if (subinsn != SEQ_BEGIN (insn) && !aligned_p)
13384 {
13385 /* SUBINSN is the delay slot of INSN, but INSN is
13386 currently unaligned. Insert a nop between
13387 LAST and INSN to align it. */
13388 emit_insn_after (gen_nop (), last);
13389 aligned_p = true;
13390 }
13391 }
13392 mips_sim_issue_insn (&state, subinsn);
13393 }
13394 mips_sim_finish_insn (&state, insn);
13395
13396 /* Update LAST, LAST2 and ALIGNED_P for the next instruction. */
13397 length = get_attr_length (insn);
13398 if (length > 0)
13399 {
13400 /* If the instruction is an asm statement or multi-instruction
13401 mips.md patern, the length is only an estimate. Insert an
13402 8 byte alignment after it so that the following instructions
13403 can be handled correctly. */
13404 if (NONJUMP_INSN_P (SEQ_BEGIN (insn))
13405 && (recog_memoized (insn) < 0 || length >= 8))
13406 {
13407 next = emit_insn_after (gen_align (GEN_INT (3)), insn);
13408 next = NEXT_INSN (next);
13409 mips_sim_next_cycle (&state);
13410 aligned_p = true;
13411 }
13412 else if (length & 4)
13413 aligned_p = !aligned_p;
13414 last2 = last;
13415 last = insn;
13416 }
13417
13418 /* See whether INSN is an aligned label. */
13419 if (LABEL_P (insn) && label_to_alignment (insn) >= 3)
13420 aligned_p = true;
13421 }
13422 dfa_finish ();
13423 }
13424 \f
13425 /* This structure records that the current function has a LO_SUM
13426 involving SYMBOL_REF or LABEL_REF BASE and that MAX_OFFSET is
13427 the largest offset applied to BASE by all such LO_SUMs. */
13428 struct mips_lo_sum_offset {
13429 rtx base;
13430 HOST_WIDE_INT offset;
13431 };
13432
13433 /* Return a hash value for SYMBOL_REF or LABEL_REF BASE. */
13434
13435 static hashval_t
13436 mips_hash_base (rtx base)
13437 {
13438 int do_not_record_p;
13439
13440 return hash_rtx (base, GET_MODE (base), &do_not_record_p, NULL, false);
13441 }
13442
13443 /* Hash-table callbacks for mips_lo_sum_offsets. */
13444
13445 static hashval_t
13446 mips_lo_sum_offset_hash (const void *entry)
13447 {
13448 return mips_hash_base (((const struct mips_lo_sum_offset *) entry)->base);
13449 }
13450
13451 static int
13452 mips_lo_sum_offset_eq (const void *entry, const void *value)
13453 {
13454 return rtx_equal_p (((const struct mips_lo_sum_offset *) entry)->base,
13455 (const_rtx) value);
13456 }
13457
13458 /* Look up symbolic constant X in HTAB, which is a hash table of
13459 mips_lo_sum_offsets. If OPTION is NO_INSERT, return true if X can be
13460 paired with a recorded LO_SUM, otherwise record X in the table. */
13461
13462 static bool
13463 mips_lo_sum_offset_lookup (htab_t htab, rtx x, enum insert_option option)
13464 {
13465 rtx base, offset;
13466 void **slot;
13467 struct mips_lo_sum_offset *entry;
13468
13469 /* Split X into a base and offset. */
13470 split_const (x, &base, &offset);
13471 if (UNSPEC_ADDRESS_P (base))
13472 base = UNSPEC_ADDRESS (base);
13473
13474 /* Look up the base in the hash table. */
13475 slot = htab_find_slot_with_hash (htab, base, mips_hash_base (base), option);
13476 if (slot == NULL)
13477 return false;
13478
13479 entry = (struct mips_lo_sum_offset *) *slot;
13480 if (option == INSERT)
13481 {
13482 if (entry == NULL)
13483 {
13484 entry = XNEW (struct mips_lo_sum_offset);
13485 entry->base = base;
13486 entry->offset = INTVAL (offset);
13487 *slot = entry;
13488 }
13489 else
13490 {
13491 if (INTVAL (offset) > entry->offset)
13492 entry->offset = INTVAL (offset);
13493 }
13494 }
13495 return INTVAL (offset) <= entry->offset;
13496 }
13497
13498 /* A for_each_rtx callback for which DATA is a mips_lo_sum_offset hash table.
13499 Record every LO_SUM in *LOC. */
13500
13501 static int
13502 mips_record_lo_sum (rtx *loc, void *data)
13503 {
13504 if (GET_CODE (*loc) == LO_SUM)
13505 mips_lo_sum_offset_lookup ((htab_t) data, XEXP (*loc, 1), INSERT);
13506 return 0;
13507 }
13508
13509 /* Return true if INSN is a SET of an orphaned high-part relocation.
13510 HTAB is a hash table of mips_lo_sum_offsets that describes all the
13511 LO_SUMs in the current function. */
13512
13513 static bool
13514 mips_orphaned_high_part_p (htab_t htab, rtx insn)
13515 {
13516 enum mips_symbol_type type;
13517 rtx x, set;
13518
13519 set = single_set (insn);
13520 if (set)
13521 {
13522 /* Check for %his. */
13523 x = SET_SRC (set);
13524 if (GET_CODE (x) == HIGH
13525 && absolute_symbolic_operand (XEXP (x, 0), VOIDmode))
13526 return !mips_lo_sum_offset_lookup (htab, XEXP (x, 0), NO_INSERT);
13527
13528 /* Check for local %gots (and %got_pages, which is redundant but OK). */
13529 if (GET_CODE (x) == UNSPEC
13530 && XINT (x, 1) == UNSPEC_LOAD_GOT
13531 && mips_symbolic_constant_p (XVECEXP (x, 0, 1),
13532 SYMBOL_CONTEXT_LEA, &type)
13533 && type == SYMBOL_GOTOFF_PAGE)
13534 return !mips_lo_sum_offset_lookup (htab, XVECEXP (x, 0, 1), NO_INSERT);
13535 }
13536 return false;
13537 }
13538
13539 /* Subroutine of mips_reorg_process_insns. If there is a hazard between
13540 INSN and a previous instruction, avoid it by inserting nops after
13541 instruction AFTER.
13542
13543 *DELAYED_REG and *HILO_DELAY describe the hazards that apply at
13544 this point. If *DELAYED_REG is non-null, INSN must wait a cycle
13545 before using the value of that register. *HILO_DELAY counts the
13546 number of instructions since the last hilo hazard (that is,
13547 the number of instructions since the last MFLO or MFHI).
13548
13549 After inserting nops for INSN, update *DELAYED_REG and *HILO_DELAY
13550 for the next instruction.
13551
13552 LO_REG is an rtx for the LO register, used in dependence checking. */
13553
13554 static void
13555 mips_avoid_hazard (rtx after, rtx insn, int *hilo_delay,
13556 rtx *delayed_reg, rtx lo_reg)
13557 {
13558 rtx pattern, set;
13559 int nops, ninsns;
13560
13561 pattern = PATTERN (insn);
13562
13563 /* Do not put the whole function in .set noreorder if it contains
13564 an asm statement. We don't know whether there will be hazards
13565 between the asm statement and the gcc-generated code. */
13566 if (GET_CODE (pattern) == ASM_INPUT || asm_noperands (pattern) >= 0)
13567 cfun->machine->all_noreorder_p = false;
13568
13569 /* Ignore zero-length instructions (barriers and the like). */
13570 ninsns = get_attr_length (insn) / 4;
13571 if (ninsns == 0)
13572 return;
13573
13574 /* Work out how many nops are needed. Note that we only care about
13575 registers that are explicitly mentioned in the instruction's pattern.
13576 It doesn't matter that calls use the argument registers or that they
13577 clobber hi and lo. */
13578 if (*hilo_delay < 2 && reg_set_p (lo_reg, pattern))
13579 nops = 2 - *hilo_delay;
13580 else if (*delayed_reg != 0 && reg_referenced_p (*delayed_reg, pattern))
13581 nops = 1;
13582 else
13583 nops = 0;
13584
13585 /* Insert the nops between this instruction and the previous one.
13586 Each new nop takes us further from the last hilo hazard. */
13587 *hilo_delay += nops;
13588 while (nops-- > 0)
13589 emit_insn_after (gen_hazard_nop (), after);
13590
13591 /* Set up the state for the next instruction. */
13592 *hilo_delay += ninsns;
13593 *delayed_reg = 0;
13594 if (INSN_CODE (insn) >= 0)
13595 switch (get_attr_hazard (insn))
13596 {
13597 case HAZARD_NONE:
13598 break;
13599
13600 case HAZARD_HILO:
13601 *hilo_delay = 0;
13602 break;
13603
13604 case HAZARD_DELAY:
13605 set = single_set (insn);
13606 gcc_assert (set);
13607 *delayed_reg = SET_DEST (set);
13608 break;
13609 }
13610 }
13611
13612 /* Go through the instruction stream and insert nops where necessary.
13613 Also delete any high-part relocations whose partnering low parts
13614 are now all dead. See if the whole function can then be put into
13615 .set noreorder and .set nomacro. */
13616
13617 static void
13618 mips_reorg_process_insns (void)
13619 {
13620 rtx insn, last_insn, subinsn, next_insn, lo_reg, delayed_reg;
13621 int hilo_delay;
13622 htab_t htab;
13623
13624 /* Force all instructions to be split into their final form. */
13625 split_all_insns_noflow ();
13626
13627 /* Recalculate instruction lengths without taking nops into account. */
13628 cfun->machine->ignore_hazard_length_p = true;
13629 shorten_branches (get_insns ());
13630
13631 cfun->machine->all_noreorder_p = true;
13632
13633 /* We don't track MIPS16 PC-relative offsets closely enough to make
13634 a good job of "set .noreorder" code in MIPS16 mode. */
13635 if (TARGET_MIPS16)
13636 cfun->machine->all_noreorder_p = false;
13637
13638 /* Code that doesn't use explicit relocs can't be ".set nomacro". */
13639 if (!TARGET_EXPLICIT_RELOCS)
13640 cfun->machine->all_noreorder_p = false;
13641
13642 /* Profiled functions can't be all noreorder because the profiler
13643 support uses assembler macros. */
13644 if (crtl->profile)
13645 cfun->machine->all_noreorder_p = false;
13646
13647 /* Code compiled with -mfix-vr4120 can't be all noreorder because
13648 we rely on the assembler to work around some errata. */
13649 if (TARGET_FIX_VR4120)
13650 cfun->machine->all_noreorder_p = false;
13651
13652 /* The same is true for -mfix-vr4130 if we might generate MFLO or
13653 MFHI instructions. Note that we avoid using MFLO and MFHI if
13654 the VR4130 MACC and DMACC instructions are available instead;
13655 see the *mfhilo_{si,di}_macc patterns. */
13656 if (TARGET_FIX_VR4130 && !ISA_HAS_MACCHI)
13657 cfun->machine->all_noreorder_p = false;
13658
13659 htab = htab_create (37, mips_lo_sum_offset_hash,
13660 mips_lo_sum_offset_eq, free);
13661
13662 /* Make a first pass over the instructions, recording all the LO_SUMs. */
13663 for (insn = get_insns (); insn != 0; insn = NEXT_INSN (insn))
13664 FOR_EACH_SUBINSN (subinsn, insn)
13665 if (INSN_P (subinsn))
13666 for_each_rtx (&PATTERN (subinsn), mips_record_lo_sum, htab);
13667
13668 last_insn = 0;
13669 hilo_delay = 2;
13670 delayed_reg = 0;
13671 lo_reg = gen_rtx_REG (SImode, LO_REGNUM);
13672
13673 /* Make a second pass over the instructions. Delete orphaned
13674 high-part relocations or turn them into NOPs. Avoid hazards
13675 by inserting NOPs. */
13676 for (insn = get_insns (); insn != 0; insn = next_insn)
13677 {
13678 next_insn = NEXT_INSN (insn);
13679 if (INSN_P (insn))
13680 {
13681 if (GET_CODE (PATTERN (insn)) == SEQUENCE)
13682 {
13683 /* If we find an orphaned high-part relocation in a delay
13684 slot, it's easier to turn that instruction into a NOP than
13685 to delete it. The delay slot will be a NOP either way. */
13686 FOR_EACH_SUBINSN (subinsn, insn)
13687 if (INSN_P (subinsn))
13688 {
13689 if (mips_orphaned_high_part_p (htab, subinsn))
13690 {
13691 PATTERN (subinsn) = gen_nop ();
13692 INSN_CODE (subinsn) = CODE_FOR_nop;
13693 }
13694 mips_avoid_hazard (last_insn, subinsn, &hilo_delay,
13695 &delayed_reg, lo_reg);
13696 }
13697 last_insn = insn;
13698 }
13699 else
13700 {
13701 /* INSN is a single instruction. Delete it if it's an
13702 orphaned high-part relocation. */
13703 if (mips_orphaned_high_part_p (htab, insn))
13704 delete_insn (insn);
13705 /* Also delete cache barriers if the last instruction
13706 was an annulled branch. INSN will not be speculatively
13707 executed. */
13708 else if (recog_memoized (insn) == CODE_FOR_r10k_cache_barrier
13709 && last_insn
13710 && INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (last_insn)))
13711 delete_insn (insn);
13712 else
13713 {
13714 mips_avoid_hazard (last_insn, insn, &hilo_delay,
13715 &delayed_reg, lo_reg);
13716 last_insn = insn;
13717 }
13718 }
13719 }
13720 }
13721
13722 htab_delete (htab);
13723 }
13724
13725 /* Implement TARGET_MACHINE_DEPENDENT_REORG. */
13726
13727 static void
13728 mips_reorg (void)
13729 {
13730 mips16_lay_out_constants ();
13731 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE)
13732 r10k_insert_cache_barriers ();
13733 if (optimize > 0 && flag_delayed_branch)
13734 dbr_schedule (get_insns ());
13735 mips_reorg_process_insns ();
13736 if (!TARGET_MIPS16
13737 && TARGET_EXPLICIT_RELOCS
13738 && TUNE_MIPS4130
13739 && TARGET_VR4130_ALIGN)
13740 vr4130_align_insns ();
13741 }
13742 \f
13743 /* Implement TARGET_ASM_OUTPUT_MI_THUNK. Generate rtl rather than asm text
13744 in order to avoid duplicating too much logic from elsewhere. */
13745
13746 static void
13747 mips_output_mi_thunk (FILE *file, tree thunk_fndecl ATTRIBUTE_UNUSED,
13748 HOST_WIDE_INT delta, HOST_WIDE_INT vcall_offset,
13749 tree function)
13750 {
13751 rtx this_rtx, temp1, temp2, insn, fnaddr;
13752 bool use_sibcall_p;
13753
13754 /* Pretend to be a post-reload pass while generating rtl. */
13755 reload_completed = 1;
13756
13757 /* Mark the end of the (empty) prologue. */
13758 emit_note (NOTE_INSN_PROLOGUE_END);
13759
13760 /* Determine if we can use a sibcall to call FUNCTION directly. */
13761 fnaddr = XEXP (DECL_RTL (function), 0);
13762 use_sibcall_p = (mips_function_ok_for_sibcall (function, NULL)
13763 && const_call_insn_operand (fnaddr, Pmode));
13764
13765 /* Determine if we need to load FNADDR from the GOT. */
13766 if (!use_sibcall_p
13767 && (mips_got_symbol_type_p
13768 (mips_classify_symbol (fnaddr, SYMBOL_CONTEXT_LEA))))
13769 {
13770 /* Pick a global pointer. Use a call-clobbered register if
13771 TARGET_CALL_SAVED_GP. */
13772 cfun->machine->global_pointer
13773 = TARGET_CALL_SAVED_GP ? 15 : GLOBAL_POINTER_REGNUM;
13774 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
13775
13776 /* Set up the global pointer for n32 or n64 abicalls. */
13777 mips_emit_loadgp ();
13778 }
13779
13780 /* We need two temporary registers in some cases. */
13781 temp1 = gen_rtx_REG (Pmode, 2);
13782 temp2 = gen_rtx_REG (Pmode, 3);
13783
13784 /* Find out which register contains the "this" pointer. */
13785 if (aggregate_value_p (TREE_TYPE (TREE_TYPE (function)), function))
13786 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST + 1);
13787 else
13788 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST);
13789
13790 /* Add DELTA to THIS_RTX. */
13791 if (delta != 0)
13792 {
13793 rtx offset = GEN_INT (delta);
13794 if (!SMALL_OPERAND (delta))
13795 {
13796 mips_emit_move (temp1, offset);
13797 offset = temp1;
13798 }
13799 emit_insn (gen_add3_insn (this_rtx, this_rtx, offset));
13800 }
13801
13802 /* If needed, add *(*THIS_RTX + VCALL_OFFSET) to THIS_RTX. */
13803 if (vcall_offset != 0)
13804 {
13805 rtx addr;
13806
13807 /* Set TEMP1 to *THIS_RTX. */
13808 mips_emit_move (temp1, gen_rtx_MEM (Pmode, this_rtx));
13809
13810 /* Set ADDR to a legitimate address for *THIS_RTX + VCALL_OFFSET. */
13811 addr = mips_add_offset (temp2, temp1, vcall_offset);
13812
13813 /* Load the offset and add it to THIS_RTX. */
13814 mips_emit_move (temp1, gen_rtx_MEM (Pmode, addr));
13815 emit_insn (gen_add3_insn (this_rtx, this_rtx, temp1));
13816 }
13817
13818 /* Jump to the target function. Use a sibcall if direct jumps are
13819 allowed, otherwise load the address into a register first. */
13820 if (use_sibcall_p)
13821 {
13822 insn = emit_call_insn (gen_sibcall_internal (fnaddr, const0_rtx));
13823 SIBLING_CALL_P (insn) = 1;
13824 }
13825 else
13826 {
13827 /* This is messy. GAS treats "la $25,foo" as part of a call
13828 sequence and may allow a global "foo" to be lazily bound.
13829 The general move patterns therefore reject this combination.
13830
13831 In this context, lazy binding would actually be OK
13832 for TARGET_CALL_CLOBBERED_GP, but it's still wrong for
13833 TARGET_CALL_SAVED_GP; see mips_load_call_address.
13834 We must therefore load the address via a temporary
13835 register if mips_dangerous_for_la25_p.
13836
13837 If we jump to the temporary register rather than $25,
13838 the assembler can use the move insn to fill the jump's
13839 delay slot.
13840
13841 We can use the same technique for MIPS16 code, where $25
13842 is not a valid JR register. */
13843 if (TARGET_USE_PIC_FN_ADDR_REG
13844 && !TARGET_MIPS16
13845 && !mips_dangerous_for_la25_p (fnaddr))
13846 temp1 = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
13847 mips_load_call_address (MIPS_CALL_SIBCALL, temp1, fnaddr);
13848
13849 if (TARGET_USE_PIC_FN_ADDR_REG
13850 && REGNO (temp1) != PIC_FUNCTION_ADDR_REGNUM)
13851 mips_emit_move (gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM), temp1);
13852 emit_jump_insn (gen_indirect_jump (temp1));
13853 }
13854
13855 /* Run just enough of rest_of_compilation. This sequence was
13856 "borrowed" from alpha.c. */
13857 insn = get_insns ();
13858 insn_locators_alloc ();
13859 split_all_insns_noflow ();
13860 mips16_lay_out_constants ();
13861 shorten_branches (insn);
13862 final_start_function (insn, file, 1);
13863 final (insn, file, 1);
13864 final_end_function ();
13865 free_after_compilation (cfun);
13866
13867 /* Clean up the vars set above. Note that final_end_function resets
13868 the global pointer for us. */
13869 reload_completed = 0;
13870 }
13871 \f
13872 /* The last argument passed to mips_set_mips16_mode, or negative if the
13873 function hasn't been called yet.
13874
13875 There are two copies of this information. One is saved and restored
13876 by the PCH process while the other is specific to this compiler
13877 invocation. The information calculated by mips_set_mips16_mode
13878 is invalid unless the two variables are the same. */
13879 static int was_mips16_p = -1;
13880 static GTY(()) int was_mips16_pch_p = -1;
13881
13882 /* Set up the target-dependent global state so that it matches the
13883 current function's ISA mode. */
13884
13885 static void
13886 mips_set_mips16_mode (int mips16_p)
13887 {
13888 if (mips16_p == was_mips16_p
13889 && mips16_p == was_mips16_pch_p)
13890 return;
13891
13892 /* Restore base settings of various flags. */
13893 target_flags = mips_base_target_flags;
13894 flag_schedule_insns = mips_base_schedule_insns;
13895 flag_reorder_blocks_and_partition = mips_base_reorder_blocks_and_partition;
13896 flag_move_loop_invariants = mips_base_move_loop_invariants;
13897 align_loops = mips_base_align_loops;
13898 align_jumps = mips_base_align_jumps;
13899 align_functions = mips_base_align_functions;
13900
13901 if (mips16_p)
13902 {
13903 /* Switch to MIPS16 mode. */
13904 target_flags |= MASK_MIPS16;
13905
13906 /* Don't run the scheduler before reload, since it tends to
13907 increase register pressure. */
13908 flag_schedule_insns = 0;
13909
13910 /* Don't do hot/cold partitioning. mips16_lay_out_constants expects
13911 the whole function to be in a single section. */
13912 flag_reorder_blocks_and_partition = 0;
13913
13914 /* Don't move loop invariants, because it tends to increase
13915 register pressure. It also introduces an extra move in cases
13916 where the constant is the first operand in a two-operand binary
13917 instruction, or when it forms a register argument to a functon
13918 call. */
13919 flag_move_loop_invariants = 0;
13920
13921 target_flags |= MASK_EXPLICIT_RELOCS;
13922
13923 /* Experiments suggest we get the best overall section-anchor
13924 results from using the range of an unextended LW or SW. Code
13925 that makes heavy use of byte or short accesses can do better
13926 with ranges of 0...31 and 0...63 respectively, but most code is
13927 sensitive to the range of LW and SW instead. */
13928 targetm.min_anchor_offset = 0;
13929 targetm.max_anchor_offset = 127;
13930
13931 if (flag_pic && !TARGET_OLDABI)
13932 sorry ("MIPS16 PIC for ABIs other than o32 and o64");
13933
13934 if (TARGET_XGOT)
13935 sorry ("MIPS16 -mxgot code");
13936
13937 if (TARGET_HARD_FLOAT_ABI && !TARGET_OLDABI)
13938 sorry ("hard-float MIPS16 code for ABIs other than o32 and o64");
13939 }
13940 else
13941 {
13942 /* Switch to normal (non-MIPS16) mode. */
13943 target_flags &= ~MASK_MIPS16;
13944
13945 /* Provide default values for align_* for 64-bit targets. */
13946 if (TARGET_64BIT)
13947 {
13948 if (align_loops == 0)
13949 align_loops = 8;
13950 if (align_jumps == 0)
13951 align_jumps = 8;
13952 if (align_functions == 0)
13953 align_functions = 8;
13954 }
13955
13956 targetm.min_anchor_offset = -32768;
13957 targetm.max_anchor_offset = 32767;
13958 }
13959
13960 /* (Re)initialize MIPS target internals for new ISA. */
13961 mips_init_relocs ();
13962
13963 if (was_mips16_p >= 0 || was_mips16_pch_p >= 0)
13964 /* Reinitialize target-dependent state. */
13965 target_reinit ();
13966
13967 was_mips16_p = mips16_p;
13968 was_mips16_pch_p = mips16_p;
13969 }
13970
13971 /* Implement TARGET_SET_CURRENT_FUNCTION. Decide whether the current
13972 function should use the MIPS16 ISA and switch modes accordingly. */
13973
13974 static void
13975 mips_set_current_function (tree fndecl)
13976 {
13977 mips_set_mips16_mode (mips_use_mips16_mode_p (fndecl));
13978 }
13979 \f
13980 /* Allocate a chunk of memory for per-function machine-dependent data. */
13981
13982 static struct machine_function *
13983 mips_init_machine_status (void)
13984 {
13985 return ((struct machine_function *)
13986 ggc_alloc_cleared (sizeof (struct machine_function)));
13987 }
13988
13989 /* Return the processor associated with the given ISA level, or null
13990 if the ISA isn't valid. */
13991
13992 static const struct mips_cpu_info *
13993 mips_cpu_info_from_isa (int isa)
13994 {
13995 unsigned int i;
13996
13997 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
13998 if (mips_cpu_info_table[i].isa == isa)
13999 return mips_cpu_info_table + i;
14000
14001 return NULL;
14002 }
14003
14004 /* Return true if GIVEN is the same as CANONICAL, or if it is CANONICAL
14005 with a final "000" replaced by "k". Ignore case.
14006
14007 Note: this function is shared between GCC and GAS. */
14008
14009 static bool
14010 mips_strict_matching_cpu_name_p (const char *canonical, const char *given)
14011 {
14012 while (*given != 0 && TOLOWER (*given) == TOLOWER (*canonical))
14013 given++, canonical++;
14014
14015 return ((*given == 0 && *canonical == 0)
14016 || (strcmp (canonical, "000") == 0 && strcasecmp (given, "k") == 0));
14017 }
14018
14019 /* Return true if GIVEN matches CANONICAL, where GIVEN is a user-supplied
14020 CPU name. We've traditionally allowed a lot of variation here.
14021
14022 Note: this function is shared between GCC and GAS. */
14023
14024 static bool
14025 mips_matching_cpu_name_p (const char *canonical, const char *given)
14026 {
14027 /* First see if the name matches exactly, or with a final "000"
14028 turned into "k". */
14029 if (mips_strict_matching_cpu_name_p (canonical, given))
14030 return true;
14031
14032 /* If not, try comparing based on numerical designation alone.
14033 See if GIVEN is an unadorned number, or 'r' followed by a number. */
14034 if (TOLOWER (*given) == 'r')
14035 given++;
14036 if (!ISDIGIT (*given))
14037 return false;
14038
14039 /* Skip over some well-known prefixes in the canonical name,
14040 hoping to find a number there too. */
14041 if (TOLOWER (canonical[0]) == 'v' && TOLOWER (canonical[1]) == 'r')
14042 canonical += 2;
14043 else if (TOLOWER (canonical[0]) == 'r' && TOLOWER (canonical[1]) == 'm')
14044 canonical += 2;
14045 else if (TOLOWER (canonical[0]) == 'r')
14046 canonical += 1;
14047
14048 return mips_strict_matching_cpu_name_p (canonical, given);
14049 }
14050
14051 /* Return the mips_cpu_info entry for the processor or ISA given
14052 by CPU_STRING. Return null if the string isn't recognized.
14053
14054 A similar function exists in GAS. */
14055
14056 static const struct mips_cpu_info *
14057 mips_parse_cpu (const char *cpu_string)
14058 {
14059 unsigned int i;
14060 const char *s;
14061
14062 /* In the past, we allowed upper-case CPU names, but it doesn't
14063 work well with the multilib machinery. */
14064 for (s = cpu_string; *s != 0; s++)
14065 if (ISUPPER (*s))
14066 {
14067 warning (0, "CPU names must be lower case");
14068 break;
14069 }
14070
14071 /* 'from-abi' selects the most compatible architecture for the given
14072 ABI: MIPS I for 32-bit ABIs and MIPS III for 64-bit ABIs. For the
14073 EABIs, we have to decide whether we're using the 32-bit or 64-bit
14074 version. */
14075 if (strcasecmp (cpu_string, "from-abi") == 0)
14076 return mips_cpu_info_from_isa (ABI_NEEDS_32BIT_REGS ? 1
14077 : ABI_NEEDS_64BIT_REGS ? 3
14078 : (TARGET_64BIT ? 3 : 1));
14079
14080 /* 'default' has traditionally been a no-op. Probably not very useful. */
14081 if (strcasecmp (cpu_string, "default") == 0)
14082 return NULL;
14083
14084 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
14085 if (mips_matching_cpu_name_p (mips_cpu_info_table[i].name, cpu_string))
14086 return mips_cpu_info_table + i;
14087
14088 return NULL;
14089 }
14090
14091 /* Set up globals to generate code for the ISA or processor
14092 described by INFO. */
14093
14094 static void
14095 mips_set_architecture (const struct mips_cpu_info *info)
14096 {
14097 if (info != 0)
14098 {
14099 mips_arch_info = info;
14100 mips_arch = info->cpu;
14101 mips_isa = info->isa;
14102 }
14103 }
14104
14105 /* Likewise for tuning. */
14106
14107 static void
14108 mips_set_tune (const struct mips_cpu_info *info)
14109 {
14110 if (info != 0)
14111 {
14112 mips_tune_info = info;
14113 mips_tune = info->cpu;
14114 }
14115 }
14116
14117 /* Implement TARGET_HANDLE_OPTION. */
14118
14119 static bool
14120 mips_handle_option (size_t code, const char *arg, int value ATTRIBUTE_UNUSED)
14121 {
14122 switch (code)
14123 {
14124 case OPT_mabi_:
14125 if (strcmp (arg, "32") == 0)
14126 mips_abi = ABI_32;
14127 else if (strcmp (arg, "o64") == 0)
14128 mips_abi = ABI_O64;
14129 else if (strcmp (arg, "n32") == 0)
14130 mips_abi = ABI_N32;
14131 else if (strcmp (arg, "64") == 0)
14132 mips_abi = ABI_64;
14133 else if (strcmp (arg, "eabi") == 0)
14134 mips_abi = ABI_EABI;
14135 else
14136 return false;
14137 return true;
14138
14139 case OPT_march_:
14140 case OPT_mtune_:
14141 return mips_parse_cpu (arg) != 0;
14142
14143 case OPT_mips:
14144 mips_isa_option_info = mips_parse_cpu (ACONCAT (("mips", arg, NULL)));
14145 return mips_isa_option_info != 0;
14146
14147 case OPT_mno_flush_func:
14148 mips_cache_flush_func = NULL;
14149 return true;
14150
14151 case OPT_mcode_readable_:
14152 if (strcmp (arg, "yes") == 0)
14153 mips_code_readable = CODE_READABLE_YES;
14154 else if (strcmp (arg, "pcrel") == 0)
14155 mips_code_readable = CODE_READABLE_PCREL;
14156 else if (strcmp (arg, "no") == 0)
14157 mips_code_readable = CODE_READABLE_NO;
14158 else
14159 return false;
14160 return true;
14161
14162 case OPT_mr10k_cache_barrier_:
14163 if (strcmp (arg, "load-store") == 0)
14164 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_LOAD_STORE;
14165 else if (strcmp (arg, "store") == 0)
14166 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_STORE;
14167 else if (strcmp (arg, "none") == 0)
14168 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE;
14169 else
14170 return false;
14171 return true;
14172
14173 default:
14174 return true;
14175 }
14176 }
14177
14178 /* Implement OVERRIDE_OPTIONS. */
14179
14180 void
14181 mips_override_options (void)
14182 {
14183 int i, start, regno, mode;
14184
14185 /* Process flags as though we were generating non-MIPS16 code. */
14186 mips_base_mips16 = TARGET_MIPS16;
14187 target_flags &= ~MASK_MIPS16;
14188
14189 #ifdef SUBTARGET_OVERRIDE_OPTIONS
14190 SUBTARGET_OVERRIDE_OPTIONS;
14191 #endif
14192
14193 /* Set the small data limit. */
14194 mips_small_data_threshold = (g_switch_set
14195 ? g_switch_value
14196 : MIPS_DEFAULT_GVALUE);
14197
14198 /* The following code determines the architecture and register size.
14199 Similar code was added to GAS 2.14 (see tc-mips.c:md_after_parse_args()).
14200 The GAS and GCC code should be kept in sync as much as possible. */
14201
14202 if (mips_arch_string != 0)
14203 mips_set_architecture (mips_parse_cpu (mips_arch_string));
14204
14205 if (mips_isa_option_info != 0)
14206 {
14207 if (mips_arch_info == 0)
14208 mips_set_architecture (mips_isa_option_info);
14209 else if (mips_arch_info->isa != mips_isa_option_info->isa)
14210 error ("%<-%s%> conflicts with the other architecture options, "
14211 "which specify a %s processor",
14212 mips_isa_option_info->name,
14213 mips_cpu_info_from_isa (mips_arch_info->isa)->name);
14214 }
14215
14216 if (mips_arch_info == 0)
14217 {
14218 #ifdef MIPS_CPU_STRING_DEFAULT
14219 mips_set_architecture (mips_parse_cpu (MIPS_CPU_STRING_DEFAULT));
14220 #else
14221 mips_set_architecture (mips_cpu_info_from_isa (MIPS_ISA_DEFAULT));
14222 #endif
14223 }
14224
14225 if (ABI_NEEDS_64BIT_REGS && !ISA_HAS_64BIT_REGS)
14226 error ("%<-march=%s%> is not compatible with the selected ABI",
14227 mips_arch_info->name);
14228
14229 /* Optimize for mips_arch, unless -mtune selects a different processor. */
14230 if (mips_tune_string != 0)
14231 mips_set_tune (mips_parse_cpu (mips_tune_string));
14232
14233 if (mips_tune_info == 0)
14234 mips_set_tune (mips_arch_info);
14235
14236 if ((target_flags_explicit & MASK_64BIT) != 0)
14237 {
14238 /* The user specified the size of the integer registers. Make sure
14239 it agrees with the ABI and ISA. */
14240 if (TARGET_64BIT && !ISA_HAS_64BIT_REGS)
14241 error ("%<-mgp64%> used with a 32-bit processor");
14242 else if (!TARGET_64BIT && ABI_NEEDS_64BIT_REGS)
14243 error ("%<-mgp32%> used with a 64-bit ABI");
14244 else if (TARGET_64BIT && ABI_NEEDS_32BIT_REGS)
14245 error ("%<-mgp64%> used with a 32-bit ABI");
14246 }
14247 else
14248 {
14249 /* Infer the integer register size from the ABI and processor.
14250 Restrict ourselves to 32-bit registers if that's all the
14251 processor has, or if the ABI cannot handle 64-bit registers. */
14252 if (ABI_NEEDS_32BIT_REGS || !ISA_HAS_64BIT_REGS)
14253 target_flags &= ~MASK_64BIT;
14254 else
14255 target_flags |= MASK_64BIT;
14256 }
14257
14258 if ((target_flags_explicit & MASK_FLOAT64) != 0)
14259 {
14260 if (TARGET_SINGLE_FLOAT && TARGET_FLOAT64)
14261 error ("unsupported combination: %s", "-mfp64 -msingle-float");
14262 else if (TARGET_64BIT && TARGET_DOUBLE_FLOAT && !TARGET_FLOAT64)
14263 error ("unsupported combination: %s", "-mgp64 -mfp32 -mdouble-float");
14264 else if (!TARGET_64BIT && TARGET_FLOAT64)
14265 {
14266 if (!ISA_HAS_MXHC1)
14267 error ("%<-mgp32%> and %<-mfp64%> can only be combined if"
14268 " the target supports the mfhc1 and mthc1 instructions");
14269 else if (mips_abi != ABI_32)
14270 error ("%<-mgp32%> and %<-mfp64%> can only be combined when using"
14271 " the o32 ABI");
14272 }
14273 }
14274 else
14275 {
14276 /* -msingle-float selects 32-bit float registers. Otherwise the
14277 float registers should be the same size as the integer ones. */
14278 if (TARGET_64BIT && TARGET_DOUBLE_FLOAT)
14279 target_flags |= MASK_FLOAT64;
14280 else
14281 target_flags &= ~MASK_FLOAT64;
14282 }
14283
14284 /* End of code shared with GAS. */
14285
14286 /* If no -mlong* option was given, infer it from the other options. */
14287 if ((target_flags_explicit & MASK_LONG64) == 0)
14288 {
14289 if ((mips_abi == ABI_EABI && TARGET_64BIT) || mips_abi == ABI_64)
14290 target_flags |= MASK_LONG64;
14291 else
14292 target_flags &= ~MASK_LONG64;
14293 }
14294
14295 if (!TARGET_OLDABI)
14296 flag_pcc_struct_return = 0;
14297
14298 /* Decide which rtx_costs structure to use. */
14299 if (optimize_size)
14300 mips_cost = &mips_rtx_cost_optimize_size;
14301 else
14302 mips_cost = &mips_rtx_cost_data[mips_tune];
14303
14304 /* If the user hasn't specified a branch cost, use the processor's
14305 default. */
14306 if (mips_branch_cost == 0)
14307 mips_branch_cost = mips_cost->branch_cost;
14308
14309 /* If neither -mbranch-likely nor -mno-branch-likely was given
14310 on the command line, set MASK_BRANCHLIKELY based on the target
14311 architecture and tuning flags. Annulled delay slots are a
14312 size win, so we only consider the processor-specific tuning
14313 for !optimize_size. */
14314 if ((target_flags_explicit & MASK_BRANCHLIKELY) == 0)
14315 {
14316 if (ISA_HAS_BRANCHLIKELY
14317 && (optimize_size
14318 || (mips_tune_info->tune_flags & PTF_AVOID_BRANCHLIKELY) == 0))
14319 target_flags |= MASK_BRANCHLIKELY;
14320 else
14321 target_flags &= ~MASK_BRANCHLIKELY;
14322 }
14323 else if (TARGET_BRANCHLIKELY && !ISA_HAS_BRANCHLIKELY)
14324 warning (0, "the %qs architecture does not support branch-likely"
14325 " instructions", mips_arch_info->name);
14326
14327 /* The effect of -mabicalls isn't defined for the EABI. */
14328 if (mips_abi == ABI_EABI && TARGET_ABICALLS)
14329 {
14330 error ("unsupported combination: %s", "-mabicalls -mabi=eabi");
14331 target_flags &= ~MASK_ABICALLS;
14332 }
14333
14334 if (TARGET_ABICALLS_PIC2)
14335 /* We need to set flag_pic for executables as well as DSOs
14336 because we may reference symbols that are not defined in
14337 the final executable. (MIPS does not use things like
14338 copy relocs, for example.)
14339
14340 There is a body of code that uses __PIC__ to distinguish
14341 between -mabicalls and -mno-abicalls code. The non-__PIC__
14342 variant is usually appropriate for TARGET_ABICALLS_PIC0, as
14343 long as any indirect jumps use $25. */
14344 flag_pic = 1;
14345
14346 /* -mvr4130-align is a "speed over size" optimization: it usually produces
14347 faster code, but at the expense of more nops. Enable it at -O3 and
14348 above. */
14349 if (optimize > 2 && (target_flags_explicit & MASK_VR4130_ALIGN) == 0)
14350 target_flags |= MASK_VR4130_ALIGN;
14351
14352 /* Prefer a call to memcpy over inline code when optimizing for size,
14353 though see MOVE_RATIO in mips.h. */
14354 if (optimize_size && (target_flags_explicit & MASK_MEMCPY) == 0)
14355 target_flags |= MASK_MEMCPY;
14356
14357 /* If we have a nonzero small-data limit, check that the -mgpopt
14358 setting is consistent with the other target flags. */
14359 if (mips_small_data_threshold > 0)
14360 {
14361 if (!TARGET_GPOPT)
14362 {
14363 if (!TARGET_EXPLICIT_RELOCS)
14364 error ("%<-mno-gpopt%> needs %<-mexplicit-relocs%>");
14365
14366 TARGET_LOCAL_SDATA = false;
14367 TARGET_EXTERN_SDATA = false;
14368 }
14369 else
14370 {
14371 if (TARGET_VXWORKS_RTP)
14372 warning (0, "cannot use small-data accesses for %qs", "-mrtp");
14373
14374 if (TARGET_ABICALLS)
14375 warning (0, "cannot use small-data accesses for %qs",
14376 "-mabicalls");
14377 }
14378 }
14379
14380 #ifdef MIPS_TFMODE_FORMAT
14381 REAL_MODE_FORMAT (TFmode) = &MIPS_TFMODE_FORMAT;
14382 #endif
14383
14384 /* Make sure that the user didn't turn off paired single support when
14385 MIPS-3D support is requested. */
14386 if (TARGET_MIPS3D
14387 && (target_flags_explicit & MASK_PAIRED_SINGLE_FLOAT)
14388 && !TARGET_PAIRED_SINGLE_FLOAT)
14389 error ("%<-mips3d%> requires %<-mpaired-single%>");
14390
14391 /* If TARGET_MIPS3D, enable MASK_PAIRED_SINGLE_FLOAT. */
14392 if (TARGET_MIPS3D)
14393 target_flags |= MASK_PAIRED_SINGLE_FLOAT;
14394
14395 /* Make sure that when TARGET_PAIRED_SINGLE_FLOAT is true, TARGET_FLOAT64
14396 and TARGET_HARD_FLOAT_ABI are both true. */
14397 if (TARGET_PAIRED_SINGLE_FLOAT && !(TARGET_FLOAT64 && TARGET_HARD_FLOAT_ABI))
14398 error ("%qs must be used with %qs",
14399 TARGET_MIPS3D ? "-mips3d" : "-mpaired-single",
14400 TARGET_HARD_FLOAT_ABI ? "-mfp64" : "-mhard-float");
14401
14402 /* Make sure that the ISA supports TARGET_PAIRED_SINGLE_FLOAT when it is
14403 enabled. */
14404 if (TARGET_PAIRED_SINGLE_FLOAT && !ISA_HAS_PAIRED_SINGLE)
14405 warning (0, "the %qs architecture does not support paired-single"
14406 " instructions", mips_arch_info->name);
14407
14408 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE
14409 && !TARGET_CACHE_BUILTIN)
14410 {
14411 error ("%qs requires a target that provides the %qs instruction",
14412 "-mr10k-cache-barrier", "cache");
14413 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE;
14414 }
14415
14416 /* If TARGET_DSPR2, enable MASK_DSP. */
14417 if (TARGET_DSPR2)
14418 target_flags |= MASK_DSP;
14419
14420 /* .eh_frame addresses should be the same width as a C pointer.
14421 Most MIPS ABIs support only one pointer size, so the assembler
14422 will usually know exactly how big an .eh_frame address is.
14423
14424 Unfortunately, this is not true of the 64-bit EABI. The ABI was
14425 originally defined to use 64-bit pointers (i.e. it is LP64), and
14426 this is still the default mode. However, we also support an n32-like
14427 ILP32 mode, which is selected by -mlong32. The problem is that the
14428 assembler has traditionally not had an -mlong option, so it has
14429 traditionally not known whether we're using the ILP32 or LP64 form.
14430
14431 As it happens, gas versions up to and including 2.19 use _32-bit_
14432 addresses for EABI64 .cfi_* directives. This is wrong for the
14433 default LP64 mode, so we can't use the directives by default.
14434 Moreover, since gas's current behavior is at odds with gcc's
14435 default behavior, it seems unwise to rely on future versions
14436 of gas behaving the same way. We therefore avoid using .cfi
14437 directives for -mlong32 as well. */
14438 if (mips_abi == ABI_EABI && TARGET_64BIT)
14439 flag_dwarf2_cfi_asm = 0;
14440
14441 mips_init_print_operand_punct ();
14442
14443 /* Set up array to map GCC register number to debug register number.
14444 Ignore the special purpose register numbers. */
14445
14446 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
14447 {
14448 mips_dbx_regno[i] = INVALID_REGNUM;
14449 if (GP_REG_P (i) || FP_REG_P (i) || ALL_COP_REG_P (i))
14450 mips_dwarf_regno[i] = i;
14451 else
14452 mips_dwarf_regno[i] = INVALID_REGNUM;
14453 }
14454
14455 start = GP_DBX_FIRST - GP_REG_FIRST;
14456 for (i = GP_REG_FIRST; i <= GP_REG_LAST; i++)
14457 mips_dbx_regno[i] = i + start;
14458
14459 start = FP_DBX_FIRST - FP_REG_FIRST;
14460 for (i = FP_REG_FIRST; i <= FP_REG_LAST; i++)
14461 mips_dbx_regno[i] = i + start;
14462
14463 /* Accumulator debug registers use big-endian ordering. */
14464 mips_dbx_regno[HI_REGNUM] = MD_DBX_FIRST + 0;
14465 mips_dbx_regno[LO_REGNUM] = MD_DBX_FIRST + 1;
14466 mips_dwarf_regno[HI_REGNUM] = MD_REG_FIRST + 0;
14467 mips_dwarf_regno[LO_REGNUM] = MD_REG_FIRST + 1;
14468 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
14469 {
14470 mips_dwarf_regno[i + TARGET_LITTLE_ENDIAN] = i;
14471 mips_dwarf_regno[i + TARGET_BIG_ENDIAN] = i + 1;
14472 }
14473
14474 /* Set up mips_hard_regno_mode_ok. */
14475 for (mode = 0; mode < MAX_MACHINE_MODE; mode++)
14476 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
14477 mips_hard_regno_mode_ok[mode][regno]
14478 = mips_hard_regno_mode_ok_p (regno, (enum machine_mode) mode);
14479
14480 /* Function to allocate machine-dependent function status. */
14481 init_machine_status = &mips_init_machine_status;
14482
14483 /* Default to working around R4000 errata only if the processor
14484 was selected explicitly. */
14485 if ((target_flags_explicit & MASK_FIX_R4000) == 0
14486 && mips_matching_cpu_name_p (mips_arch_info->name, "r4000"))
14487 target_flags |= MASK_FIX_R4000;
14488
14489 /* Default to working around R4400 errata only if the processor
14490 was selected explicitly. */
14491 if ((target_flags_explicit & MASK_FIX_R4400) == 0
14492 && mips_matching_cpu_name_p (mips_arch_info->name, "r4400"))
14493 target_flags |= MASK_FIX_R4400;
14494
14495 /* Default to working around R10000 errata only if the processor
14496 was selected explicitly. */
14497 if ((target_flags_explicit & MASK_FIX_R10000) == 0
14498 && mips_matching_cpu_name_p (mips_arch_info->name, "r10000"))
14499 target_flags |= MASK_FIX_R10000;
14500
14501 /* Make sure that branch-likely instructions available when using
14502 -mfix-r10000. The instructions are not available if either:
14503
14504 1. -mno-branch-likely was passed.
14505 2. The selected ISA does not support branch-likely and
14506 the command line does not include -mbranch-likely. */
14507 if (TARGET_FIX_R10000
14508 && ((target_flags_explicit & MASK_BRANCHLIKELY) == 0
14509 ? !ISA_HAS_BRANCHLIKELY
14510 : !TARGET_BRANCHLIKELY))
14511 sorry ("%qs requires branch-likely instructions", "-mfix-r10000");
14512
14513 /* Save base state of options. */
14514 mips_base_target_flags = target_flags;
14515 mips_base_schedule_insns = flag_schedule_insns;
14516 mips_base_reorder_blocks_and_partition = flag_reorder_blocks_and_partition;
14517 mips_base_move_loop_invariants = flag_move_loop_invariants;
14518 mips_base_align_loops = align_loops;
14519 mips_base_align_jumps = align_jumps;
14520 mips_base_align_functions = align_functions;
14521
14522 /* Now select the ISA mode.
14523
14524 Do all CPP-sensitive stuff in non-MIPS16 mode; we'll switch to
14525 MIPS16 mode afterwards if need be. */
14526 mips_set_mips16_mode (false);
14527 }
14528
14529 /* Swap the register information for registers I and I + 1, which
14530 currently have the wrong endianness. Note that the registers'
14531 fixedness and call-clobberedness might have been set on the
14532 command line. */
14533
14534 static void
14535 mips_swap_registers (unsigned int i)
14536 {
14537 int tmpi;
14538 const char *tmps;
14539
14540 #define SWAP_INT(X, Y) (tmpi = (X), (X) = (Y), (Y) = tmpi)
14541 #define SWAP_STRING(X, Y) (tmps = (X), (X) = (Y), (Y) = tmps)
14542
14543 SWAP_INT (fixed_regs[i], fixed_regs[i + 1]);
14544 SWAP_INT (call_used_regs[i], call_used_regs[i + 1]);
14545 SWAP_INT (call_really_used_regs[i], call_really_used_regs[i + 1]);
14546 SWAP_STRING (reg_names[i], reg_names[i + 1]);
14547
14548 #undef SWAP_STRING
14549 #undef SWAP_INT
14550 }
14551
14552 /* Implement CONDITIONAL_REGISTER_USAGE. */
14553
14554 void
14555 mips_conditional_register_usage (void)
14556 {
14557
14558 if (ISA_HAS_DSP)
14559 {
14560 /* These DSP control register fields are global. */
14561 global_regs[CCDSP_PO_REGNUM] = 1;
14562 global_regs[CCDSP_SC_REGNUM] = 1;
14563 }
14564 else
14565 {
14566 int regno;
14567
14568 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++)
14569 fixed_regs[regno] = call_used_regs[regno] = 1;
14570 }
14571 if (!TARGET_HARD_FLOAT)
14572 {
14573 int regno;
14574
14575 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno++)
14576 fixed_regs[regno] = call_used_regs[regno] = 1;
14577 for (regno = ST_REG_FIRST; regno <= ST_REG_LAST; regno++)
14578 fixed_regs[regno] = call_used_regs[regno] = 1;
14579 }
14580 else if (! ISA_HAS_8CC)
14581 {
14582 int regno;
14583
14584 /* We only have a single condition-code register. We implement
14585 this by fixing all the condition-code registers and generating
14586 RTL that refers directly to ST_REG_FIRST. */
14587 for (regno = ST_REG_FIRST; regno <= ST_REG_LAST; regno++)
14588 fixed_regs[regno] = call_used_regs[regno] = 1;
14589 }
14590 /* In MIPS16 mode, we permit the $t temporary registers to be used
14591 for reload. We prohibit the unused $s registers, since they
14592 are call-saved, and saving them via a MIPS16 register would
14593 probably waste more time than just reloading the value. */
14594 if (TARGET_MIPS16)
14595 {
14596 fixed_regs[18] = call_used_regs[18] = 1;
14597 fixed_regs[19] = call_used_regs[19] = 1;
14598 fixed_regs[20] = call_used_regs[20] = 1;
14599 fixed_regs[21] = call_used_regs[21] = 1;
14600 fixed_regs[22] = call_used_regs[22] = 1;
14601 fixed_regs[23] = call_used_regs[23] = 1;
14602 fixed_regs[26] = call_used_regs[26] = 1;
14603 fixed_regs[27] = call_used_regs[27] = 1;
14604 fixed_regs[30] = call_used_regs[30] = 1;
14605 }
14606 /* $f20-$f23 are call-clobbered for n64. */
14607 if (mips_abi == ABI_64)
14608 {
14609 int regno;
14610 for (regno = FP_REG_FIRST + 20; regno < FP_REG_FIRST + 24; regno++)
14611 call_really_used_regs[regno] = call_used_regs[regno] = 1;
14612 }
14613 /* Odd registers in the range $f21-$f31 (inclusive) are call-clobbered
14614 for n32. */
14615 if (mips_abi == ABI_N32)
14616 {
14617 int regno;
14618 for (regno = FP_REG_FIRST + 21; regno <= FP_REG_FIRST + 31; regno+=2)
14619 call_really_used_regs[regno] = call_used_regs[regno] = 1;
14620 }
14621 /* Make sure that double-register accumulator values are correctly
14622 ordered for the current endianness. */
14623 if (TARGET_LITTLE_ENDIAN)
14624 {
14625 unsigned int regno;
14626
14627 mips_swap_registers (MD_REG_FIRST);
14628 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno += 2)
14629 mips_swap_registers (regno);
14630 }
14631 }
14632
14633 /* Initialize vector TARGET to VALS. */
14634
14635 void
14636 mips_expand_vector_init (rtx target, rtx vals)
14637 {
14638 enum machine_mode mode;
14639 enum machine_mode inner;
14640 unsigned int i, n_elts;
14641 rtx mem;
14642
14643 mode = GET_MODE (target);
14644 inner = GET_MODE_INNER (mode);
14645 n_elts = GET_MODE_NUNITS (mode);
14646
14647 gcc_assert (VECTOR_MODE_P (mode));
14648
14649 mem = assign_stack_temp (mode, GET_MODE_SIZE (mode), 0);
14650 for (i = 0; i < n_elts; i++)
14651 emit_move_insn (adjust_address_nv (mem, inner, i * GET_MODE_SIZE (inner)),
14652 XVECEXP (vals, 0, i));
14653
14654 emit_move_insn (target, mem);
14655 }
14656
14657 /* When generating MIPS16 code, we want to allocate $24 (T_REG) before
14658 other registers for instructions for which it is possible. This
14659 encourages the compiler to use CMP in cases where an XOR would
14660 require some register shuffling. */
14661
14662 void
14663 mips_order_regs_for_local_alloc (void)
14664 {
14665 int i;
14666
14667 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
14668 reg_alloc_order[i] = i;
14669
14670 if (TARGET_MIPS16)
14671 {
14672 /* It really doesn't matter where we put register 0, since it is
14673 a fixed register anyhow. */
14674 reg_alloc_order[0] = 24;
14675 reg_alloc_order[24] = 0;
14676 }
14677 }
14678
14679 /* Implement EPILOGUE_USES. */
14680
14681 bool
14682 mips_epilogue_uses (unsigned int regno)
14683 {
14684 /* Say that the epilogue uses the return address register. Note that
14685 in the case of sibcalls, the values "used by the epilogue" are
14686 considered live at the start of the called function. */
14687 if (regno == 31)
14688 return true;
14689
14690 /* If using a GOT, say that the epilogue also uses GOT_VERSION_REGNUM.
14691 See the comment above load_call<mode> for details. */
14692 if (TARGET_USE_GOT && (regno) == GOT_VERSION_REGNUM)
14693 return true;
14694
14695 /* An interrupt handler must preserve some registers that are
14696 ordinarily call-clobbered. */
14697 if (cfun->machine->interrupt_handler_p
14698 && mips_interrupt_extra_call_saved_reg_p (regno))
14699 return true;
14700
14701 return false;
14702 }
14703
14704 /* A for_each_rtx callback. Stop the search if *X is an AT register. */
14705
14706 static int
14707 mips_at_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
14708 {
14709 return GET_CODE (*x) == REG && REGNO (*x) == AT_REGNUM;
14710 }
14711
14712
14713 /* Implement FINAL_PRESCAN_INSN. */
14714
14715 void
14716 mips_final_prescan_insn (rtx insn, rtx *opvec, int noperands)
14717 {
14718 int i;
14719
14720 /* We need to emit ".set noat" before an instruction that accesses
14721 $1 (AT). */
14722 if (recog_memoized (insn) >= 0)
14723 for (i = 0; i < noperands; i++)
14724 if (for_each_rtx (&opvec[i], mips_at_reg_p, NULL))
14725 if (set_noat++ == 0)
14726 fprintf (asm_out_file, "\t.set\tnoat\n");
14727 }
14728
14729 /* Implement TARGET_ASM_FINAL_POSTSCAN_INSN. */
14730
14731 static void
14732 mips_final_postscan_insn (FILE *file, rtx insn, rtx *opvec, int noperands)
14733 {
14734 int i;
14735
14736 /* Close any ".set noat" block opened by mips_final_prescan_insn. */
14737 if (recog_memoized (insn) >= 0)
14738 for (i = 0; i < noperands; i++)
14739 if (for_each_rtx (&opvec[i], mips_at_reg_p, NULL))
14740 if (--set_noat == 0)
14741 fprintf (file, "\t.set\tat\n");
14742 }
14743 \f
14744 /* Initialize the GCC target structure. */
14745 #undef TARGET_ASM_ALIGNED_HI_OP
14746 #define TARGET_ASM_ALIGNED_HI_OP "\t.half\t"
14747 #undef TARGET_ASM_ALIGNED_SI_OP
14748 #define TARGET_ASM_ALIGNED_SI_OP "\t.word\t"
14749 #undef TARGET_ASM_ALIGNED_DI_OP
14750 #define TARGET_ASM_ALIGNED_DI_OP "\t.dword\t"
14751
14752 #undef TARGET_LEGITIMIZE_ADDRESS
14753 #define TARGET_LEGITIMIZE_ADDRESS mips_legitimize_address
14754
14755 #undef TARGET_ASM_FUNCTION_PROLOGUE
14756 #define TARGET_ASM_FUNCTION_PROLOGUE mips_output_function_prologue
14757 #undef TARGET_ASM_FUNCTION_EPILOGUE
14758 #define TARGET_ASM_FUNCTION_EPILOGUE mips_output_function_epilogue
14759 #undef TARGET_ASM_SELECT_RTX_SECTION
14760 #define TARGET_ASM_SELECT_RTX_SECTION mips_select_rtx_section
14761 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
14762 #define TARGET_ASM_FUNCTION_RODATA_SECTION mips_function_rodata_section
14763
14764 #undef TARGET_SCHED_INIT
14765 #define TARGET_SCHED_INIT mips_sched_init
14766 #undef TARGET_SCHED_REORDER
14767 #define TARGET_SCHED_REORDER mips_sched_reorder
14768 #undef TARGET_SCHED_REORDER2
14769 #define TARGET_SCHED_REORDER2 mips_sched_reorder
14770 #undef TARGET_SCHED_VARIABLE_ISSUE
14771 #define TARGET_SCHED_VARIABLE_ISSUE mips_variable_issue
14772 #undef TARGET_SCHED_ADJUST_COST
14773 #define TARGET_SCHED_ADJUST_COST mips_adjust_cost
14774 #undef TARGET_SCHED_ISSUE_RATE
14775 #define TARGET_SCHED_ISSUE_RATE mips_issue_rate
14776 #undef TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN
14777 #define TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN mips_init_dfa_post_cycle_insn
14778 #undef TARGET_SCHED_DFA_POST_ADVANCE_CYCLE
14779 #define TARGET_SCHED_DFA_POST_ADVANCE_CYCLE mips_dfa_post_advance_cycle
14780 #undef TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD
14781 #define TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD \
14782 mips_multipass_dfa_lookahead
14783
14784 #undef TARGET_DEFAULT_TARGET_FLAGS
14785 #define TARGET_DEFAULT_TARGET_FLAGS \
14786 (TARGET_DEFAULT \
14787 | TARGET_CPU_DEFAULT \
14788 | TARGET_ENDIAN_DEFAULT \
14789 | TARGET_FP_EXCEPTIONS_DEFAULT \
14790 | MASK_CHECK_ZERO_DIV \
14791 | MASK_FUSED_MADD)
14792 #undef TARGET_HANDLE_OPTION
14793 #define TARGET_HANDLE_OPTION mips_handle_option
14794
14795 #undef TARGET_FUNCTION_OK_FOR_SIBCALL
14796 #define TARGET_FUNCTION_OK_FOR_SIBCALL mips_function_ok_for_sibcall
14797
14798 #undef TARGET_INSERT_ATTRIBUTES
14799 #define TARGET_INSERT_ATTRIBUTES mips_insert_attributes
14800 #undef TARGET_MERGE_DECL_ATTRIBUTES
14801 #define TARGET_MERGE_DECL_ATTRIBUTES mips_merge_decl_attributes
14802 #undef TARGET_SET_CURRENT_FUNCTION
14803 #define TARGET_SET_CURRENT_FUNCTION mips_set_current_function
14804
14805 #undef TARGET_VALID_POINTER_MODE
14806 #define TARGET_VALID_POINTER_MODE mips_valid_pointer_mode
14807 #undef TARGET_RTX_COSTS
14808 #define TARGET_RTX_COSTS mips_rtx_costs
14809 #undef TARGET_ADDRESS_COST
14810 #define TARGET_ADDRESS_COST mips_address_cost
14811
14812 #undef TARGET_IN_SMALL_DATA_P
14813 #define TARGET_IN_SMALL_DATA_P mips_in_small_data_p
14814
14815 #undef TARGET_MACHINE_DEPENDENT_REORG
14816 #define TARGET_MACHINE_DEPENDENT_REORG mips_reorg
14817
14818 #undef TARGET_ASM_FILE_START
14819 #define TARGET_ASM_FILE_START mips_file_start
14820 #undef TARGET_ASM_FILE_START_FILE_DIRECTIVE
14821 #define TARGET_ASM_FILE_START_FILE_DIRECTIVE true
14822
14823 #undef TARGET_INIT_LIBFUNCS
14824 #define TARGET_INIT_LIBFUNCS mips_init_libfuncs
14825
14826 #undef TARGET_BUILD_BUILTIN_VA_LIST
14827 #define TARGET_BUILD_BUILTIN_VA_LIST mips_build_builtin_va_list
14828 #undef TARGET_EXPAND_BUILTIN_VA_START
14829 #define TARGET_EXPAND_BUILTIN_VA_START mips_va_start
14830 #undef TARGET_GIMPLIFY_VA_ARG_EXPR
14831 #define TARGET_GIMPLIFY_VA_ARG_EXPR mips_gimplify_va_arg_expr
14832
14833 #undef TARGET_PROMOTE_FUNCTION_ARGS
14834 #define TARGET_PROMOTE_FUNCTION_ARGS hook_bool_const_tree_true
14835 #undef TARGET_PROMOTE_FUNCTION_RETURN
14836 #define TARGET_PROMOTE_FUNCTION_RETURN hook_bool_const_tree_true
14837 #undef TARGET_PROMOTE_PROTOTYPES
14838 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
14839
14840 #undef TARGET_RETURN_IN_MEMORY
14841 #define TARGET_RETURN_IN_MEMORY mips_return_in_memory
14842 #undef TARGET_RETURN_IN_MSB
14843 #define TARGET_RETURN_IN_MSB mips_return_in_msb
14844
14845 #undef TARGET_ASM_OUTPUT_MI_THUNK
14846 #define TARGET_ASM_OUTPUT_MI_THUNK mips_output_mi_thunk
14847 #undef TARGET_ASM_CAN_OUTPUT_MI_THUNK
14848 #define TARGET_ASM_CAN_OUTPUT_MI_THUNK hook_bool_const_tree_hwi_hwi_const_tree_true
14849
14850 #undef TARGET_SETUP_INCOMING_VARARGS
14851 #define TARGET_SETUP_INCOMING_VARARGS mips_setup_incoming_varargs
14852 #undef TARGET_STRICT_ARGUMENT_NAMING
14853 #define TARGET_STRICT_ARGUMENT_NAMING mips_strict_argument_naming
14854 #undef TARGET_MUST_PASS_IN_STACK
14855 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
14856 #undef TARGET_PASS_BY_REFERENCE
14857 #define TARGET_PASS_BY_REFERENCE mips_pass_by_reference
14858 #undef TARGET_CALLEE_COPIES
14859 #define TARGET_CALLEE_COPIES mips_callee_copies
14860 #undef TARGET_ARG_PARTIAL_BYTES
14861 #define TARGET_ARG_PARTIAL_BYTES mips_arg_partial_bytes
14862
14863 #undef TARGET_MODE_REP_EXTENDED
14864 #define TARGET_MODE_REP_EXTENDED mips_mode_rep_extended
14865
14866 #undef TARGET_VECTOR_MODE_SUPPORTED_P
14867 #define TARGET_VECTOR_MODE_SUPPORTED_P mips_vector_mode_supported_p
14868
14869 #undef TARGET_SCALAR_MODE_SUPPORTED_P
14870 #define TARGET_SCALAR_MODE_SUPPORTED_P mips_scalar_mode_supported_p
14871
14872 #undef TARGET_INIT_BUILTINS
14873 #define TARGET_INIT_BUILTINS mips_init_builtins
14874 #undef TARGET_EXPAND_BUILTIN
14875 #define TARGET_EXPAND_BUILTIN mips_expand_builtin
14876
14877 #undef TARGET_HAVE_TLS
14878 #define TARGET_HAVE_TLS HAVE_AS_TLS
14879
14880 #undef TARGET_CANNOT_FORCE_CONST_MEM
14881 #define TARGET_CANNOT_FORCE_CONST_MEM mips_cannot_force_const_mem
14882
14883 #undef TARGET_ENCODE_SECTION_INFO
14884 #define TARGET_ENCODE_SECTION_INFO mips_encode_section_info
14885
14886 #undef TARGET_ATTRIBUTE_TABLE
14887 #define TARGET_ATTRIBUTE_TABLE mips_attribute_table
14888 /* All our function attributes are related to how out-of-line copies should
14889 be compiled or called. They don't in themselves prevent inlining. */
14890 #undef TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P
14891 #define TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P hook_bool_const_tree_true
14892
14893 #undef TARGET_EXTRA_LIVE_ON_ENTRY
14894 #define TARGET_EXTRA_LIVE_ON_ENTRY mips_extra_live_on_entry
14895
14896 #undef TARGET_USE_BLOCKS_FOR_CONSTANT_P
14897 #define TARGET_USE_BLOCKS_FOR_CONSTANT_P mips_use_blocks_for_constant_p
14898 #undef TARGET_USE_ANCHORS_FOR_SYMBOL_P
14899 #define TARGET_USE_ANCHORS_FOR_SYMBOL_P mips_use_anchors_for_symbol_p
14900
14901 #undef TARGET_COMP_TYPE_ATTRIBUTES
14902 #define TARGET_COMP_TYPE_ATTRIBUTES mips_comp_type_attributes
14903
14904 #ifdef HAVE_AS_DTPRELWORD
14905 #undef TARGET_ASM_OUTPUT_DWARF_DTPREL
14906 #define TARGET_ASM_OUTPUT_DWARF_DTPREL mips_output_dwarf_dtprel
14907 #endif
14908 #undef TARGET_DWARF_REGISTER_SPAN
14909 #define TARGET_DWARF_REGISTER_SPAN mips_dwarf_register_span
14910
14911 #undef TARGET_IRA_COVER_CLASSES
14912 #define TARGET_IRA_COVER_CLASSES mips_ira_cover_classes
14913
14914 #undef TARGET_ASM_FINAL_POSTSCAN_INSN
14915 #define TARGET_ASM_FINAL_POSTSCAN_INSN mips_final_postscan_insn
14916
14917 #undef TARGET_LEGITIMATE_ADDRESS_P
14918 #define TARGET_LEGITIMATE_ADDRESS_P mips_legitimate_address_p
14919
14920 struct gcc_target targetm = TARGET_INITIALIZER;
14921 \f
14922 #include "gt-mips.h"