mips.c (insert_pass_mips_machine_reorg2): Move into...
[gcc.git] / gcc / config / mips / mips.c
1 /* Subroutines used for MIPS code generation.
2 Copyright (C) 1989-2013 Free Software Foundation, Inc.
3 Contributed by A. Lichnewsky, lich@inria.inria.fr.
4 Changes by Michael Meissner, meissner@osf.org.
5 64-bit r4000 support by Ian Lance Taylor, ian@cygnus.com, and
6 Brendan Eich, brendan@microunity.com.
7
8 This file is part of GCC.
9
10 GCC is free software; you can redistribute it and/or modify
11 it under the terms of the GNU General Public License as published by
12 the Free Software Foundation; either version 3, or (at your option)
13 any later version.
14
15 GCC is distributed in the hope that it will be useful,
16 but WITHOUT ANY WARRANTY; without even the implied warranty of
17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 GNU General Public License for more details.
19
20 You should have received a copy of the GNU General Public License
21 along with GCC; see the file COPYING3. If not see
22 <http://www.gnu.org/licenses/>. */
23
24 #include "config.h"
25 #include "system.h"
26 #include "coretypes.h"
27 #include "tm.h"
28 #include "rtl.h"
29 #include "regs.h"
30 #include "hard-reg-set.h"
31 #include "insn-config.h"
32 #include "conditions.h"
33 #include "insn-attr.h"
34 #include "recog.h"
35 #include "output.h"
36 #include "tree.h"
37 #include "function.h"
38 #include "expr.h"
39 #include "optabs.h"
40 #include "libfuncs.h"
41 #include "flags.h"
42 #include "reload.h"
43 #include "tm_p.h"
44 #include "ggc.h"
45 #include "gstab.h"
46 #include "hash-table.h"
47 #include "debug.h"
48 #include "target.h"
49 #include "target-def.h"
50 #include "common/common-target.h"
51 #include "langhooks.h"
52 #include "sched-int.h"
53 #include "gimple.h"
54 #include "bitmap.h"
55 #include "diagnostic.h"
56 #include "target-globals.h"
57 #include "opts.h"
58 #include "tree-pass.h"
59 #include "context.h"
60
61 /* True if X is an UNSPEC wrapper around a SYMBOL_REF or LABEL_REF. */
62 #define UNSPEC_ADDRESS_P(X) \
63 (GET_CODE (X) == UNSPEC \
64 && XINT (X, 1) >= UNSPEC_ADDRESS_FIRST \
65 && XINT (X, 1) < UNSPEC_ADDRESS_FIRST + NUM_SYMBOL_TYPES)
66
67 /* Extract the symbol or label from UNSPEC wrapper X. */
68 #define UNSPEC_ADDRESS(X) \
69 XVECEXP (X, 0, 0)
70
71 /* Extract the symbol type from UNSPEC wrapper X. */
72 #define UNSPEC_ADDRESS_TYPE(X) \
73 ((enum mips_symbol_type) (XINT (X, 1) - UNSPEC_ADDRESS_FIRST))
74
75 /* The maximum distance between the top of the stack frame and the
76 value $sp has when we save and restore registers.
77
78 The value for normal-mode code must be a SMALL_OPERAND and must
79 preserve the maximum stack alignment. We therefore use a value
80 of 0x7ff0 in this case.
81
82 microMIPS LWM and SWM support 12-bit offsets (from -0x800 to 0x7ff),
83 so we use a maximum of 0x7f0 for TARGET_MICROMIPS.
84
85 MIPS16e SAVE and RESTORE instructions can adjust the stack pointer by
86 up to 0x7f8 bytes and can usually save or restore all the registers
87 that we need to save or restore. (Note that we can only use these
88 instructions for o32, for which the stack alignment is 8 bytes.)
89
90 We use a maximum gap of 0x100 or 0x400 for MIPS16 code when SAVE and
91 RESTORE are not available. We can then use unextended instructions
92 to save and restore registers, and to allocate and deallocate the top
93 part of the frame. */
94 #define MIPS_MAX_FIRST_STACK_STEP \
95 (!TARGET_COMPRESSION ? 0x7ff0 \
96 : TARGET_MICROMIPS || GENERATE_MIPS16E_SAVE_RESTORE ? 0x7f8 \
97 : TARGET_64BIT ? 0x100 : 0x400)
98
99 /* True if INSN is a mips.md pattern or asm statement. */
100 /* ??? This test exists through the compiler, perhaps it should be
101 moved to rtl.h. */
102 #define USEFUL_INSN_P(INSN) \
103 (NONDEBUG_INSN_P (INSN) \
104 && GET_CODE (PATTERN (INSN)) != USE \
105 && GET_CODE (PATTERN (INSN)) != CLOBBER)
106
107 /* If INSN is a delayed branch sequence, return the first instruction
108 in the sequence, otherwise return INSN itself. */
109 #define SEQ_BEGIN(INSN) \
110 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \
111 ? XVECEXP (PATTERN (INSN), 0, 0) \
112 : (INSN))
113
114 /* Likewise for the last instruction in a delayed branch sequence. */
115 #define SEQ_END(INSN) \
116 (INSN_P (INSN) && GET_CODE (PATTERN (INSN)) == SEQUENCE \
117 ? XVECEXP (PATTERN (INSN), 0, XVECLEN (PATTERN (INSN), 0) - 1) \
118 : (INSN))
119
120 /* Execute the following loop body with SUBINSN set to each instruction
121 between SEQ_BEGIN (INSN) and SEQ_END (INSN) inclusive. */
122 #define FOR_EACH_SUBINSN(SUBINSN, INSN) \
123 for ((SUBINSN) = SEQ_BEGIN (INSN); \
124 (SUBINSN) != NEXT_INSN (SEQ_END (INSN)); \
125 (SUBINSN) = NEXT_INSN (SUBINSN))
126
127 /* True if bit BIT is set in VALUE. */
128 #define BITSET_P(VALUE, BIT) (((VALUE) & (1 << (BIT))) != 0)
129
130 /* Return the opcode for a ptr_mode load of the form:
131
132 l[wd] DEST, OFFSET(BASE). */
133 #define MIPS_LOAD_PTR(DEST, OFFSET, BASE) \
134 (((ptr_mode == DImode ? 0x37 : 0x23) << 26) \
135 | ((BASE) << 21) \
136 | ((DEST) << 16) \
137 | (OFFSET))
138
139 /* Return the opcode to move register SRC into register DEST. */
140 #define MIPS_MOVE(DEST, SRC) \
141 ((TARGET_64BIT ? 0x2d : 0x21) \
142 | ((DEST) << 11) \
143 | ((SRC) << 21))
144
145 /* Return the opcode for:
146
147 lui DEST, VALUE. */
148 #define MIPS_LUI(DEST, VALUE) \
149 ((0xf << 26) | ((DEST) << 16) | (VALUE))
150
151 /* Return the opcode to jump to register DEST. */
152 #define MIPS_JR(DEST) \
153 (((DEST) << 21) | 0x8)
154
155 /* Return the opcode for:
156
157 bal . + (1 + OFFSET) * 4. */
158 #define MIPS_BAL(OFFSET) \
159 ((0x1 << 26) | (0x11 << 16) | (OFFSET))
160
161 /* Return the usual opcode for a nop. */
162 #define MIPS_NOP 0
163
164 /* Classifies an address.
165
166 ADDRESS_REG
167 A natural register + offset address. The register satisfies
168 mips_valid_base_register_p and the offset is a const_arith_operand.
169
170 ADDRESS_LO_SUM
171 A LO_SUM rtx. The first operand is a valid base register and
172 the second operand is a symbolic address.
173
174 ADDRESS_CONST_INT
175 A signed 16-bit constant address.
176
177 ADDRESS_SYMBOLIC:
178 A constant symbolic address. */
179 enum mips_address_type {
180 ADDRESS_REG,
181 ADDRESS_LO_SUM,
182 ADDRESS_CONST_INT,
183 ADDRESS_SYMBOLIC
184 };
185
186 /* Macros to create an enumeration identifier for a function prototype. */
187 #define MIPS_FTYPE_NAME1(A, B) MIPS_##A##_FTYPE_##B
188 #define MIPS_FTYPE_NAME2(A, B, C) MIPS_##A##_FTYPE_##B##_##C
189 #define MIPS_FTYPE_NAME3(A, B, C, D) MIPS_##A##_FTYPE_##B##_##C##_##D
190 #define MIPS_FTYPE_NAME4(A, B, C, D, E) MIPS_##A##_FTYPE_##B##_##C##_##D##_##E
191
192 /* Classifies the prototype of a built-in function. */
193 enum mips_function_type {
194 #define DEF_MIPS_FTYPE(NARGS, LIST) MIPS_FTYPE_NAME##NARGS LIST,
195 #include "config/mips/mips-ftypes.def"
196 #undef DEF_MIPS_FTYPE
197 MIPS_MAX_FTYPE_MAX
198 };
199
200 /* Specifies how a built-in function should be converted into rtl. */
201 enum mips_builtin_type {
202 /* The function corresponds directly to an .md pattern. The return
203 value is mapped to operand 0 and the arguments are mapped to
204 operands 1 and above. */
205 MIPS_BUILTIN_DIRECT,
206
207 /* The function corresponds directly to an .md pattern. There is no return
208 value and the arguments are mapped to operands 0 and above. */
209 MIPS_BUILTIN_DIRECT_NO_TARGET,
210
211 /* The function corresponds to a comparison instruction followed by
212 a mips_cond_move_tf_ps pattern. The first two arguments are the
213 values to compare and the second two arguments are the vector
214 operands for the movt.ps or movf.ps instruction (in assembly order). */
215 MIPS_BUILTIN_MOVF,
216 MIPS_BUILTIN_MOVT,
217
218 /* The function corresponds to a V2SF comparison instruction. Operand 0
219 of this instruction is the result of the comparison, which has mode
220 CCV2 or CCV4. The function arguments are mapped to operands 1 and
221 above. The function's return value is an SImode boolean that is
222 true under the following conditions:
223
224 MIPS_BUILTIN_CMP_ANY: one of the registers is true
225 MIPS_BUILTIN_CMP_ALL: all of the registers are true
226 MIPS_BUILTIN_CMP_LOWER: the first register is true
227 MIPS_BUILTIN_CMP_UPPER: the second register is true. */
228 MIPS_BUILTIN_CMP_ANY,
229 MIPS_BUILTIN_CMP_ALL,
230 MIPS_BUILTIN_CMP_UPPER,
231 MIPS_BUILTIN_CMP_LOWER,
232
233 /* As above, but the instruction only sets a single $fcc register. */
234 MIPS_BUILTIN_CMP_SINGLE,
235
236 /* For generating bposge32 branch instructions in MIPS32 DSP ASE. */
237 MIPS_BUILTIN_BPOSGE32
238 };
239
240 /* Invoke MACRO (COND) for each C.cond.fmt condition. */
241 #define MIPS_FP_CONDITIONS(MACRO) \
242 MACRO (f), \
243 MACRO (un), \
244 MACRO (eq), \
245 MACRO (ueq), \
246 MACRO (olt), \
247 MACRO (ult), \
248 MACRO (ole), \
249 MACRO (ule), \
250 MACRO (sf), \
251 MACRO (ngle), \
252 MACRO (seq), \
253 MACRO (ngl), \
254 MACRO (lt), \
255 MACRO (nge), \
256 MACRO (le), \
257 MACRO (ngt)
258
259 /* Enumerates the codes above as MIPS_FP_COND_<X>. */
260 #define DECLARE_MIPS_COND(X) MIPS_FP_COND_ ## X
261 enum mips_fp_condition {
262 MIPS_FP_CONDITIONS (DECLARE_MIPS_COND)
263 };
264
265 /* Index X provides the string representation of MIPS_FP_COND_<X>. */
266 #define STRINGIFY(X) #X
267 static const char *const mips_fp_conditions[] = {
268 MIPS_FP_CONDITIONS (STRINGIFY)
269 };
270
271 /* Tuning information that is automatically derived from other sources
272 (such as the scheduler). */
273 static struct {
274 /* The architecture and tuning settings that this structure describes. */
275 enum processor arch;
276 enum processor tune;
277
278 /* True if this structure describes MIPS16 settings. */
279 bool mips16_p;
280
281 /* True if the structure has been initialized. */
282 bool initialized_p;
283
284 /* True if "MULT $0, $0" is preferable to "MTLO $0; MTHI $0"
285 when optimizing for speed. */
286 bool fast_mult_zero_zero_p;
287 } mips_tuning_info;
288
289 /* Information about a function's frame layout. */
290 struct GTY(()) mips_frame_info {
291 /* The size of the frame in bytes. */
292 HOST_WIDE_INT total_size;
293
294 /* The number of bytes allocated to variables. */
295 HOST_WIDE_INT var_size;
296
297 /* The number of bytes allocated to outgoing function arguments. */
298 HOST_WIDE_INT args_size;
299
300 /* The number of bytes allocated to the .cprestore slot, or 0 if there
301 is no such slot. */
302 HOST_WIDE_INT cprestore_size;
303
304 /* Bit X is set if the function saves or restores GPR X. */
305 unsigned int mask;
306
307 /* Likewise FPR X. */
308 unsigned int fmask;
309
310 /* Likewise doubleword accumulator X ($acX). */
311 unsigned int acc_mask;
312
313 /* The number of GPRs, FPRs, doubleword accumulators and COP0
314 registers saved. */
315 unsigned int num_gp;
316 unsigned int num_fp;
317 unsigned int num_acc;
318 unsigned int num_cop0_regs;
319
320 /* The offset of the topmost GPR, FPR, accumulator and COP0-register
321 save slots from the top of the frame, or zero if no such slots are
322 needed. */
323 HOST_WIDE_INT gp_save_offset;
324 HOST_WIDE_INT fp_save_offset;
325 HOST_WIDE_INT acc_save_offset;
326 HOST_WIDE_INT cop0_save_offset;
327
328 /* Likewise, but giving offsets from the bottom of the frame. */
329 HOST_WIDE_INT gp_sp_offset;
330 HOST_WIDE_INT fp_sp_offset;
331 HOST_WIDE_INT acc_sp_offset;
332 HOST_WIDE_INT cop0_sp_offset;
333
334 /* Similar, but the value passed to _mcount. */
335 HOST_WIDE_INT ra_fp_offset;
336
337 /* The offset of arg_pointer_rtx from the bottom of the frame. */
338 HOST_WIDE_INT arg_pointer_offset;
339
340 /* The offset of hard_frame_pointer_rtx from the bottom of the frame. */
341 HOST_WIDE_INT hard_frame_pointer_offset;
342 };
343
344 struct GTY(()) machine_function {
345 /* The next floating-point condition-code register to allocate
346 for ISA_HAS_8CC targets, relative to ST_REG_FIRST. */
347 unsigned int next_fcc;
348
349 /* The register returned by mips16_gp_pseudo_reg; see there for details. */
350 rtx mips16_gp_pseudo_rtx;
351
352 /* The number of extra stack bytes taken up by register varargs.
353 This area is allocated by the callee at the very top of the frame. */
354 int varargs_size;
355
356 /* The current frame information, calculated by mips_compute_frame_info. */
357 struct mips_frame_info frame;
358
359 /* The register to use as the function's global pointer, or INVALID_REGNUM
360 if the function doesn't need one. */
361 unsigned int global_pointer;
362
363 /* How many instructions it takes to load a label into $AT, or 0 if
364 this property hasn't yet been calculated. */
365 unsigned int load_label_num_insns;
366
367 /* True if mips_adjust_insn_length should ignore an instruction's
368 hazard attribute. */
369 bool ignore_hazard_length_p;
370
371 /* True if the whole function is suitable for .set noreorder and
372 .set nomacro. */
373 bool all_noreorder_p;
374
375 /* True if the function has "inflexible" and "flexible" references
376 to the global pointer. See mips_cfun_has_inflexible_gp_ref_p
377 and mips_cfun_has_flexible_gp_ref_p for details. */
378 bool has_inflexible_gp_insn_p;
379 bool has_flexible_gp_insn_p;
380
381 /* True if the function's prologue must load the global pointer
382 value into pic_offset_table_rtx and store the same value in
383 the function's cprestore slot (if any). Even if this value
384 is currently false, we may decide to set it to true later;
385 see mips_must_initialize_gp_p () for details. */
386 bool must_initialize_gp_p;
387
388 /* True if the current function must restore $gp after any potential
389 clobber. This value is only meaningful during the first post-epilogue
390 split_insns pass; see mips_must_initialize_gp_p () for details. */
391 bool must_restore_gp_when_clobbered_p;
392
393 /* True if this is an interrupt handler. */
394 bool interrupt_handler_p;
395
396 /* True if this is an interrupt handler that uses shadow registers. */
397 bool use_shadow_register_set_p;
398
399 /* True if this is an interrupt handler that should keep interrupts
400 masked. */
401 bool keep_interrupts_masked_p;
402
403 /* True if this is an interrupt handler that should use DERET
404 instead of ERET. */
405 bool use_debug_exception_return_p;
406 };
407
408 /* Information about a single argument. */
409 struct mips_arg_info {
410 /* True if the argument is passed in a floating-point register, or
411 would have been if we hadn't run out of registers. */
412 bool fpr_p;
413
414 /* The number of words passed in registers, rounded up. */
415 unsigned int reg_words;
416
417 /* For EABI, the offset of the first register from GP_ARG_FIRST or
418 FP_ARG_FIRST. For other ABIs, the offset of the first register from
419 the start of the ABI's argument structure (see the CUMULATIVE_ARGS
420 comment for details).
421
422 The value is MAX_ARGS_IN_REGISTERS if the argument is passed entirely
423 on the stack. */
424 unsigned int reg_offset;
425
426 /* The number of words that must be passed on the stack, rounded up. */
427 unsigned int stack_words;
428
429 /* The offset from the start of the stack overflow area of the argument's
430 first stack word. Only meaningful when STACK_WORDS is nonzero. */
431 unsigned int stack_offset;
432 };
433
434 /* Information about an address described by mips_address_type.
435
436 ADDRESS_CONST_INT
437 No fields are used.
438
439 ADDRESS_REG
440 REG is the base register and OFFSET is the constant offset.
441
442 ADDRESS_LO_SUM
443 REG and OFFSET are the operands to the LO_SUM and SYMBOL_TYPE
444 is the type of symbol it references.
445
446 ADDRESS_SYMBOLIC
447 SYMBOL_TYPE is the type of symbol that the address references. */
448 struct mips_address_info {
449 enum mips_address_type type;
450 rtx reg;
451 rtx offset;
452 enum mips_symbol_type symbol_type;
453 };
454
455 /* One stage in a constant building sequence. These sequences have
456 the form:
457
458 A = VALUE[0]
459 A = A CODE[1] VALUE[1]
460 A = A CODE[2] VALUE[2]
461 ...
462
463 where A is an accumulator, each CODE[i] is a binary rtl operation
464 and each VALUE[i] is a constant integer. CODE[0] is undefined. */
465 struct mips_integer_op {
466 enum rtx_code code;
467 unsigned HOST_WIDE_INT value;
468 };
469
470 /* The largest number of operations needed to load an integer constant.
471 The worst accepted case for 64-bit constants is LUI,ORI,SLL,ORI,SLL,ORI.
472 When the lowest bit is clear, we can try, but reject a sequence with
473 an extra SLL at the end. */
474 #define MIPS_MAX_INTEGER_OPS 7
475
476 /* Information about a MIPS16e SAVE or RESTORE instruction. */
477 struct mips16e_save_restore_info {
478 /* The number of argument registers saved by a SAVE instruction.
479 0 for RESTORE instructions. */
480 unsigned int nargs;
481
482 /* Bit X is set if the instruction saves or restores GPR X. */
483 unsigned int mask;
484
485 /* The total number of bytes to allocate. */
486 HOST_WIDE_INT size;
487 };
488
489 /* Costs of various operations on the different architectures. */
490
491 struct mips_rtx_cost_data
492 {
493 unsigned short fp_add;
494 unsigned short fp_mult_sf;
495 unsigned short fp_mult_df;
496 unsigned short fp_div_sf;
497 unsigned short fp_div_df;
498 unsigned short int_mult_si;
499 unsigned short int_mult_di;
500 unsigned short int_div_si;
501 unsigned short int_div_di;
502 unsigned short branch_cost;
503 unsigned short memory_latency;
504 };
505
506 /* Global variables for machine-dependent things. */
507
508 /* The -G setting, or the configuration's default small-data limit if
509 no -G option is given. */
510 static unsigned int mips_small_data_threshold;
511
512 /* The number of file directives written by mips_output_filename. */
513 int num_source_filenames;
514
515 /* The name that appeared in the last .file directive written by
516 mips_output_filename, or "" if mips_output_filename hasn't
517 written anything yet. */
518 const char *current_function_file = "";
519
520 /* Arrays that map GCC register numbers to debugger register numbers. */
521 int mips_dbx_regno[FIRST_PSEUDO_REGISTER];
522 int mips_dwarf_regno[FIRST_PSEUDO_REGISTER];
523
524 /* Information about the current function's epilogue, used only while
525 expanding it. */
526 static struct {
527 /* A list of queued REG_CFA_RESTORE notes. */
528 rtx cfa_restores;
529
530 /* The CFA is currently defined as CFA_REG + CFA_OFFSET. */
531 rtx cfa_reg;
532 HOST_WIDE_INT cfa_offset;
533
534 /* The offset of the CFA from the stack pointer while restoring
535 registers. */
536 HOST_WIDE_INT cfa_restore_sp_offset;
537 } mips_epilogue;
538
539 /* The nesting depth of the PRINT_OPERAND '%(', '%<' and '%[' constructs. */
540 struct mips_asm_switch mips_noreorder = { "reorder", 0 };
541 struct mips_asm_switch mips_nomacro = { "macro", 0 };
542 struct mips_asm_switch mips_noat = { "at", 0 };
543
544 /* True if we're writing out a branch-likely instruction rather than a
545 normal branch. */
546 static bool mips_branch_likely;
547
548 /* The current instruction-set architecture. */
549 enum processor mips_arch;
550 const struct mips_cpu_info *mips_arch_info;
551
552 /* The processor that we should tune the code for. */
553 enum processor mips_tune;
554 const struct mips_cpu_info *mips_tune_info;
555
556 /* The ISA level associated with mips_arch. */
557 int mips_isa;
558
559 /* The architecture selected by -mipsN, or null if -mipsN wasn't used. */
560 static const struct mips_cpu_info *mips_isa_option_info;
561
562 /* Which cost information to use. */
563 static const struct mips_rtx_cost_data *mips_cost;
564
565 /* The ambient target flags, excluding MASK_MIPS16. */
566 static int mips_base_target_flags;
567
568 /* The default compression mode. */
569 unsigned int mips_base_compression_flags;
570
571 /* The ambient values of other global variables. */
572 static int mips_base_schedule_insns; /* flag_schedule_insns */
573 static int mips_base_reorder_blocks_and_partition; /* flag_reorder... */
574 static int mips_base_move_loop_invariants; /* flag_move_loop_invariants */
575 static int mips_base_align_loops; /* align_loops */
576 static int mips_base_align_jumps; /* align_jumps */
577 static int mips_base_align_functions; /* align_functions */
578
579 /* Index [M][R] is true if register R is allowed to hold a value of mode M. */
580 bool mips_hard_regno_mode_ok[(int) MAX_MACHINE_MODE][FIRST_PSEUDO_REGISTER];
581
582 /* Index C is true if character C is a valid PRINT_OPERAND punctation
583 character. */
584 static bool mips_print_operand_punct[256];
585
586 static GTY (()) int mips_output_filename_first_time = 1;
587
588 /* mips_split_p[X] is true if symbols of type X can be split by
589 mips_split_symbol. */
590 bool mips_split_p[NUM_SYMBOL_TYPES];
591
592 /* mips_split_hi_p[X] is true if the high parts of symbols of type X
593 can be split by mips_split_symbol. */
594 bool mips_split_hi_p[NUM_SYMBOL_TYPES];
595
596 /* mips_use_pcrel_pool_p[X] is true if symbols of type X should be
597 forced into a PC-relative constant pool. */
598 bool mips_use_pcrel_pool_p[NUM_SYMBOL_TYPES];
599
600 /* mips_lo_relocs[X] is the relocation to use when a symbol of type X
601 appears in a LO_SUM. It can be null if such LO_SUMs aren't valid or
602 if they are matched by a special .md file pattern. */
603 const char *mips_lo_relocs[NUM_SYMBOL_TYPES];
604
605 /* Likewise for HIGHs. */
606 const char *mips_hi_relocs[NUM_SYMBOL_TYPES];
607
608 /* Target state for MIPS16. */
609 struct target_globals *mips16_globals;
610
611 /* Cached value of can_issue_more. This is cached in mips_variable_issue hook
612 and returned from mips_sched_reorder2. */
613 static int cached_can_issue_more;
614
615 /* True if the output uses __mips16_rdhwr. */
616 static bool mips_need_mips16_rdhwr_p;
617
618 /* Index R is the smallest register class that contains register R. */
619 const enum reg_class mips_regno_to_class[FIRST_PSEUDO_REGISTER] = {
620 LEA_REGS, LEA_REGS, M16_REGS, V1_REG,
621 M16_REGS, M16_REGS, M16_REGS, M16_REGS,
622 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
623 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
624 M16_REGS, M16_REGS, LEA_REGS, LEA_REGS,
625 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
626 T_REG, PIC_FN_ADDR_REG, LEA_REGS, LEA_REGS,
627 LEA_REGS, LEA_REGS, LEA_REGS, LEA_REGS,
628 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
629 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
630 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
631 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
632 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
633 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
634 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
635 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
636 MD0_REG, MD1_REG, NO_REGS, ST_REGS,
637 ST_REGS, ST_REGS, ST_REGS, ST_REGS,
638 ST_REGS, ST_REGS, ST_REGS, NO_REGS,
639 NO_REGS, FRAME_REGS, FRAME_REGS, NO_REGS,
640 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
641 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
642 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
643 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
644 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
645 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
646 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
647 COP0_REGS, COP0_REGS, COP0_REGS, COP0_REGS,
648 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
649 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
650 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
651 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
652 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
653 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
654 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
655 COP2_REGS, COP2_REGS, COP2_REGS, COP2_REGS,
656 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
657 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
658 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
659 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
660 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
661 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
662 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
663 COP3_REGS, COP3_REGS, COP3_REGS, COP3_REGS,
664 DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS, DSP_ACC_REGS,
665 DSP_ACC_REGS, DSP_ACC_REGS, ALL_REGS, ALL_REGS,
666 ALL_REGS, ALL_REGS, ALL_REGS, ALL_REGS
667 };
668
669 /* The value of TARGET_ATTRIBUTE_TABLE. */
670 static const struct attribute_spec mips_attribute_table[] = {
671 /* { name, min_len, max_len, decl_req, type_req, fn_type_req, handler,
672 om_diagnostic } */
673 { "long_call", 0, 0, false, true, true, NULL, false },
674 { "far", 0, 0, false, true, true, NULL, false },
675 { "near", 0, 0, false, true, true, NULL, false },
676 /* We would really like to treat "mips16" and "nomips16" as type
677 attributes, but GCC doesn't provide the hooks we need to support
678 the right conversion rules. As declaration attributes, they affect
679 code generation but don't carry other semantics. */
680 { "mips16", 0, 0, true, false, false, NULL, false },
681 { "nomips16", 0, 0, true, false, false, NULL, false },
682 { "micromips", 0, 0, true, false, false, NULL, false },
683 { "nomicromips", 0, 0, true, false, false, NULL, false },
684 { "nocompression", 0, 0, true, false, false, NULL, false },
685 /* Allow functions to be specified as interrupt handlers */
686 { "interrupt", 0, 0, false, true, true, NULL, false },
687 { "use_shadow_register_set", 0, 0, false, true, true, NULL, false },
688 { "keep_interrupts_masked", 0, 0, false, true, true, NULL, false },
689 { "use_debug_exception_return", 0, 0, false, true, true, NULL, false },
690 { NULL, 0, 0, false, false, false, NULL, false }
691 };
692 \f
693 /* A table describing all the processors GCC knows about; see
694 mips-cpus.def for details. */
695 static const struct mips_cpu_info mips_cpu_info_table[] = {
696 #define MIPS_CPU(NAME, CPU, ISA, FLAGS) \
697 { NAME, CPU, ISA, FLAGS },
698 #include "mips-cpus.def"
699 #undef MIPS_CPU
700 };
701
702 /* Default costs. If these are used for a processor we should look
703 up the actual costs. */
704 #define DEFAULT_COSTS COSTS_N_INSNS (6), /* fp_add */ \
705 COSTS_N_INSNS (7), /* fp_mult_sf */ \
706 COSTS_N_INSNS (8), /* fp_mult_df */ \
707 COSTS_N_INSNS (23), /* fp_div_sf */ \
708 COSTS_N_INSNS (36), /* fp_div_df */ \
709 COSTS_N_INSNS (10), /* int_mult_si */ \
710 COSTS_N_INSNS (10), /* int_mult_di */ \
711 COSTS_N_INSNS (69), /* int_div_si */ \
712 COSTS_N_INSNS (69), /* int_div_di */ \
713 2, /* branch_cost */ \
714 4 /* memory_latency */
715
716 /* Floating-point costs for processors without an FPU. Just assume that
717 all floating-point libcalls are very expensive. */
718 #define SOFT_FP_COSTS COSTS_N_INSNS (256), /* fp_add */ \
719 COSTS_N_INSNS (256), /* fp_mult_sf */ \
720 COSTS_N_INSNS (256), /* fp_mult_df */ \
721 COSTS_N_INSNS (256), /* fp_div_sf */ \
722 COSTS_N_INSNS (256) /* fp_div_df */
723
724 /* Costs to use when optimizing for size. */
725 static const struct mips_rtx_cost_data mips_rtx_cost_optimize_size = {
726 COSTS_N_INSNS (1), /* fp_add */
727 COSTS_N_INSNS (1), /* fp_mult_sf */
728 COSTS_N_INSNS (1), /* fp_mult_df */
729 COSTS_N_INSNS (1), /* fp_div_sf */
730 COSTS_N_INSNS (1), /* fp_div_df */
731 COSTS_N_INSNS (1), /* int_mult_si */
732 COSTS_N_INSNS (1), /* int_mult_di */
733 COSTS_N_INSNS (1), /* int_div_si */
734 COSTS_N_INSNS (1), /* int_div_di */
735 2, /* branch_cost */
736 4 /* memory_latency */
737 };
738
739 /* Costs to use when optimizing for speed, indexed by processor. */
740 static const struct mips_rtx_cost_data
741 mips_rtx_cost_data[NUM_PROCESSOR_VALUES] = {
742 { /* R3000 */
743 COSTS_N_INSNS (2), /* fp_add */
744 COSTS_N_INSNS (4), /* fp_mult_sf */
745 COSTS_N_INSNS (5), /* fp_mult_df */
746 COSTS_N_INSNS (12), /* fp_div_sf */
747 COSTS_N_INSNS (19), /* fp_div_df */
748 COSTS_N_INSNS (12), /* int_mult_si */
749 COSTS_N_INSNS (12), /* int_mult_di */
750 COSTS_N_INSNS (35), /* int_div_si */
751 COSTS_N_INSNS (35), /* int_div_di */
752 1, /* branch_cost */
753 4 /* memory_latency */
754 },
755 { /* 4KC */
756 SOFT_FP_COSTS,
757 COSTS_N_INSNS (6), /* int_mult_si */
758 COSTS_N_INSNS (6), /* int_mult_di */
759 COSTS_N_INSNS (36), /* int_div_si */
760 COSTS_N_INSNS (36), /* int_div_di */
761 1, /* branch_cost */
762 4 /* memory_latency */
763 },
764 { /* 4KP */
765 SOFT_FP_COSTS,
766 COSTS_N_INSNS (36), /* int_mult_si */
767 COSTS_N_INSNS (36), /* int_mult_di */
768 COSTS_N_INSNS (37), /* int_div_si */
769 COSTS_N_INSNS (37), /* int_div_di */
770 1, /* branch_cost */
771 4 /* memory_latency */
772 },
773 { /* 5KC */
774 SOFT_FP_COSTS,
775 COSTS_N_INSNS (4), /* int_mult_si */
776 COSTS_N_INSNS (11), /* int_mult_di */
777 COSTS_N_INSNS (36), /* int_div_si */
778 COSTS_N_INSNS (68), /* int_div_di */
779 1, /* branch_cost */
780 4 /* memory_latency */
781 },
782 { /* 5KF */
783 COSTS_N_INSNS (4), /* fp_add */
784 COSTS_N_INSNS (4), /* fp_mult_sf */
785 COSTS_N_INSNS (5), /* fp_mult_df */
786 COSTS_N_INSNS (17), /* fp_div_sf */
787 COSTS_N_INSNS (32), /* fp_div_df */
788 COSTS_N_INSNS (4), /* int_mult_si */
789 COSTS_N_INSNS (11), /* int_mult_di */
790 COSTS_N_INSNS (36), /* int_div_si */
791 COSTS_N_INSNS (68), /* int_div_di */
792 1, /* branch_cost */
793 4 /* memory_latency */
794 },
795 { /* 20KC */
796 COSTS_N_INSNS (4), /* fp_add */
797 COSTS_N_INSNS (4), /* fp_mult_sf */
798 COSTS_N_INSNS (5), /* fp_mult_df */
799 COSTS_N_INSNS (17), /* fp_div_sf */
800 COSTS_N_INSNS (32), /* fp_div_df */
801 COSTS_N_INSNS (4), /* int_mult_si */
802 COSTS_N_INSNS (7), /* int_mult_di */
803 COSTS_N_INSNS (42), /* int_div_si */
804 COSTS_N_INSNS (72), /* int_div_di */
805 1, /* branch_cost */
806 4 /* memory_latency */
807 },
808 { /* 24KC */
809 SOFT_FP_COSTS,
810 COSTS_N_INSNS (5), /* int_mult_si */
811 COSTS_N_INSNS (5), /* int_mult_di */
812 COSTS_N_INSNS (41), /* int_div_si */
813 COSTS_N_INSNS (41), /* int_div_di */
814 1, /* branch_cost */
815 4 /* memory_latency */
816 },
817 { /* 24KF2_1 */
818 COSTS_N_INSNS (8), /* fp_add */
819 COSTS_N_INSNS (8), /* fp_mult_sf */
820 COSTS_N_INSNS (10), /* fp_mult_df */
821 COSTS_N_INSNS (34), /* fp_div_sf */
822 COSTS_N_INSNS (64), /* fp_div_df */
823 COSTS_N_INSNS (5), /* int_mult_si */
824 COSTS_N_INSNS (5), /* int_mult_di */
825 COSTS_N_INSNS (41), /* int_div_si */
826 COSTS_N_INSNS (41), /* int_div_di */
827 1, /* branch_cost */
828 4 /* memory_latency */
829 },
830 { /* 24KF1_1 */
831 COSTS_N_INSNS (4), /* fp_add */
832 COSTS_N_INSNS (4), /* fp_mult_sf */
833 COSTS_N_INSNS (5), /* fp_mult_df */
834 COSTS_N_INSNS (17), /* fp_div_sf */
835 COSTS_N_INSNS (32), /* fp_div_df */
836 COSTS_N_INSNS (5), /* int_mult_si */
837 COSTS_N_INSNS (5), /* int_mult_di */
838 COSTS_N_INSNS (41), /* int_div_si */
839 COSTS_N_INSNS (41), /* int_div_di */
840 1, /* branch_cost */
841 4 /* memory_latency */
842 },
843 { /* 74KC */
844 SOFT_FP_COSTS,
845 COSTS_N_INSNS (5), /* int_mult_si */
846 COSTS_N_INSNS (5), /* int_mult_di */
847 COSTS_N_INSNS (41), /* int_div_si */
848 COSTS_N_INSNS (41), /* int_div_di */
849 1, /* branch_cost */
850 4 /* memory_latency */
851 },
852 { /* 74KF2_1 */
853 COSTS_N_INSNS (8), /* fp_add */
854 COSTS_N_INSNS (8), /* fp_mult_sf */
855 COSTS_N_INSNS (10), /* fp_mult_df */
856 COSTS_N_INSNS (34), /* fp_div_sf */
857 COSTS_N_INSNS (64), /* fp_div_df */
858 COSTS_N_INSNS (5), /* int_mult_si */
859 COSTS_N_INSNS (5), /* int_mult_di */
860 COSTS_N_INSNS (41), /* int_div_si */
861 COSTS_N_INSNS (41), /* int_div_di */
862 1, /* branch_cost */
863 4 /* memory_latency */
864 },
865 { /* 74KF1_1 */
866 COSTS_N_INSNS (4), /* fp_add */
867 COSTS_N_INSNS (4), /* fp_mult_sf */
868 COSTS_N_INSNS (5), /* fp_mult_df */
869 COSTS_N_INSNS (17), /* fp_div_sf */
870 COSTS_N_INSNS (32), /* fp_div_df */
871 COSTS_N_INSNS (5), /* int_mult_si */
872 COSTS_N_INSNS (5), /* int_mult_di */
873 COSTS_N_INSNS (41), /* int_div_si */
874 COSTS_N_INSNS (41), /* int_div_di */
875 1, /* branch_cost */
876 4 /* memory_latency */
877 },
878 { /* 74KF3_2 */
879 COSTS_N_INSNS (6), /* fp_add */
880 COSTS_N_INSNS (6), /* fp_mult_sf */
881 COSTS_N_INSNS (7), /* fp_mult_df */
882 COSTS_N_INSNS (25), /* fp_div_sf */
883 COSTS_N_INSNS (48), /* fp_div_df */
884 COSTS_N_INSNS (5), /* int_mult_si */
885 COSTS_N_INSNS (5), /* int_mult_di */
886 COSTS_N_INSNS (41), /* int_div_si */
887 COSTS_N_INSNS (41), /* int_div_di */
888 1, /* branch_cost */
889 4 /* memory_latency */
890 },
891 { /* Loongson-2E */
892 DEFAULT_COSTS
893 },
894 { /* Loongson-2F */
895 DEFAULT_COSTS
896 },
897 { /* Loongson-3A */
898 DEFAULT_COSTS
899 },
900 { /* M4k */
901 DEFAULT_COSTS
902 },
903 /* Octeon */
904 {
905 SOFT_FP_COSTS,
906 COSTS_N_INSNS (5), /* int_mult_si */
907 COSTS_N_INSNS (5), /* int_mult_di */
908 COSTS_N_INSNS (72), /* int_div_si */
909 COSTS_N_INSNS (72), /* int_div_di */
910 1, /* branch_cost */
911 4 /* memory_latency */
912 },
913 /* Octeon II */
914 {
915 SOFT_FP_COSTS,
916 COSTS_N_INSNS (6), /* int_mult_si */
917 COSTS_N_INSNS (6), /* int_mult_di */
918 COSTS_N_INSNS (18), /* int_div_si */
919 COSTS_N_INSNS (35), /* int_div_di */
920 4, /* branch_cost */
921 4 /* memory_latency */
922 },
923 { /* R3900 */
924 COSTS_N_INSNS (2), /* fp_add */
925 COSTS_N_INSNS (4), /* fp_mult_sf */
926 COSTS_N_INSNS (5), /* fp_mult_df */
927 COSTS_N_INSNS (12), /* fp_div_sf */
928 COSTS_N_INSNS (19), /* fp_div_df */
929 COSTS_N_INSNS (2), /* int_mult_si */
930 COSTS_N_INSNS (2), /* int_mult_di */
931 COSTS_N_INSNS (35), /* int_div_si */
932 COSTS_N_INSNS (35), /* int_div_di */
933 1, /* branch_cost */
934 4 /* memory_latency */
935 },
936 { /* R6000 */
937 COSTS_N_INSNS (3), /* fp_add */
938 COSTS_N_INSNS (5), /* fp_mult_sf */
939 COSTS_N_INSNS (6), /* fp_mult_df */
940 COSTS_N_INSNS (15), /* fp_div_sf */
941 COSTS_N_INSNS (16), /* fp_div_df */
942 COSTS_N_INSNS (17), /* int_mult_si */
943 COSTS_N_INSNS (17), /* int_mult_di */
944 COSTS_N_INSNS (38), /* int_div_si */
945 COSTS_N_INSNS (38), /* int_div_di */
946 2, /* branch_cost */
947 6 /* memory_latency */
948 },
949 { /* R4000 */
950 COSTS_N_INSNS (6), /* fp_add */
951 COSTS_N_INSNS (7), /* fp_mult_sf */
952 COSTS_N_INSNS (8), /* fp_mult_df */
953 COSTS_N_INSNS (23), /* fp_div_sf */
954 COSTS_N_INSNS (36), /* fp_div_df */
955 COSTS_N_INSNS (10), /* int_mult_si */
956 COSTS_N_INSNS (10), /* int_mult_di */
957 COSTS_N_INSNS (69), /* int_div_si */
958 COSTS_N_INSNS (69), /* int_div_di */
959 2, /* branch_cost */
960 6 /* memory_latency */
961 },
962 { /* R4100 */
963 DEFAULT_COSTS
964 },
965 { /* R4111 */
966 DEFAULT_COSTS
967 },
968 { /* R4120 */
969 DEFAULT_COSTS
970 },
971 { /* R4130 */
972 /* The only costs that appear to be updated here are
973 integer multiplication. */
974 SOFT_FP_COSTS,
975 COSTS_N_INSNS (4), /* int_mult_si */
976 COSTS_N_INSNS (6), /* int_mult_di */
977 COSTS_N_INSNS (69), /* int_div_si */
978 COSTS_N_INSNS (69), /* int_div_di */
979 1, /* branch_cost */
980 4 /* memory_latency */
981 },
982 { /* R4300 */
983 DEFAULT_COSTS
984 },
985 { /* R4600 */
986 DEFAULT_COSTS
987 },
988 { /* R4650 */
989 DEFAULT_COSTS
990 },
991 { /* R4700 */
992 DEFAULT_COSTS
993 },
994 { /* R5000 */
995 COSTS_N_INSNS (6), /* fp_add */
996 COSTS_N_INSNS (4), /* fp_mult_sf */
997 COSTS_N_INSNS (5), /* fp_mult_df */
998 COSTS_N_INSNS (23), /* fp_div_sf */
999 COSTS_N_INSNS (36), /* fp_div_df */
1000 COSTS_N_INSNS (5), /* int_mult_si */
1001 COSTS_N_INSNS (5), /* int_mult_di */
1002 COSTS_N_INSNS (36), /* int_div_si */
1003 COSTS_N_INSNS (36), /* int_div_di */
1004 1, /* branch_cost */
1005 4 /* memory_latency */
1006 },
1007 { /* R5400 */
1008 COSTS_N_INSNS (6), /* fp_add */
1009 COSTS_N_INSNS (5), /* fp_mult_sf */
1010 COSTS_N_INSNS (6), /* fp_mult_df */
1011 COSTS_N_INSNS (30), /* fp_div_sf */
1012 COSTS_N_INSNS (59), /* fp_div_df */
1013 COSTS_N_INSNS (3), /* int_mult_si */
1014 COSTS_N_INSNS (4), /* int_mult_di */
1015 COSTS_N_INSNS (42), /* int_div_si */
1016 COSTS_N_INSNS (74), /* int_div_di */
1017 1, /* branch_cost */
1018 4 /* memory_latency */
1019 },
1020 { /* R5500 */
1021 COSTS_N_INSNS (6), /* fp_add */
1022 COSTS_N_INSNS (5), /* fp_mult_sf */
1023 COSTS_N_INSNS (6), /* fp_mult_df */
1024 COSTS_N_INSNS (30), /* fp_div_sf */
1025 COSTS_N_INSNS (59), /* fp_div_df */
1026 COSTS_N_INSNS (5), /* int_mult_si */
1027 COSTS_N_INSNS (9), /* int_mult_di */
1028 COSTS_N_INSNS (42), /* int_div_si */
1029 COSTS_N_INSNS (74), /* int_div_di */
1030 1, /* branch_cost */
1031 4 /* memory_latency */
1032 },
1033 { /* R5900 */
1034 COSTS_N_INSNS (4), /* fp_add */
1035 COSTS_N_INSNS (4), /* fp_mult_sf */
1036 COSTS_N_INSNS (256), /* fp_mult_df */
1037 COSTS_N_INSNS (8), /* fp_div_sf */
1038 COSTS_N_INSNS (256), /* fp_div_df */
1039 COSTS_N_INSNS (4), /* int_mult_si */
1040 COSTS_N_INSNS (256), /* int_mult_di */
1041 COSTS_N_INSNS (37), /* int_div_si */
1042 COSTS_N_INSNS (256), /* int_div_di */
1043 1, /* branch_cost */
1044 4 /* memory_latency */
1045 },
1046 { /* R7000 */
1047 /* The only costs that are changed here are
1048 integer multiplication. */
1049 COSTS_N_INSNS (6), /* fp_add */
1050 COSTS_N_INSNS (7), /* fp_mult_sf */
1051 COSTS_N_INSNS (8), /* fp_mult_df */
1052 COSTS_N_INSNS (23), /* fp_div_sf */
1053 COSTS_N_INSNS (36), /* fp_div_df */
1054 COSTS_N_INSNS (5), /* int_mult_si */
1055 COSTS_N_INSNS (9), /* int_mult_di */
1056 COSTS_N_INSNS (69), /* int_div_si */
1057 COSTS_N_INSNS (69), /* int_div_di */
1058 1, /* branch_cost */
1059 4 /* memory_latency */
1060 },
1061 { /* R8000 */
1062 DEFAULT_COSTS
1063 },
1064 { /* R9000 */
1065 /* The only costs that are changed here are
1066 integer multiplication. */
1067 COSTS_N_INSNS (6), /* fp_add */
1068 COSTS_N_INSNS (7), /* fp_mult_sf */
1069 COSTS_N_INSNS (8), /* fp_mult_df */
1070 COSTS_N_INSNS (23), /* fp_div_sf */
1071 COSTS_N_INSNS (36), /* fp_div_df */
1072 COSTS_N_INSNS (3), /* int_mult_si */
1073 COSTS_N_INSNS (8), /* int_mult_di */
1074 COSTS_N_INSNS (69), /* int_div_si */
1075 COSTS_N_INSNS (69), /* int_div_di */
1076 1, /* branch_cost */
1077 4 /* memory_latency */
1078 },
1079 { /* R1x000 */
1080 COSTS_N_INSNS (2), /* fp_add */
1081 COSTS_N_INSNS (2), /* fp_mult_sf */
1082 COSTS_N_INSNS (2), /* fp_mult_df */
1083 COSTS_N_INSNS (12), /* fp_div_sf */
1084 COSTS_N_INSNS (19), /* fp_div_df */
1085 COSTS_N_INSNS (5), /* int_mult_si */
1086 COSTS_N_INSNS (9), /* int_mult_di */
1087 COSTS_N_INSNS (34), /* int_div_si */
1088 COSTS_N_INSNS (66), /* int_div_di */
1089 1, /* branch_cost */
1090 4 /* memory_latency */
1091 },
1092 { /* SB1 */
1093 /* These costs are the same as the SB-1A below. */
1094 COSTS_N_INSNS (4), /* fp_add */
1095 COSTS_N_INSNS (4), /* fp_mult_sf */
1096 COSTS_N_INSNS (4), /* fp_mult_df */
1097 COSTS_N_INSNS (24), /* fp_div_sf */
1098 COSTS_N_INSNS (32), /* fp_div_df */
1099 COSTS_N_INSNS (3), /* int_mult_si */
1100 COSTS_N_INSNS (4), /* int_mult_di */
1101 COSTS_N_INSNS (36), /* int_div_si */
1102 COSTS_N_INSNS (68), /* int_div_di */
1103 1, /* branch_cost */
1104 4 /* memory_latency */
1105 },
1106 { /* SB1-A */
1107 /* These costs are the same as the SB-1 above. */
1108 COSTS_N_INSNS (4), /* fp_add */
1109 COSTS_N_INSNS (4), /* fp_mult_sf */
1110 COSTS_N_INSNS (4), /* fp_mult_df */
1111 COSTS_N_INSNS (24), /* fp_div_sf */
1112 COSTS_N_INSNS (32), /* fp_div_df */
1113 COSTS_N_INSNS (3), /* int_mult_si */
1114 COSTS_N_INSNS (4), /* int_mult_di */
1115 COSTS_N_INSNS (36), /* int_div_si */
1116 COSTS_N_INSNS (68), /* int_div_di */
1117 1, /* branch_cost */
1118 4 /* memory_latency */
1119 },
1120 { /* SR71000 */
1121 DEFAULT_COSTS
1122 },
1123 { /* XLR */
1124 SOFT_FP_COSTS,
1125 COSTS_N_INSNS (8), /* int_mult_si */
1126 COSTS_N_INSNS (8), /* int_mult_di */
1127 COSTS_N_INSNS (72), /* int_div_si */
1128 COSTS_N_INSNS (72), /* int_div_di */
1129 1, /* branch_cost */
1130 4 /* memory_latency */
1131 },
1132 { /* XLP */
1133 /* These costs are the same as 5KF above. */
1134 COSTS_N_INSNS (4), /* fp_add */
1135 COSTS_N_INSNS (4), /* fp_mult_sf */
1136 COSTS_N_INSNS (5), /* fp_mult_df */
1137 COSTS_N_INSNS (17), /* fp_div_sf */
1138 COSTS_N_INSNS (32), /* fp_div_df */
1139 COSTS_N_INSNS (4), /* int_mult_si */
1140 COSTS_N_INSNS (11), /* int_mult_di */
1141 COSTS_N_INSNS (36), /* int_div_si */
1142 COSTS_N_INSNS (68), /* int_div_di */
1143 1, /* branch_cost */
1144 4 /* memory_latency */
1145 }
1146 };
1147 \f
1148 static rtx mips_find_pic_call_symbol (rtx, rtx, bool);
1149 static int mips_register_move_cost (enum machine_mode, reg_class_t,
1150 reg_class_t);
1151 static unsigned int mips_function_arg_boundary (enum machine_mode, const_tree);
1152 \f
1153 /* This hash table keeps track of implicit "mips16" and "nomips16" attributes
1154 for -mflip_mips16. It maps decl names onto a boolean mode setting. */
1155 struct GTY (()) mflip_mips16_entry {
1156 const char *name;
1157 bool mips16_p;
1158 };
1159 static GTY ((param_is (struct mflip_mips16_entry))) htab_t mflip_mips16_htab;
1160
1161 /* Hash table callbacks for mflip_mips16_htab. */
1162
1163 static hashval_t
1164 mflip_mips16_htab_hash (const void *entry)
1165 {
1166 return htab_hash_string (((const struct mflip_mips16_entry *) entry)->name);
1167 }
1168
1169 static int
1170 mflip_mips16_htab_eq (const void *entry, const void *name)
1171 {
1172 return strcmp (((const struct mflip_mips16_entry *) entry)->name,
1173 (const char *) name) == 0;
1174 }
1175
1176 /* True if -mflip-mips16 should next add an attribute for the default MIPS16
1177 mode, false if it should next add an attribute for the opposite mode. */
1178 static GTY(()) bool mips16_flipper;
1179
1180 /* DECL is a function that needs a default "mips16" or "nomips16" attribute
1181 for -mflip-mips16. Return true if it should use "mips16" and false if
1182 it should use "nomips16". */
1183
1184 static bool
1185 mflip_mips16_use_mips16_p (tree decl)
1186 {
1187 struct mflip_mips16_entry *entry;
1188 const char *name;
1189 hashval_t hash;
1190 void **slot;
1191 bool base_is_mips16 = (mips_base_compression_flags & MASK_MIPS16) != 0;
1192
1193 /* Use the opposite of the command-line setting for anonymous decls. */
1194 if (!DECL_NAME (decl))
1195 return !base_is_mips16;
1196
1197 if (!mflip_mips16_htab)
1198 mflip_mips16_htab = htab_create_ggc (37, mflip_mips16_htab_hash,
1199 mflip_mips16_htab_eq, NULL);
1200
1201 name = IDENTIFIER_POINTER (DECL_NAME (decl));
1202 hash = htab_hash_string (name);
1203 slot = htab_find_slot_with_hash (mflip_mips16_htab, name, hash, INSERT);
1204 entry = (struct mflip_mips16_entry *) *slot;
1205 if (!entry)
1206 {
1207 mips16_flipper = !mips16_flipper;
1208 entry = ggc_alloc_mflip_mips16_entry ();
1209 entry->name = name;
1210 entry->mips16_p = mips16_flipper ? !base_is_mips16 : base_is_mips16;
1211 *slot = entry;
1212 }
1213 return entry->mips16_p;
1214 }
1215 \f
1216 /* Predicates to test for presence of "near" and "far"/"long_call"
1217 attributes on the given TYPE. */
1218
1219 static bool
1220 mips_near_type_p (const_tree type)
1221 {
1222 return lookup_attribute ("near", TYPE_ATTRIBUTES (type)) != NULL;
1223 }
1224
1225 static bool
1226 mips_far_type_p (const_tree type)
1227 {
1228 return (lookup_attribute ("long_call", TYPE_ATTRIBUTES (type)) != NULL
1229 || lookup_attribute ("far", TYPE_ATTRIBUTES (type)) != NULL);
1230 }
1231
1232
1233 /* Check if the interrupt attribute is set for a function. */
1234
1235 static bool
1236 mips_interrupt_type_p (tree type)
1237 {
1238 return lookup_attribute ("interrupt", TYPE_ATTRIBUTES (type)) != NULL;
1239 }
1240
1241 /* Check if the attribute to use shadow register set is set for a function. */
1242
1243 static bool
1244 mips_use_shadow_register_set_p (tree type)
1245 {
1246 return lookup_attribute ("use_shadow_register_set",
1247 TYPE_ATTRIBUTES (type)) != NULL;
1248 }
1249
1250 /* Check if the attribute to keep interrupts masked is set for a function. */
1251
1252 static bool
1253 mips_keep_interrupts_masked_p (tree type)
1254 {
1255 return lookup_attribute ("keep_interrupts_masked",
1256 TYPE_ATTRIBUTES (type)) != NULL;
1257 }
1258
1259 /* Check if the attribute to use debug exception return is set for
1260 a function. */
1261
1262 static bool
1263 mips_use_debug_exception_return_p (tree type)
1264 {
1265 return lookup_attribute ("use_debug_exception_return",
1266 TYPE_ATTRIBUTES (type)) != NULL;
1267 }
1268
1269 /* Return the set of compression modes that are explicitly required
1270 by the attributes in ATTRIBUTES. */
1271
1272 static unsigned int
1273 mips_get_compress_on_flags (tree attributes)
1274 {
1275 unsigned int flags = 0;
1276
1277 if (lookup_attribute ("mips16", attributes) != NULL)
1278 flags |= MASK_MIPS16;
1279
1280 if (lookup_attribute ("micromips", attributes) != NULL)
1281 flags |= MASK_MICROMIPS;
1282
1283 return flags;
1284 }
1285
1286 /* Return the set of compression modes that are explicitly forbidden
1287 by the attributes in ATTRIBUTES. */
1288
1289 static unsigned int
1290 mips_get_compress_off_flags (tree attributes)
1291 {
1292 unsigned int flags = 0;
1293
1294 if (lookup_attribute ("nocompression", attributes) != NULL)
1295 flags |= MASK_MIPS16 | MASK_MICROMIPS;
1296
1297 if (lookup_attribute ("nomips16", attributes) != NULL)
1298 flags |= MASK_MIPS16;
1299
1300 if (lookup_attribute ("nomicromips", attributes) != NULL)
1301 flags |= MASK_MICROMIPS;
1302
1303 return flags;
1304 }
1305
1306 /* Return the compression mode that should be used for function DECL.
1307 Return the ambient setting if DECL is null. */
1308
1309 static unsigned int
1310 mips_get_compress_mode (tree decl)
1311 {
1312 unsigned int flags, force_on;
1313
1314 flags = mips_base_compression_flags;
1315 if (decl)
1316 {
1317 /* Nested functions must use the same frame pointer as their
1318 parent and must therefore use the same ISA mode. */
1319 tree parent = decl_function_context (decl);
1320 if (parent)
1321 decl = parent;
1322 force_on = mips_get_compress_on_flags (DECL_ATTRIBUTES (decl));
1323 if (force_on)
1324 return force_on;
1325 flags &= ~mips_get_compress_off_flags (DECL_ATTRIBUTES (decl));
1326 }
1327 return flags;
1328 }
1329
1330 /* Return the attribute name associated with MASK_MIPS16 and MASK_MICROMIPS
1331 flags FLAGS. */
1332
1333 static const char *
1334 mips_get_compress_on_name (unsigned int flags)
1335 {
1336 if (flags == MASK_MIPS16)
1337 return "mips16";
1338 return "micromips";
1339 }
1340
1341 /* Return the attribute name that forbids MASK_MIPS16 and MASK_MICROMIPS
1342 flags FLAGS. */
1343
1344 static const char *
1345 mips_get_compress_off_name (unsigned int flags)
1346 {
1347 if (flags == MASK_MIPS16)
1348 return "nomips16";
1349 if (flags == MASK_MICROMIPS)
1350 return "nomicromips";
1351 return "nocompression";
1352 }
1353
1354 /* Implement TARGET_COMP_TYPE_ATTRIBUTES. */
1355
1356 static int
1357 mips_comp_type_attributes (const_tree type1, const_tree type2)
1358 {
1359 /* Disallow mixed near/far attributes. */
1360 if (mips_far_type_p (type1) && mips_near_type_p (type2))
1361 return 0;
1362 if (mips_near_type_p (type1) && mips_far_type_p (type2))
1363 return 0;
1364 return 1;
1365 }
1366
1367 /* Implement TARGET_INSERT_ATTRIBUTES. */
1368
1369 static void
1370 mips_insert_attributes (tree decl, tree *attributes)
1371 {
1372 const char *name;
1373 unsigned int compression_flags, nocompression_flags;
1374
1375 /* Check for "mips16" and "nomips16" attributes. */
1376 compression_flags = mips_get_compress_on_flags (*attributes);
1377 nocompression_flags = mips_get_compress_off_flags (*attributes);
1378
1379 if (TREE_CODE (decl) != FUNCTION_DECL)
1380 {
1381 if (nocompression_flags)
1382 error ("%qs attribute only applies to functions",
1383 mips_get_compress_off_name (nocompression_flags));
1384
1385 if (compression_flags)
1386 error ("%qs attribute only applies to functions",
1387 mips_get_compress_on_name (nocompression_flags));
1388 }
1389 else
1390 {
1391 compression_flags |= mips_get_compress_on_flags (DECL_ATTRIBUTES (decl));
1392 nocompression_flags |=
1393 mips_get_compress_off_flags (DECL_ATTRIBUTES (decl));
1394
1395 if (compression_flags && nocompression_flags)
1396 error ("%qE cannot have both %qs and %qs attributes",
1397 DECL_NAME (decl), mips_get_compress_on_name (compression_flags),
1398 mips_get_compress_off_name (nocompression_flags));
1399
1400 if (compression_flags & MASK_MIPS16
1401 && compression_flags & MASK_MICROMIPS)
1402 error ("%qE cannot have both %qs and %qs attributes",
1403 DECL_NAME (decl), "mips16", "micromips");
1404
1405 if (TARGET_FLIP_MIPS16
1406 && !DECL_ARTIFICIAL (decl)
1407 && compression_flags == 0
1408 && nocompression_flags == 0)
1409 {
1410 /* Implement -mflip-mips16. If DECL has neither a "nomips16" nor a
1411 "mips16" attribute, arbitrarily pick one. We must pick the same
1412 setting for duplicate declarations of a function. */
1413 name = mflip_mips16_use_mips16_p (decl) ? "mips16" : "nomips16";
1414 *attributes = tree_cons (get_identifier (name), NULL, *attributes);
1415 name = "nomicromips";
1416 *attributes = tree_cons (get_identifier (name), NULL, *attributes);
1417 }
1418 }
1419 }
1420
1421 /* Implement TARGET_MERGE_DECL_ATTRIBUTES. */
1422
1423 static tree
1424 mips_merge_decl_attributes (tree olddecl, tree newdecl)
1425 {
1426 unsigned int diff;
1427
1428 diff = (mips_get_compress_on_flags (DECL_ATTRIBUTES (olddecl))
1429 ^ mips_get_compress_on_flags (DECL_ATTRIBUTES (newdecl)));
1430 if (diff)
1431 error ("%qE redeclared with conflicting %qs attributes",
1432 DECL_NAME (newdecl), mips_get_compress_on_name (diff));
1433
1434 diff = (mips_get_compress_off_flags (DECL_ATTRIBUTES (olddecl))
1435 ^ mips_get_compress_off_flags (DECL_ATTRIBUTES (newdecl)));
1436 if (diff)
1437 error ("%qE redeclared with conflicting %qs attributes",
1438 DECL_NAME (newdecl), mips_get_compress_off_name (diff));
1439
1440 return merge_attributes (DECL_ATTRIBUTES (olddecl),
1441 DECL_ATTRIBUTES (newdecl));
1442 }
1443
1444 /* Implement TARGET_CAN_INLINE_P. */
1445
1446 static bool
1447 mips_can_inline_p (tree caller, tree callee)
1448 {
1449 if (mips_get_compress_mode (callee) != mips_get_compress_mode (caller))
1450 return false;
1451 return default_target_can_inline_p (caller, callee);
1452 }
1453 \f
1454 /* If X is a PLUS of a CONST_INT, return the two terms in *BASE_PTR
1455 and *OFFSET_PTR. Return X in *BASE_PTR and 0 in *OFFSET_PTR otherwise. */
1456
1457 static void
1458 mips_split_plus (rtx x, rtx *base_ptr, HOST_WIDE_INT *offset_ptr)
1459 {
1460 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1)))
1461 {
1462 *base_ptr = XEXP (x, 0);
1463 *offset_ptr = INTVAL (XEXP (x, 1));
1464 }
1465 else
1466 {
1467 *base_ptr = x;
1468 *offset_ptr = 0;
1469 }
1470 }
1471 \f
1472 static unsigned int mips_build_integer (struct mips_integer_op *,
1473 unsigned HOST_WIDE_INT);
1474
1475 /* A subroutine of mips_build_integer, with the same interface.
1476 Assume that the final action in the sequence should be a left shift. */
1477
1478 static unsigned int
1479 mips_build_shift (struct mips_integer_op *codes, HOST_WIDE_INT value)
1480 {
1481 unsigned int i, shift;
1482
1483 /* Shift VALUE right until its lowest bit is set. Shift arithmetically
1484 since signed numbers are easier to load than unsigned ones. */
1485 shift = 0;
1486 while ((value & 1) == 0)
1487 value /= 2, shift++;
1488
1489 i = mips_build_integer (codes, value);
1490 codes[i].code = ASHIFT;
1491 codes[i].value = shift;
1492 return i + 1;
1493 }
1494
1495 /* As for mips_build_shift, but assume that the final action will be
1496 an IOR or PLUS operation. */
1497
1498 static unsigned int
1499 mips_build_lower (struct mips_integer_op *codes, unsigned HOST_WIDE_INT value)
1500 {
1501 unsigned HOST_WIDE_INT high;
1502 unsigned int i;
1503
1504 high = value & ~(unsigned HOST_WIDE_INT) 0xffff;
1505 if (!LUI_OPERAND (high) && (value & 0x18000) == 0x18000)
1506 {
1507 /* The constant is too complex to load with a simple LUI/ORI pair,
1508 so we want to give the recursive call as many trailing zeros as
1509 possible. In this case, we know bit 16 is set and that the
1510 low 16 bits form a negative number. If we subtract that number
1511 from VALUE, we will clear at least the lowest 17 bits, maybe more. */
1512 i = mips_build_integer (codes, CONST_HIGH_PART (value));
1513 codes[i].code = PLUS;
1514 codes[i].value = CONST_LOW_PART (value);
1515 }
1516 else
1517 {
1518 /* Either this is a simple LUI/ORI pair, or clearing the lowest 16
1519 bits gives a value with at least 17 trailing zeros. */
1520 i = mips_build_integer (codes, high);
1521 codes[i].code = IOR;
1522 codes[i].value = value & 0xffff;
1523 }
1524 return i + 1;
1525 }
1526
1527 /* Fill CODES with a sequence of rtl operations to load VALUE.
1528 Return the number of operations needed. */
1529
1530 static unsigned int
1531 mips_build_integer (struct mips_integer_op *codes,
1532 unsigned HOST_WIDE_INT value)
1533 {
1534 if (SMALL_OPERAND (value)
1535 || SMALL_OPERAND_UNSIGNED (value)
1536 || LUI_OPERAND (value))
1537 {
1538 /* The value can be loaded with a single instruction. */
1539 codes[0].code = UNKNOWN;
1540 codes[0].value = value;
1541 return 1;
1542 }
1543 else if ((value & 1) != 0 || LUI_OPERAND (CONST_HIGH_PART (value)))
1544 {
1545 /* Either the constant is a simple LUI/ORI combination or its
1546 lowest bit is set. We don't want to shift in this case. */
1547 return mips_build_lower (codes, value);
1548 }
1549 else if ((value & 0xffff) == 0)
1550 {
1551 /* The constant will need at least three actions. The lowest
1552 16 bits are clear, so the final action will be a shift. */
1553 return mips_build_shift (codes, value);
1554 }
1555 else
1556 {
1557 /* The final action could be a shift, add or inclusive OR.
1558 Rather than use a complex condition to select the best
1559 approach, try both mips_build_shift and mips_build_lower
1560 and pick the one that gives the shortest sequence.
1561 Note that this case is only used once per constant. */
1562 struct mips_integer_op alt_codes[MIPS_MAX_INTEGER_OPS];
1563 unsigned int cost, alt_cost;
1564
1565 cost = mips_build_shift (codes, value);
1566 alt_cost = mips_build_lower (alt_codes, value);
1567 if (alt_cost < cost)
1568 {
1569 memcpy (codes, alt_codes, alt_cost * sizeof (codes[0]));
1570 cost = alt_cost;
1571 }
1572 return cost;
1573 }
1574 }
1575 \f
1576 /* Implement TARGET_LEGITIMATE_CONSTANT_P. */
1577
1578 static bool
1579 mips_legitimate_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED, rtx x)
1580 {
1581 return mips_const_insns (x) > 0;
1582 }
1583 \f
1584 /* Return a SYMBOL_REF for a MIPS16 function called NAME. */
1585
1586 static rtx
1587 mips16_stub_function (const char *name)
1588 {
1589 rtx x;
1590
1591 x = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (name));
1592 SYMBOL_REF_FLAGS (x) |= (SYMBOL_FLAG_EXTERNAL | SYMBOL_FLAG_FUNCTION);
1593 return x;
1594 }
1595 \f
1596 /* Return true if symbols of type TYPE require a GOT access. */
1597
1598 static bool
1599 mips_got_symbol_type_p (enum mips_symbol_type type)
1600 {
1601 switch (type)
1602 {
1603 case SYMBOL_GOT_PAGE_OFST:
1604 case SYMBOL_GOT_DISP:
1605 return true;
1606
1607 default:
1608 return false;
1609 }
1610 }
1611
1612 /* Return true if X is a thread-local symbol. */
1613
1614 static bool
1615 mips_tls_symbol_p (rtx x)
1616 {
1617 return GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_TLS_MODEL (x) != 0;
1618 }
1619
1620 /* Return true if SYMBOL_REF X is associated with a global symbol
1621 (in the STB_GLOBAL sense). */
1622
1623 static bool
1624 mips_global_symbol_p (const_rtx x)
1625 {
1626 const_tree decl = SYMBOL_REF_DECL (x);
1627
1628 if (!decl)
1629 return !SYMBOL_REF_LOCAL_P (x) || SYMBOL_REF_EXTERNAL_P (x);
1630
1631 /* Weakref symbols are not TREE_PUBLIC, but their targets are global
1632 or weak symbols. Relocations in the object file will be against
1633 the target symbol, so it's that symbol's binding that matters here. */
1634 return DECL_P (decl) && (TREE_PUBLIC (decl) || DECL_WEAK (decl));
1635 }
1636
1637 /* Return true if function X is a libgcc MIPS16 stub function. */
1638
1639 static bool
1640 mips16_stub_function_p (const_rtx x)
1641 {
1642 return (GET_CODE (x) == SYMBOL_REF
1643 && strncmp (XSTR (x, 0), "__mips16_", 9) == 0);
1644 }
1645
1646 /* Return true if function X is a locally-defined and locally-binding
1647 MIPS16 function. */
1648
1649 static bool
1650 mips16_local_function_p (const_rtx x)
1651 {
1652 return (GET_CODE (x) == SYMBOL_REF
1653 && SYMBOL_REF_LOCAL_P (x)
1654 && !SYMBOL_REF_EXTERNAL_P (x)
1655 && (mips_get_compress_mode (SYMBOL_REF_DECL (x)) & MASK_MIPS16));
1656 }
1657
1658 /* Return true if SYMBOL_REF X binds locally. */
1659
1660 static bool
1661 mips_symbol_binds_local_p (const_rtx x)
1662 {
1663 return (SYMBOL_REF_DECL (x)
1664 ? targetm.binds_local_p (SYMBOL_REF_DECL (x))
1665 : SYMBOL_REF_LOCAL_P (x));
1666 }
1667
1668 /* Return true if rtx constants of mode MODE should be put into a small
1669 data section. */
1670
1671 static bool
1672 mips_rtx_constant_in_small_data_p (enum machine_mode mode)
1673 {
1674 return (!TARGET_EMBEDDED_DATA
1675 && TARGET_LOCAL_SDATA
1676 && GET_MODE_SIZE (mode) <= mips_small_data_threshold);
1677 }
1678
1679 /* Return true if X should not be moved directly into register $25.
1680 We need this because many versions of GAS will treat "la $25,foo" as
1681 part of a call sequence and so allow a global "foo" to be lazily bound. */
1682
1683 bool
1684 mips_dangerous_for_la25_p (rtx x)
1685 {
1686 return (!TARGET_EXPLICIT_RELOCS
1687 && TARGET_USE_GOT
1688 && GET_CODE (x) == SYMBOL_REF
1689 && mips_global_symbol_p (x));
1690 }
1691
1692 /* Return true if calls to X might need $25 to be valid on entry. */
1693
1694 bool
1695 mips_use_pic_fn_addr_reg_p (const_rtx x)
1696 {
1697 if (!TARGET_USE_PIC_FN_ADDR_REG)
1698 return false;
1699
1700 /* MIPS16 stub functions are guaranteed not to use $25. */
1701 if (mips16_stub_function_p (x))
1702 return false;
1703
1704 if (GET_CODE (x) == SYMBOL_REF)
1705 {
1706 /* If PLTs and copy relocations are available, the static linker
1707 will make sure that $25 is valid on entry to the target function. */
1708 if (TARGET_ABICALLS_PIC0)
1709 return false;
1710
1711 /* Locally-defined functions use absolute accesses to set up
1712 the global pointer. */
1713 if (TARGET_ABSOLUTE_ABICALLS
1714 && mips_symbol_binds_local_p (x)
1715 && !SYMBOL_REF_EXTERNAL_P (x))
1716 return false;
1717 }
1718
1719 return true;
1720 }
1721
1722 /* Return the method that should be used to access SYMBOL_REF or
1723 LABEL_REF X in context CONTEXT. */
1724
1725 static enum mips_symbol_type
1726 mips_classify_symbol (const_rtx x, enum mips_symbol_context context)
1727 {
1728 if (TARGET_RTP_PIC)
1729 return SYMBOL_GOT_DISP;
1730
1731 if (GET_CODE (x) == LABEL_REF)
1732 {
1733 /* Only return SYMBOL_PC_RELATIVE if we are generating MIPS16
1734 code and if we know that the label is in the current function's
1735 text section. LABEL_REFs are used for jump tables as well as
1736 text labels, so we must check whether jump tables live in the
1737 text section. */
1738 if (TARGET_MIPS16_SHORT_JUMP_TABLES
1739 && !LABEL_REF_NONLOCAL_P (x))
1740 return SYMBOL_PC_RELATIVE;
1741
1742 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS)
1743 return SYMBOL_GOT_PAGE_OFST;
1744
1745 return SYMBOL_ABSOLUTE;
1746 }
1747
1748 gcc_assert (GET_CODE (x) == SYMBOL_REF);
1749
1750 if (SYMBOL_REF_TLS_MODEL (x))
1751 return SYMBOL_TLS;
1752
1753 if (CONSTANT_POOL_ADDRESS_P (x))
1754 {
1755 if (TARGET_MIPS16_TEXT_LOADS)
1756 return SYMBOL_PC_RELATIVE;
1757
1758 if (TARGET_MIPS16_PCREL_LOADS && context == SYMBOL_CONTEXT_MEM)
1759 return SYMBOL_PC_RELATIVE;
1760
1761 if (mips_rtx_constant_in_small_data_p (get_pool_mode (x)))
1762 return SYMBOL_GP_RELATIVE;
1763 }
1764
1765 /* Do not use small-data accesses for weak symbols; they may end up
1766 being zero. */
1767 if (TARGET_GPOPT && SYMBOL_REF_SMALL_P (x) && !SYMBOL_REF_WEAK (x))
1768 return SYMBOL_GP_RELATIVE;
1769
1770 /* Don't use GOT accesses for locally-binding symbols when -mno-shared
1771 is in effect. */
1772 if (TARGET_ABICALLS_PIC2
1773 && !(TARGET_ABSOLUTE_ABICALLS && mips_symbol_binds_local_p (x)))
1774 {
1775 /* There are three cases to consider:
1776
1777 - o32 PIC (either with or without explicit relocs)
1778 - n32/n64 PIC without explicit relocs
1779 - n32/n64 PIC with explicit relocs
1780
1781 In the first case, both local and global accesses will use an
1782 R_MIPS_GOT16 relocation. We must correctly predict which of
1783 the two semantics (local or global) the assembler and linker
1784 will apply. The choice depends on the symbol's binding rather
1785 than its visibility.
1786
1787 In the second case, the assembler will not use R_MIPS_GOT16
1788 relocations, but it chooses between local and global accesses
1789 in the same way as for o32 PIC.
1790
1791 In the third case we have more freedom since both forms of
1792 access will work for any kind of symbol. However, there seems
1793 little point in doing things differently. */
1794 if (mips_global_symbol_p (x))
1795 return SYMBOL_GOT_DISP;
1796
1797 return SYMBOL_GOT_PAGE_OFST;
1798 }
1799
1800 return SYMBOL_ABSOLUTE;
1801 }
1802
1803 /* Classify the base of symbolic expression X, given that X appears in
1804 context CONTEXT. */
1805
1806 static enum mips_symbol_type
1807 mips_classify_symbolic_expression (rtx x, enum mips_symbol_context context)
1808 {
1809 rtx offset;
1810
1811 split_const (x, &x, &offset);
1812 if (UNSPEC_ADDRESS_P (x))
1813 return UNSPEC_ADDRESS_TYPE (x);
1814
1815 return mips_classify_symbol (x, context);
1816 }
1817
1818 /* Return true if OFFSET is within the range [0, ALIGN), where ALIGN
1819 is the alignment in bytes of SYMBOL_REF X. */
1820
1821 static bool
1822 mips_offset_within_alignment_p (rtx x, HOST_WIDE_INT offset)
1823 {
1824 HOST_WIDE_INT align;
1825
1826 align = SYMBOL_REF_DECL (x) ? DECL_ALIGN_UNIT (SYMBOL_REF_DECL (x)) : 1;
1827 return IN_RANGE (offset, 0, align - 1);
1828 }
1829
1830 /* Return true if X is a symbolic constant that can be used in context
1831 CONTEXT. If it is, store the type of the symbol in *SYMBOL_TYPE. */
1832
1833 bool
1834 mips_symbolic_constant_p (rtx x, enum mips_symbol_context context,
1835 enum mips_symbol_type *symbol_type)
1836 {
1837 rtx offset;
1838
1839 split_const (x, &x, &offset);
1840 if (UNSPEC_ADDRESS_P (x))
1841 {
1842 *symbol_type = UNSPEC_ADDRESS_TYPE (x);
1843 x = UNSPEC_ADDRESS (x);
1844 }
1845 else if (GET_CODE (x) == SYMBOL_REF || GET_CODE (x) == LABEL_REF)
1846 {
1847 *symbol_type = mips_classify_symbol (x, context);
1848 if (*symbol_type == SYMBOL_TLS)
1849 return false;
1850 }
1851 else
1852 return false;
1853
1854 if (offset == const0_rtx)
1855 return true;
1856
1857 /* Check whether a nonzero offset is valid for the underlying
1858 relocations. */
1859 switch (*symbol_type)
1860 {
1861 case SYMBOL_ABSOLUTE:
1862 case SYMBOL_64_HIGH:
1863 case SYMBOL_64_MID:
1864 case SYMBOL_64_LOW:
1865 /* If the target has 64-bit pointers and the object file only
1866 supports 32-bit symbols, the values of those symbols will be
1867 sign-extended. In this case we can't allow an arbitrary offset
1868 in case the 32-bit value X + OFFSET has a different sign from X. */
1869 if (Pmode == DImode && !ABI_HAS_64BIT_SYMBOLS)
1870 return offset_within_block_p (x, INTVAL (offset));
1871
1872 /* In other cases the relocations can handle any offset. */
1873 return true;
1874
1875 case SYMBOL_PC_RELATIVE:
1876 /* Allow constant pool references to be converted to LABEL+CONSTANT.
1877 In this case, we no longer have access to the underlying constant,
1878 but the original symbol-based access was known to be valid. */
1879 if (GET_CODE (x) == LABEL_REF)
1880 return true;
1881
1882 /* Fall through. */
1883
1884 case SYMBOL_GP_RELATIVE:
1885 /* Make sure that the offset refers to something within the
1886 same object block. This should guarantee that the final
1887 PC- or GP-relative offset is within the 16-bit limit. */
1888 return offset_within_block_p (x, INTVAL (offset));
1889
1890 case SYMBOL_GOT_PAGE_OFST:
1891 case SYMBOL_GOTOFF_PAGE:
1892 /* If the symbol is global, the GOT entry will contain the symbol's
1893 address, and we will apply a 16-bit offset after loading it.
1894 If the symbol is local, the linker should provide enough local
1895 GOT entries for a 16-bit offset, but larger offsets may lead
1896 to GOT overflow. */
1897 return SMALL_INT (offset);
1898
1899 case SYMBOL_TPREL:
1900 case SYMBOL_DTPREL:
1901 /* There is no carry between the HI and LO REL relocations, so the
1902 offset is only valid if we know it won't lead to such a carry. */
1903 return mips_offset_within_alignment_p (x, INTVAL (offset));
1904
1905 case SYMBOL_GOT_DISP:
1906 case SYMBOL_GOTOFF_DISP:
1907 case SYMBOL_GOTOFF_CALL:
1908 case SYMBOL_GOTOFF_LOADGP:
1909 case SYMBOL_TLSGD:
1910 case SYMBOL_TLSLDM:
1911 case SYMBOL_GOTTPREL:
1912 case SYMBOL_TLS:
1913 case SYMBOL_HALF:
1914 return false;
1915 }
1916 gcc_unreachable ();
1917 }
1918 \f
1919 /* Like mips_symbol_insns, but treat extended MIPS16 instructions as a
1920 single instruction. We rely on the fact that, in the worst case,
1921 all instructions involved in a MIPS16 address calculation are usually
1922 extended ones. */
1923
1924 static int
1925 mips_symbol_insns_1 (enum mips_symbol_type type, enum machine_mode mode)
1926 {
1927 if (mips_use_pcrel_pool_p[(int) type])
1928 {
1929 if (mode == MAX_MACHINE_MODE)
1930 /* LEAs will be converted into constant-pool references by
1931 mips_reorg. */
1932 type = SYMBOL_PC_RELATIVE;
1933 else
1934 /* The constant must be loaded and then dereferenced. */
1935 return 0;
1936 }
1937
1938 switch (type)
1939 {
1940 case SYMBOL_ABSOLUTE:
1941 /* When using 64-bit symbols, we need 5 preparatory instructions,
1942 such as:
1943
1944 lui $at,%highest(symbol)
1945 daddiu $at,$at,%higher(symbol)
1946 dsll $at,$at,16
1947 daddiu $at,$at,%hi(symbol)
1948 dsll $at,$at,16
1949
1950 The final address is then $at + %lo(symbol). With 32-bit
1951 symbols we just need a preparatory LUI for normal mode and
1952 a preparatory LI and SLL for MIPS16. */
1953 return ABI_HAS_64BIT_SYMBOLS ? 6 : TARGET_MIPS16 ? 3 : 2;
1954
1955 case SYMBOL_GP_RELATIVE:
1956 /* Treat GP-relative accesses as taking a single instruction on
1957 MIPS16 too; the copy of $gp can often be shared. */
1958 return 1;
1959
1960 case SYMBOL_PC_RELATIVE:
1961 /* PC-relative constants can be only be used with ADDIUPC,
1962 DADDIUPC, LWPC and LDPC. */
1963 if (mode == MAX_MACHINE_MODE
1964 || GET_MODE_SIZE (mode) == 4
1965 || GET_MODE_SIZE (mode) == 8)
1966 return 1;
1967
1968 /* The constant must be loaded using ADDIUPC or DADDIUPC first. */
1969 return 0;
1970
1971 case SYMBOL_GOT_DISP:
1972 /* The constant will have to be loaded from the GOT before it
1973 is used in an address. */
1974 if (mode != MAX_MACHINE_MODE)
1975 return 0;
1976
1977 /* Fall through. */
1978
1979 case SYMBOL_GOT_PAGE_OFST:
1980 /* Unless -funit-at-a-time is in effect, we can't be sure whether the
1981 local/global classification is accurate. The worst cases are:
1982
1983 (1) For local symbols when generating o32 or o64 code. The assembler
1984 will use:
1985
1986 lw $at,%got(symbol)
1987 nop
1988
1989 ...and the final address will be $at + %lo(symbol).
1990
1991 (2) For global symbols when -mxgot. The assembler will use:
1992
1993 lui $at,%got_hi(symbol)
1994 (d)addu $at,$at,$gp
1995
1996 ...and the final address will be $at + %got_lo(symbol). */
1997 return 3;
1998
1999 case SYMBOL_GOTOFF_PAGE:
2000 case SYMBOL_GOTOFF_DISP:
2001 case SYMBOL_GOTOFF_CALL:
2002 case SYMBOL_GOTOFF_LOADGP:
2003 case SYMBOL_64_HIGH:
2004 case SYMBOL_64_MID:
2005 case SYMBOL_64_LOW:
2006 case SYMBOL_TLSGD:
2007 case SYMBOL_TLSLDM:
2008 case SYMBOL_DTPREL:
2009 case SYMBOL_GOTTPREL:
2010 case SYMBOL_TPREL:
2011 case SYMBOL_HALF:
2012 /* A 16-bit constant formed by a single relocation, or a 32-bit
2013 constant formed from a high 16-bit relocation and a low 16-bit
2014 relocation. Use mips_split_p to determine which. 32-bit
2015 constants need an "lui; addiu" sequence for normal mode and
2016 an "li; sll; addiu" sequence for MIPS16 mode. */
2017 return !mips_split_p[type] ? 1 : TARGET_MIPS16 ? 3 : 2;
2018
2019 case SYMBOL_TLS:
2020 /* We don't treat a bare TLS symbol as a constant. */
2021 return 0;
2022 }
2023 gcc_unreachable ();
2024 }
2025
2026 /* If MODE is MAX_MACHINE_MODE, return the number of instructions needed
2027 to load symbols of type TYPE into a register. Return 0 if the given
2028 type of symbol cannot be used as an immediate operand.
2029
2030 Otherwise, return the number of instructions needed to load or store
2031 values of mode MODE to or from addresses of type TYPE. Return 0 if
2032 the given type of symbol is not valid in addresses.
2033
2034 In both cases, instruction counts are based off BASE_INSN_LENGTH. */
2035
2036 static int
2037 mips_symbol_insns (enum mips_symbol_type type, enum machine_mode mode)
2038 {
2039 return mips_symbol_insns_1 (type, mode) * (TARGET_MIPS16 ? 2 : 1);
2040 }
2041 \f
2042 /* A for_each_rtx callback. Stop the search if *X references a
2043 thread-local symbol. */
2044
2045 static int
2046 mips_tls_symbol_ref_1 (rtx *x, void *data ATTRIBUTE_UNUSED)
2047 {
2048 return mips_tls_symbol_p (*x);
2049 }
2050
2051 /* Implement TARGET_CANNOT_FORCE_CONST_MEM. */
2052
2053 static bool
2054 mips_cannot_force_const_mem (enum machine_mode mode, rtx x)
2055 {
2056 enum mips_symbol_type type;
2057 rtx base, offset;
2058
2059 /* There is no assembler syntax for expressing an address-sized
2060 high part. */
2061 if (GET_CODE (x) == HIGH)
2062 return true;
2063
2064 /* As an optimization, reject constants that mips_legitimize_move
2065 can expand inline.
2066
2067 Suppose we have a multi-instruction sequence that loads constant C
2068 into register R. If R does not get allocated a hard register, and
2069 R is used in an operand that allows both registers and memory
2070 references, reload will consider forcing C into memory and using
2071 one of the instruction's memory alternatives. Returning false
2072 here will force it to use an input reload instead. */
2073 if (CONST_INT_P (x) && mips_legitimate_constant_p (mode, x))
2074 return true;
2075
2076 split_const (x, &base, &offset);
2077 if (mips_symbolic_constant_p (base, SYMBOL_CONTEXT_LEA, &type))
2078 {
2079 /* See whether we explicitly want these symbols in the pool. */
2080 if (mips_use_pcrel_pool_p[(int) type])
2081 return false;
2082
2083 /* The same optimization as for CONST_INT. */
2084 if (SMALL_INT (offset) && mips_symbol_insns (type, MAX_MACHINE_MODE) > 0)
2085 return true;
2086
2087 /* If MIPS16 constant pools live in the text section, they should
2088 not refer to anything that might need run-time relocation. */
2089 if (TARGET_MIPS16_PCREL_LOADS && mips_got_symbol_type_p (type))
2090 return true;
2091 }
2092
2093 /* TLS symbols must be computed by mips_legitimize_move. */
2094 if (for_each_rtx (&x, &mips_tls_symbol_ref_1, NULL))
2095 return true;
2096
2097 return false;
2098 }
2099
2100 /* Implement TARGET_USE_BLOCKS_FOR_CONSTANT_P. We can't use blocks for
2101 constants when we're using a per-function constant pool. */
2102
2103 static bool
2104 mips_use_blocks_for_constant_p (enum machine_mode mode ATTRIBUTE_UNUSED,
2105 const_rtx x ATTRIBUTE_UNUSED)
2106 {
2107 return !TARGET_MIPS16_PCREL_LOADS;
2108 }
2109 \f
2110 /* Return true if register REGNO is a valid base register for mode MODE.
2111 STRICT_P is true if REG_OK_STRICT is in effect. */
2112
2113 int
2114 mips_regno_mode_ok_for_base_p (int regno, enum machine_mode mode,
2115 bool strict_p)
2116 {
2117 if (!HARD_REGISTER_NUM_P (regno))
2118 {
2119 if (!strict_p)
2120 return true;
2121 regno = reg_renumber[regno];
2122 }
2123
2124 /* These fake registers will be eliminated to either the stack or
2125 hard frame pointer, both of which are usually valid base registers.
2126 Reload deals with the cases where the eliminated form isn't valid. */
2127 if (regno == ARG_POINTER_REGNUM || regno == FRAME_POINTER_REGNUM)
2128 return true;
2129
2130 /* In MIPS16 mode, the stack pointer can only address word and doubleword
2131 values, nothing smaller. There are two problems here:
2132
2133 (a) Instantiating virtual registers can introduce new uses of the
2134 stack pointer. If these virtual registers are valid addresses,
2135 the stack pointer should be too.
2136
2137 (b) Most uses of the stack pointer are not made explicit until
2138 FRAME_POINTER_REGNUM and ARG_POINTER_REGNUM have been eliminated.
2139 We don't know until that stage whether we'll be eliminating to the
2140 stack pointer (which needs the restriction) or the hard frame
2141 pointer (which doesn't).
2142
2143 All in all, it seems more consistent to only enforce this restriction
2144 during and after reload. */
2145 if (TARGET_MIPS16 && regno == STACK_POINTER_REGNUM)
2146 return !strict_p || GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8;
2147
2148 return TARGET_MIPS16 ? M16_REG_P (regno) : GP_REG_P (regno);
2149 }
2150
2151 /* Return true if X is a valid base register for mode MODE.
2152 STRICT_P is true if REG_OK_STRICT is in effect. */
2153
2154 static bool
2155 mips_valid_base_register_p (rtx x, enum machine_mode mode, bool strict_p)
2156 {
2157 if (!strict_p && GET_CODE (x) == SUBREG)
2158 x = SUBREG_REG (x);
2159
2160 return (REG_P (x)
2161 && mips_regno_mode_ok_for_base_p (REGNO (x), mode, strict_p));
2162 }
2163
2164 /* Return true if, for every base register BASE_REG, (plus BASE_REG X)
2165 can address a value of mode MODE. */
2166
2167 static bool
2168 mips_valid_offset_p (rtx x, enum machine_mode mode)
2169 {
2170 /* Check that X is a signed 16-bit number. */
2171 if (!const_arith_operand (x, Pmode))
2172 return false;
2173
2174 /* We may need to split multiword moves, so make sure that every word
2175 is accessible. */
2176 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2177 && !SMALL_OPERAND (INTVAL (x) + GET_MODE_SIZE (mode) - UNITS_PER_WORD))
2178 return false;
2179
2180 return true;
2181 }
2182
2183 /* Return true if a LO_SUM can address a value of mode MODE when the
2184 LO_SUM symbol has type SYMBOL_TYPE. */
2185
2186 static bool
2187 mips_valid_lo_sum_p (enum mips_symbol_type symbol_type, enum machine_mode mode)
2188 {
2189 /* Check that symbols of type SYMBOL_TYPE can be used to access values
2190 of mode MODE. */
2191 if (mips_symbol_insns (symbol_type, mode) == 0)
2192 return false;
2193
2194 /* Check that there is a known low-part relocation. */
2195 if (mips_lo_relocs[symbol_type] == NULL)
2196 return false;
2197
2198 /* We may need to split multiword moves, so make sure that each word
2199 can be accessed without inducing a carry. This is mainly needed
2200 for o64, which has historically only guaranteed 64-bit alignment
2201 for 128-bit types. */
2202 if (GET_MODE_SIZE (mode) > UNITS_PER_WORD
2203 && GET_MODE_BITSIZE (mode) > GET_MODE_ALIGNMENT (mode))
2204 return false;
2205
2206 return true;
2207 }
2208
2209 /* Return true if X is a valid address for machine mode MODE. If it is,
2210 fill in INFO appropriately. STRICT_P is true if REG_OK_STRICT is in
2211 effect. */
2212
2213 static bool
2214 mips_classify_address (struct mips_address_info *info, rtx x,
2215 enum machine_mode mode, bool strict_p)
2216 {
2217 switch (GET_CODE (x))
2218 {
2219 case REG:
2220 case SUBREG:
2221 info->type = ADDRESS_REG;
2222 info->reg = x;
2223 info->offset = const0_rtx;
2224 return mips_valid_base_register_p (info->reg, mode, strict_p);
2225
2226 case PLUS:
2227 info->type = ADDRESS_REG;
2228 info->reg = XEXP (x, 0);
2229 info->offset = XEXP (x, 1);
2230 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2231 && mips_valid_offset_p (info->offset, mode));
2232
2233 case LO_SUM:
2234 info->type = ADDRESS_LO_SUM;
2235 info->reg = XEXP (x, 0);
2236 info->offset = XEXP (x, 1);
2237 /* We have to trust the creator of the LO_SUM to do something vaguely
2238 sane. Target-independent code that creates a LO_SUM should also
2239 create and verify the matching HIGH. Target-independent code that
2240 adds an offset to a LO_SUM must prove that the offset will not
2241 induce a carry. Failure to do either of these things would be
2242 a bug, and we are not required to check for it here. The MIPS
2243 backend itself should only create LO_SUMs for valid symbolic
2244 constants, with the high part being either a HIGH or a copy
2245 of _gp. */
2246 info->symbol_type
2247 = mips_classify_symbolic_expression (info->offset, SYMBOL_CONTEXT_MEM);
2248 return (mips_valid_base_register_p (info->reg, mode, strict_p)
2249 && mips_valid_lo_sum_p (info->symbol_type, mode));
2250
2251 case CONST_INT:
2252 /* Small-integer addresses don't occur very often, but they
2253 are legitimate if $0 is a valid base register. */
2254 info->type = ADDRESS_CONST_INT;
2255 return !TARGET_MIPS16 && SMALL_INT (x);
2256
2257 case CONST:
2258 case LABEL_REF:
2259 case SYMBOL_REF:
2260 info->type = ADDRESS_SYMBOLIC;
2261 return (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_MEM,
2262 &info->symbol_type)
2263 && mips_symbol_insns (info->symbol_type, mode) > 0
2264 && !mips_split_p[info->symbol_type]);
2265
2266 default:
2267 return false;
2268 }
2269 }
2270
2271 /* Implement TARGET_LEGITIMATE_ADDRESS_P. */
2272
2273 static bool
2274 mips_legitimate_address_p (enum machine_mode mode, rtx x, bool strict_p)
2275 {
2276 struct mips_address_info addr;
2277
2278 return mips_classify_address (&addr, x, mode, strict_p);
2279 }
2280
2281 /* Return true if X is a legitimate $sp-based address for mode MDOE. */
2282
2283 bool
2284 mips_stack_address_p (rtx x, enum machine_mode mode)
2285 {
2286 struct mips_address_info addr;
2287
2288 return (mips_classify_address (&addr, x, mode, false)
2289 && addr.type == ADDRESS_REG
2290 && addr.reg == stack_pointer_rtx);
2291 }
2292
2293 /* Return true if ADDR matches the pattern for the LWXS load scaled indexed
2294 address instruction. Note that such addresses are not considered
2295 legitimate in the TARGET_LEGITIMATE_ADDRESS_P sense, because their use
2296 is so restricted. */
2297
2298 static bool
2299 mips_lwxs_address_p (rtx addr)
2300 {
2301 if (ISA_HAS_LWXS
2302 && GET_CODE (addr) == PLUS
2303 && REG_P (XEXP (addr, 1)))
2304 {
2305 rtx offset = XEXP (addr, 0);
2306 if (GET_CODE (offset) == MULT
2307 && REG_P (XEXP (offset, 0))
2308 && CONST_INT_P (XEXP (offset, 1))
2309 && INTVAL (XEXP (offset, 1)) == 4)
2310 return true;
2311 }
2312 return false;
2313 }
2314
2315 /* Return true if ADDR matches the pattern for the L{B,H,W,D}{,U}X load
2316 indexed address instruction. Note that such addresses are
2317 not considered legitimate in the TARGET_LEGITIMATE_ADDRESS_P
2318 sense, because their use is so restricted. */
2319
2320 static bool
2321 mips_lx_address_p (rtx addr, enum machine_mode mode)
2322 {
2323 if (GET_CODE (addr) != PLUS
2324 || !REG_P (XEXP (addr, 0))
2325 || !REG_P (XEXP (addr, 1)))
2326 return false;
2327 if (ISA_HAS_LBX && mode == QImode)
2328 return true;
2329 if (ISA_HAS_LHX && mode == HImode)
2330 return true;
2331 if (ISA_HAS_LWX && mode == SImode)
2332 return true;
2333 if (ISA_HAS_LDX && mode == DImode)
2334 return true;
2335 return false;
2336 }
2337 \f
2338 /* Return true if a value at OFFSET bytes from base register BASE can be
2339 accessed using an unextended MIPS16 instruction. MODE is the mode of
2340 the value.
2341
2342 Usually the offset in an unextended instruction is a 5-bit field.
2343 The offset is unsigned and shifted left once for LH and SH, twice
2344 for LW and SW, and so on. An exception is LWSP and SWSP, which have
2345 an 8-bit immediate field that's shifted left twice. */
2346
2347 static bool
2348 mips16_unextended_reference_p (enum machine_mode mode, rtx base,
2349 unsigned HOST_WIDE_INT offset)
2350 {
2351 if (mode != BLKmode && offset % GET_MODE_SIZE (mode) == 0)
2352 {
2353 if (GET_MODE_SIZE (mode) == 4 && base == stack_pointer_rtx)
2354 return offset < 256U * GET_MODE_SIZE (mode);
2355 return offset < 32U * GET_MODE_SIZE (mode);
2356 }
2357 return false;
2358 }
2359
2360 /* Return the number of instructions needed to load or store a value
2361 of mode MODE at address X, assuming that BASE_INSN_LENGTH is the
2362 length of one instruction. Return 0 if X isn't valid for MODE.
2363 Assume that multiword moves may need to be split into word moves
2364 if MIGHT_SPLIT_P, otherwise assume that a single load or store is
2365 enough. */
2366
2367 int
2368 mips_address_insns (rtx x, enum machine_mode mode, bool might_split_p)
2369 {
2370 struct mips_address_info addr;
2371 int factor;
2372
2373 /* BLKmode is used for single unaligned loads and stores and should
2374 not count as a multiword mode. (GET_MODE_SIZE (BLKmode) is pretty
2375 meaningless, so we have to single it out as a special case one way
2376 or the other.) */
2377 if (mode != BLKmode && might_split_p)
2378 factor = (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
2379 else
2380 factor = 1;
2381
2382 if (mips_classify_address (&addr, x, mode, false))
2383 switch (addr.type)
2384 {
2385 case ADDRESS_REG:
2386 if (TARGET_MIPS16
2387 && !mips16_unextended_reference_p (mode, addr.reg,
2388 UINTVAL (addr.offset)))
2389 return factor * 2;
2390 return factor;
2391
2392 case ADDRESS_LO_SUM:
2393 return TARGET_MIPS16 ? factor * 2 : factor;
2394
2395 case ADDRESS_CONST_INT:
2396 return factor;
2397
2398 case ADDRESS_SYMBOLIC:
2399 return factor * mips_symbol_insns (addr.symbol_type, mode);
2400 }
2401 return 0;
2402 }
2403
2404 /* Return true if X fits within an unsigned field of BITS bits that is
2405 shifted left SHIFT bits before being used. */
2406
2407 bool
2408 mips_unsigned_immediate_p (unsigned HOST_WIDE_INT x, int bits, int shift = 0)
2409 {
2410 return (x & ((1 << shift) - 1)) == 0 && x < ((unsigned) 1 << (shift + bits));
2411 }
2412
2413 /* Return true if X fits within a signed field of BITS bits that is
2414 shifted left SHIFT bits before being used. */
2415
2416 bool
2417 mips_signed_immediate_p (unsigned HOST_WIDE_INT x, int bits, int shift = 0)
2418 {
2419 x += 1 << (bits + shift - 1);
2420 return mips_unsigned_immediate_p (x, bits, shift);
2421 }
2422
2423 /* Return true if X is legitimate for accessing values of mode MODE,
2424 if it is based on a MIPS16 register, and if the offset satisfies
2425 OFFSET_PREDICATE. */
2426
2427 bool
2428 m16_based_address_p (rtx x, enum machine_mode mode,
2429 insn_operand_predicate_fn offset_predicate)
2430 {
2431 struct mips_address_info addr;
2432
2433 return (mips_classify_address (&addr, x, mode, false)
2434 && addr.type == ADDRESS_REG
2435 && M16_REG_P (REGNO (addr.reg))
2436 && offset_predicate (addr.offset, mode));
2437 }
2438
2439 /* Return true if X is a legitimate address that conforms to the requirements
2440 for a microMIPS LWSP or SWSP insn. */
2441
2442 bool
2443 lwsp_swsp_address_p (rtx x, enum machine_mode mode)
2444 {
2445 struct mips_address_info addr;
2446
2447 return (mips_classify_address (&addr, x, mode, false)
2448 && addr.type == ADDRESS_REG
2449 && REGNO (addr.reg) == STACK_POINTER_REGNUM
2450 && uw5_operand (addr.offset, mode));
2451 }
2452
2453 /* Return true if X is a legitimate address with a 12-bit offset.
2454 MODE is the mode of the value being accessed. */
2455
2456 bool
2457 umips_12bit_offset_address_p (rtx x, enum machine_mode mode)
2458 {
2459 struct mips_address_info addr;
2460
2461 return (mips_classify_address (&addr, x, mode, false)
2462 && addr.type == ADDRESS_REG
2463 && CONST_INT_P (addr.offset)
2464 && UMIPS_12BIT_OFFSET_P (INTVAL (addr.offset)));
2465 }
2466
2467 /* Return the number of instructions needed to load constant X,
2468 assuming that BASE_INSN_LENGTH is the length of one instruction.
2469 Return 0 if X isn't a valid constant. */
2470
2471 int
2472 mips_const_insns (rtx x)
2473 {
2474 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
2475 enum mips_symbol_type symbol_type;
2476 rtx offset;
2477
2478 switch (GET_CODE (x))
2479 {
2480 case HIGH:
2481 if (!mips_symbolic_constant_p (XEXP (x, 0), SYMBOL_CONTEXT_LEA,
2482 &symbol_type)
2483 || !mips_split_p[symbol_type])
2484 return 0;
2485
2486 /* This is simply an LUI for normal mode. It is an extended
2487 LI followed by an extended SLL for MIPS16. */
2488 return TARGET_MIPS16 ? 4 : 1;
2489
2490 case CONST_INT:
2491 if (TARGET_MIPS16)
2492 /* Unsigned 8-bit constants can be loaded using an unextended
2493 LI instruction. Unsigned 16-bit constants can be loaded
2494 using an extended LI. Negative constants must be loaded
2495 using LI and then negated. */
2496 return (IN_RANGE (INTVAL (x), 0, 255) ? 1
2497 : SMALL_OPERAND_UNSIGNED (INTVAL (x)) ? 2
2498 : IN_RANGE (-INTVAL (x), 0, 255) ? 2
2499 : SMALL_OPERAND_UNSIGNED (-INTVAL (x)) ? 3
2500 : 0);
2501
2502 return mips_build_integer (codes, INTVAL (x));
2503
2504 case CONST_DOUBLE:
2505 case CONST_VECTOR:
2506 /* Allow zeros for normal mode, where we can use $0. */
2507 return !TARGET_MIPS16 && x == CONST0_RTX (GET_MODE (x)) ? 1 : 0;
2508
2509 case CONST:
2510 if (CONST_GP_P (x))
2511 return 1;
2512
2513 /* See if we can refer to X directly. */
2514 if (mips_symbolic_constant_p (x, SYMBOL_CONTEXT_LEA, &symbol_type))
2515 return mips_symbol_insns (symbol_type, MAX_MACHINE_MODE);
2516
2517 /* Otherwise try splitting the constant into a base and offset.
2518 If the offset is a 16-bit value, we can load the base address
2519 into a register and then use (D)ADDIU to add in the offset.
2520 If the offset is larger, we can load the base and offset
2521 into separate registers and add them together with (D)ADDU.
2522 However, the latter is only possible before reload; during
2523 and after reload, we must have the option of forcing the
2524 constant into the pool instead. */
2525 split_const (x, &x, &offset);
2526 if (offset != 0)
2527 {
2528 int n = mips_const_insns (x);
2529 if (n != 0)
2530 {
2531 if (SMALL_INT (offset))
2532 return n + 1;
2533 else if (!targetm.cannot_force_const_mem (GET_MODE (x), x))
2534 return n + 1 + mips_build_integer (codes, INTVAL (offset));
2535 }
2536 }
2537 return 0;
2538
2539 case SYMBOL_REF:
2540 case LABEL_REF:
2541 return mips_symbol_insns (mips_classify_symbol (x, SYMBOL_CONTEXT_LEA),
2542 MAX_MACHINE_MODE);
2543
2544 default:
2545 return 0;
2546 }
2547 }
2548
2549 /* X is a doubleword constant that can be handled by splitting it into
2550 two words and loading each word separately. Return the number of
2551 instructions required to do this, assuming that BASE_INSN_LENGTH
2552 is the length of one instruction. */
2553
2554 int
2555 mips_split_const_insns (rtx x)
2556 {
2557 unsigned int low, high;
2558
2559 low = mips_const_insns (mips_subword (x, false));
2560 high = mips_const_insns (mips_subword (x, true));
2561 gcc_assert (low > 0 && high > 0);
2562 return low + high;
2563 }
2564
2565 /* Return the number of instructions needed to implement INSN,
2566 given that it loads from or stores to MEM. Assume that
2567 BASE_INSN_LENGTH is the length of one instruction. */
2568
2569 int
2570 mips_load_store_insns (rtx mem, rtx insn)
2571 {
2572 enum machine_mode mode;
2573 bool might_split_p;
2574 rtx set;
2575
2576 gcc_assert (MEM_P (mem));
2577 mode = GET_MODE (mem);
2578
2579 /* Try to prove that INSN does not need to be split. */
2580 might_split_p = GET_MODE_SIZE (mode) > UNITS_PER_WORD;
2581 if (might_split_p)
2582 {
2583 set = single_set (insn);
2584 if (set && !mips_split_move_insn_p (SET_DEST (set), SET_SRC (set), insn))
2585 might_split_p = false;
2586 }
2587
2588 return mips_address_insns (XEXP (mem, 0), mode, might_split_p);
2589 }
2590
2591 /* Return the number of instructions needed for an integer division,
2592 assuming that BASE_INSN_LENGTH is the length of one instruction. */
2593
2594 int
2595 mips_idiv_insns (void)
2596 {
2597 int count;
2598
2599 count = 1;
2600 if (TARGET_CHECK_ZERO_DIV)
2601 {
2602 if (GENERATE_DIVIDE_TRAPS)
2603 count++;
2604 else
2605 count += 2;
2606 }
2607
2608 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
2609 count++;
2610 return count;
2611 }
2612 \f
2613 /* Emit a move from SRC to DEST. Assume that the move expanders can
2614 handle all moves if !can_create_pseudo_p (). The distinction is
2615 important because, unlike emit_move_insn, the move expanders know
2616 how to force Pmode objects into the constant pool even when the
2617 constant pool address is not itself legitimate. */
2618
2619 rtx
2620 mips_emit_move (rtx dest, rtx src)
2621 {
2622 return (can_create_pseudo_p ()
2623 ? emit_move_insn (dest, src)
2624 : emit_move_insn_1 (dest, src));
2625 }
2626
2627 /* Emit a move from SRC to DEST, splitting compound moves into individual
2628 instructions. SPLIT_TYPE is the type of split to perform. */
2629
2630 static void
2631 mips_emit_move_or_split (rtx dest, rtx src, enum mips_split_type split_type)
2632 {
2633 if (mips_split_move_p (dest, src, split_type))
2634 mips_split_move (dest, src, split_type);
2635 else
2636 mips_emit_move (dest, src);
2637 }
2638
2639 /* Emit an instruction of the form (set TARGET (CODE OP0)). */
2640
2641 static void
2642 mips_emit_unary (enum rtx_code code, rtx target, rtx op0)
2643 {
2644 emit_insn (gen_rtx_SET (VOIDmode, target,
2645 gen_rtx_fmt_e (code, GET_MODE (op0), op0)));
2646 }
2647
2648 /* Compute (CODE OP0) and store the result in a new register of mode MODE.
2649 Return that new register. */
2650
2651 static rtx
2652 mips_force_unary (enum machine_mode mode, enum rtx_code code, rtx op0)
2653 {
2654 rtx reg;
2655
2656 reg = gen_reg_rtx (mode);
2657 mips_emit_unary (code, reg, op0);
2658 return reg;
2659 }
2660
2661 /* Emit an instruction of the form (set TARGET (CODE OP0 OP1)). */
2662
2663 void
2664 mips_emit_binary (enum rtx_code code, rtx target, rtx op0, rtx op1)
2665 {
2666 emit_insn (gen_rtx_SET (VOIDmode, target,
2667 gen_rtx_fmt_ee (code, GET_MODE (target), op0, op1)));
2668 }
2669
2670 /* Compute (CODE OP0 OP1) and store the result in a new register
2671 of mode MODE. Return that new register. */
2672
2673 static rtx
2674 mips_force_binary (enum machine_mode mode, enum rtx_code code, rtx op0, rtx op1)
2675 {
2676 rtx reg;
2677
2678 reg = gen_reg_rtx (mode);
2679 mips_emit_binary (code, reg, op0, op1);
2680 return reg;
2681 }
2682
2683 /* Copy VALUE to a register and return that register. If new pseudos
2684 are allowed, copy it into a new register, otherwise use DEST. */
2685
2686 static rtx
2687 mips_force_temporary (rtx dest, rtx value)
2688 {
2689 if (can_create_pseudo_p ())
2690 return force_reg (Pmode, value);
2691 else
2692 {
2693 mips_emit_move (dest, value);
2694 return dest;
2695 }
2696 }
2697
2698 /* Emit a call sequence with call pattern PATTERN and return the call
2699 instruction itself (which is not necessarily the last instruction
2700 emitted). ORIG_ADDR is the original, unlegitimized address,
2701 ADDR is the legitimized form, and LAZY_P is true if the call
2702 address is lazily-bound. */
2703
2704 static rtx
2705 mips_emit_call_insn (rtx pattern, rtx orig_addr, rtx addr, bool lazy_p)
2706 {
2707 rtx insn, reg;
2708
2709 insn = emit_call_insn (pattern);
2710
2711 if (TARGET_MIPS16 && mips_use_pic_fn_addr_reg_p (orig_addr))
2712 {
2713 /* MIPS16 JALRs only take MIPS16 registers. If the target
2714 function requires $25 to be valid on entry, we must copy it
2715 there separately. The move instruction can be put in the
2716 call's delay slot. */
2717 reg = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
2718 emit_insn_before (gen_move_insn (reg, addr), insn);
2719 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), reg);
2720 }
2721
2722 if (lazy_p)
2723 /* Lazy-binding stubs require $gp to be valid on entry. */
2724 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), pic_offset_table_rtx);
2725
2726 if (TARGET_USE_GOT)
2727 {
2728 /* See the comment above load_call<mode> for details. */
2729 use_reg (&CALL_INSN_FUNCTION_USAGE (insn),
2730 gen_rtx_REG (Pmode, GOT_VERSION_REGNUM));
2731 emit_insn (gen_update_got_version ());
2732 }
2733 return insn;
2734 }
2735 \f
2736 /* Wrap symbol or label BASE in an UNSPEC address of type SYMBOL_TYPE,
2737 then add CONST_INT OFFSET to the result. */
2738
2739 static rtx
2740 mips_unspec_address_offset (rtx base, rtx offset,
2741 enum mips_symbol_type symbol_type)
2742 {
2743 base = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, base),
2744 UNSPEC_ADDRESS_FIRST + symbol_type);
2745 if (offset != const0_rtx)
2746 base = gen_rtx_PLUS (Pmode, base, offset);
2747 return gen_rtx_CONST (Pmode, base);
2748 }
2749
2750 /* Return an UNSPEC address with underlying address ADDRESS and symbol
2751 type SYMBOL_TYPE. */
2752
2753 rtx
2754 mips_unspec_address (rtx address, enum mips_symbol_type symbol_type)
2755 {
2756 rtx base, offset;
2757
2758 split_const (address, &base, &offset);
2759 return mips_unspec_address_offset (base, offset, symbol_type);
2760 }
2761
2762 /* If OP is an UNSPEC address, return the address to which it refers,
2763 otherwise return OP itself. */
2764
2765 rtx
2766 mips_strip_unspec_address (rtx op)
2767 {
2768 rtx base, offset;
2769
2770 split_const (op, &base, &offset);
2771 if (UNSPEC_ADDRESS_P (base))
2772 op = plus_constant (Pmode, UNSPEC_ADDRESS (base), INTVAL (offset));
2773 return op;
2774 }
2775
2776 /* If mips_unspec_address (ADDR, SYMBOL_TYPE) is a 32-bit value, add the
2777 high part to BASE and return the result. Just return BASE otherwise.
2778 TEMP is as for mips_force_temporary.
2779
2780 The returned expression can be used as the first operand to a LO_SUM. */
2781
2782 static rtx
2783 mips_unspec_offset_high (rtx temp, rtx base, rtx addr,
2784 enum mips_symbol_type symbol_type)
2785 {
2786 if (mips_split_p[symbol_type])
2787 {
2788 addr = gen_rtx_HIGH (Pmode, mips_unspec_address (addr, symbol_type));
2789 addr = mips_force_temporary (temp, addr);
2790 base = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, addr, base));
2791 }
2792 return base;
2793 }
2794 \f
2795 /* Return an instruction that copies $gp into register REG. We want
2796 GCC to treat the register's value as constant, so that its value
2797 can be rematerialized on demand. */
2798
2799 static rtx
2800 gen_load_const_gp (rtx reg)
2801 {
2802 return PMODE_INSN (gen_load_const_gp, (reg));
2803 }
2804
2805 /* Return a pseudo register that contains the value of $gp throughout
2806 the current function. Such registers are needed by MIPS16 functions,
2807 for which $gp itself is not a valid base register or addition operand. */
2808
2809 static rtx
2810 mips16_gp_pseudo_reg (void)
2811 {
2812 if (cfun->machine->mips16_gp_pseudo_rtx == NULL_RTX)
2813 {
2814 rtx insn, scan;
2815
2816 cfun->machine->mips16_gp_pseudo_rtx = gen_reg_rtx (Pmode);
2817
2818 push_topmost_sequence ();
2819
2820 scan = get_insns ();
2821 while (NEXT_INSN (scan) && !INSN_P (NEXT_INSN (scan)))
2822 scan = NEXT_INSN (scan);
2823
2824 insn = gen_load_const_gp (cfun->machine->mips16_gp_pseudo_rtx);
2825 insn = emit_insn_after (insn, scan);
2826 INSN_LOCATION (insn) = 0;
2827
2828 pop_topmost_sequence ();
2829 }
2830
2831 return cfun->machine->mips16_gp_pseudo_rtx;
2832 }
2833
2834 /* Return a base register that holds pic_offset_table_rtx.
2835 TEMP, if nonnull, is a scratch Pmode base register. */
2836
2837 rtx
2838 mips_pic_base_register (rtx temp)
2839 {
2840 if (!TARGET_MIPS16)
2841 return pic_offset_table_rtx;
2842
2843 if (currently_expanding_to_rtl)
2844 return mips16_gp_pseudo_reg ();
2845
2846 if (can_create_pseudo_p ())
2847 temp = gen_reg_rtx (Pmode);
2848
2849 if (TARGET_USE_GOT)
2850 /* The first post-reload split exposes all references to $gp
2851 (both uses and definitions). All references must remain
2852 explicit after that point.
2853
2854 It is safe to introduce uses of $gp at any time, so for
2855 simplicity, we do that before the split too. */
2856 mips_emit_move (temp, pic_offset_table_rtx);
2857 else
2858 emit_insn (gen_load_const_gp (temp));
2859 return temp;
2860 }
2861
2862 /* Return the RHS of a load_call<mode> insn. */
2863
2864 static rtx
2865 mips_unspec_call (rtx reg, rtx symbol)
2866 {
2867 rtvec vec;
2868
2869 vec = gen_rtvec (3, reg, symbol, gen_rtx_REG (SImode, GOT_VERSION_REGNUM));
2870 return gen_rtx_UNSPEC (Pmode, vec, UNSPEC_LOAD_CALL);
2871 }
2872
2873 /* If SRC is the RHS of a load_call<mode> insn, return the underlying symbol
2874 reference. Return NULL_RTX otherwise. */
2875
2876 static rtx
2877 mips_strip_unspec_call (rtx src)
2878 {
2879 if (GET_CODE (src) == UNSPEC && XINT (src, 1) == UNSPEC_LOAD_CALL)
2880 return mips_strip_unspec_address (XVECEXP (src, 0, 1));
2881 return NULL_RTX;
2882 }
2883
2884 /* Create and return a GOT reference of type TYPE for address ADDR.
2885 TEMP, if nonnull, is a scratch Pmode base register. */
2886
2887 rtx
2888 mips_got_load (rtx temp, rtx addr, enum mips_symbol_type type)
2889 {
2890 rtx base, high, lo_sum_symbol;
2891
2892 base = mips_pic_base_register (temp);
2893
2894 /* If we used the temporary register to load $gp, we can't use
2895 it for the high part as well. */
2896 if (temp != NULL && reg_overlap_mentioned_p (base, temp))
2897 temp = NULL;
2898
2899 high = mips_unspec_offset_high (temp, base, addr, type);
2900 lo_sum_symbol = mips_unspec_address (addr, type);
2901
2902 if (type == SYMBOL_GOTOFF_CALL)
2903 return mips_unspec_call (high, lo_sum_symbol);
2904 else
2905 return PMODE_INSN (gen_unspec_got, (high, lo_sum_symbol));
2906 }
2907
2908 /* If MODE is MAX_MACHINE_MODE, ADDR appears as a move operand, otherwise
2909 it appears in a MEM of that mode. Return true if ADDR is a legitimate
2910 constant in that context and can be split into high and low parts.
2911 If so, and if LOW_OUT is nonnull, emit the high part and store the
2912 low part in *LOW_OUT. Leave *LOW_OUT unchanged otherwise.
2913
2914 TEMP is as for mips_force_temporary and is used to load the high
2915 part into a register.
2916
2917 When MODE is MAX_MACHINE_MODE, the low part is guaranteed to be
2918 a legitimize SET_SRC for an .md pattern, otherwise the low part
2919 is guaranteed to be a legitimate address for mode MODE. */
2920
2921 bool
2922 mips_split_symbol (rtx temp, rtx addr, enum machine_mode mode, rtx *low_out)
2923 {
2924 enum mips_symbol_context context;
2925 enum mips_symbol_type symbol_type;
2926 rtx high;
2927
2928 context = (mode == MAX_MACHINE_MODE
2929 ? SYMBOL_CONTEXT_LEA
2930 : SYMBOL_CONTEXT_MEM);
2931 if (GET_CODE (addr) == HIGH && context == SYMBOL_CONTEXT_LEA)
2932 {
2933 addr = XEXP (addr, 0);
2934 if (mips_symbolic_constant_p (addr, context, &symbol_type)
2935 && mips_symbol_insns (symbol_type, mode) > 0
2936 && mips_split_hi_p[symbol_type])
2937 {
2938 if (low_out)
2939 switch (symbol_type)
2940 {
2941 case SYMBOL_GOT_PAGE_OFST:
2942 /* The high part of a page/ofst pair is loaded from the GOT. */
2943 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_PAGE);
2944 break;
2945
2946 default:
2947 gcc_unreachable ();
2948 }
2949 return true;
2950 }
2951 }
2952 else
2953 {
2954 if (mips_symbolic_constant_p (addr, context, &symbol_type)
2955 && mips_symbol_insns (symbol_type, mode) > 0
2956 && mips_split_p[symbol_type])
2957 {
2958 if (low_out)
2959 switch (symbol_type)
2960 {
2961 case SYMBOL_GOT_DISP:
2962 /* SYMBOL_GOT_DISP symbols are loaded from the GOT. */
2963 *low_out = mips_got_load (temp, addr, SYMBOL_GOTOFF_DISP);
2964 break;
2965
2966 case SYMBOL_GP_RELATIVE:
2967 high = mips_pic_base_register (temp);
2968 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
2969 break;
2970
2971 default:
2972 high = gen_rtx_HIGH (Pmode, copy_rtx (addr));
2973 high = mips_force_temporary (temp, high);
2974 *low_out = gen_rtx_LO_SUM (Pmode, high, addr);
2975 break;
2976 }
2977 return true;
2978 }
2979 }
2980 return false;
2981 }
2982
2983 /* Return a legitimate address for REG + OFFSET. TEMP is as for
2984 mips_force_temporary; it is only needed when OFFSET is not a
2985 SMALL_OPERAND. */
2986
2987 static rtx
2988 mips_add_offset (rtx temp, rtx reg, HOST_WIDE_INT offset)
2989 {
2990 if (!SMALL_OPERAND (offset))
2991 {
2992 rtx high;
2993
2994 if (TARGET_MIPS16)
2995 {
2996 /* Load the full offset into a register so that we can use
2997 an unextended instruction for the address itself. */
2998 high = GEN_INT (offset);
2999 offset = 0;
3000 }
3001 else
3002 {
3003 /* Leave OFFSET as a 16-bit offset and put the excess in HIGH.
3004 The addition inside the macro CONST_HIGH_PART may cause an
3005 overflow, so we need to force a sign-extension check. */
3006 high = gen_int_mode (CONST_HIGH_PART (offset), Pmode);
3007 offset = CONST_LOW_PART (offset);
3008 }
3009 high = mips_force_temporary (temp, high);
3010 reg = mips_force_temporary (temp, gen_rtx_PLUS (Pmode, high, reg));
3011 }
3012 return plus_constant (Pmode, reg, offset);
3013 }
3014 \f
3015 /* The __tls_get_attr symbol. */
3016 static GTY(()) rtx mips_tls_symbol;
3017
3018 /* Return an instruction sequence that calls __tls_get_addr. SYM is
3019 the TLS symbol we are referencing and TYPE is the symbol type to use
3020 (either global dynamic or local dynamic). V0 is an RTX for the
3021 return value location. */
3022
3023 static rtx
3024 mips_call_tls_get_addr (rtx sym, enum mips_symbol_type type, rtx v0)
3025 {
3026 rtx insn, loc, a0;
3027
3028 a0 = gen_rtx_REG (Pmode, GP_ARG_FIRST);
3029
3030 if (!mips_tls_symbol)
3031 mips_tls_symbol = init_one_libfunc ("__tls_get_addr");
3032
3033 loc = mips_unspec_address (sym, type);
3034
3035 start_sequence ();
3036
3037 emit_insn (gen_rtx_SET (Pmode, a0,
3038 gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, loc)));
3039 insn = mips_expand_call (MIPS_CALL_NORMAL, v0, mips_tls_symbol,
3040 const0_rtx, NULL_RTX, false);
3041 RTL_CONST_CALL_P (insn) = 1;
3042 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), a0);
3043 insn = get_insns ();
3044
3045 end_sequence ();
3046
3047 return insn;
3048 }
3049
3050 /* Return a pseudo register that contains the current thread pointer. */
3051
3052 rtx
3053 mips_expand_thread_pointer (rtx tp)
3054 {
3055 rtx fn;
3056
3057 if (TARGET_MIPS16)
3058 {
3059 mips_need_mips16_rdhwr_p = true;
3060 fn = mips16_stub_function ("__mips16_rdhwr");
3061 SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_LOCAL;
3062 if (!call_insn_operand (fn, VOIDmode))
3063 fn = force_reg (Pmode, fn);
3064 emit_insn (PMODE_INSN (gen_tls_get_tp_mips16, (tp, fn)));
3065 }
3066 else
3067 emit_insn (PMODE_INSN (gen_tls_get_tp, (tp)));
3068 return tp;
3069 }
3070
3071 static rtx
3072 mips_get_tp (void)
3073 {
3074 return mips_expand_thread_pointer (gen_reg_rtx (Pmode));
3075 }
3076
3077 /* Generate the code to access LOC, a thread-local SYMBOL_REF, and return
3078 its address. The return value will be both a valid address and a valid
3079 SET_SRC (either a REG or a LO_SUM). */
3080
3081 static rtx
3082 mips_legitimize_tls_address (rtx loc)
3083 {
3084 rtx dest, insn, v0, tp, tmp1, tmp2, eqv, offset;
3085 enum tls_model model;
3086
3087 model = SYMBOL_REF_TLS_MODEL (loc);
3088 /* Only TARGET_ABICALLS code can have more than one module; other
3089 code must be be static and should not use a GOT. All TLS models
3090 reduce to local exec in this situation. */
3091 if (!TARGET_ABICALLS)
3092 model = TLS_MODEL_LOCAL_EXEC;
3093
3094 switch (model)
3095 {
3096 case TLS_MODEL_GLOBAL_DYNAMIC:
3097 v0 = gen_rtx_REG (Pmode, GP_RETURN);
3098 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSGD, v0);
3099 dest = gen_reg_rtx (Pmode);
3100 emit_libcall_block (insn, dest, v0, loc);
3101 break;
3102
3103 case TLS_MODEL_LOCAL_DYNAMIC:
3104 v0 = gen_rtx_REG (Pmode, GP_RETURN);
3105 insn = mips_call_tls_get_addr (loc, SYMBOL_TLSLDM, v0);
3106 tmp1 = gen_reg_rtx (Pmode);
3107
3108 /* Attach a unique REG_EQUIV, to allow the RTL optimizers to
3109 share the LDM result with other LD model accesses. */
3110 eqv = gen_rtx_UNSPEC (Pmode, gen_rtvec (1, const0_rtx),
3111 UNSPEC_TLS_LDM);
3112 emit_libcall_block (insn, tmp1, v0, eqv);
3113
3114 offset = mips_unspec_address (loc, SYMBOL_DTPREL);
3115 if (mips_split_p[SYMBOL_DTPREL])
3116 {
3117 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_DTPREL);
3118 dest = gen_rtx_LO_SUM (Pmode, tmp2, offset);
3119 }
3120 else
3121 dest = expand_binop (Pmode, add_optab, tmp1, offset,
3122 0, 0, OPTAB_DIRECT);
3123 break;
3124
3125 case TLS_MODEL_INITIAL_EXEC:
3126 tp = mips_get_tp ();
3127 tmp1 = gen_reg_rtx (Pmode);
3128 tmp2 = mips_unspec_address (loc, SYMBOL_GOTTPREL);
3129 if (Pmode == DImode)
3130 emit_insn (gen_load_gotdi (tmp1, pic_offset_table_rtx, tmp2));
3131 else
3132 emit_insn (gen_load_gotsi (tmp1, pic_offset_table_rtx, tmp2));
3133 dest = gen_reg_rtx (Pmode);
3134 emit_insn (gen_add3_insn (dest, tmp1, tp));
3135 break;
3136
3137 case TLS_MODEL_LOCAL_EXEC:
3138 tmp1 = mips_get_tp ();
3139 offset = mips_unspec_address (loc, SYMBOL_TPREL);
3140 if (mips_split_p[SYMBOL_TPREL])
3141 {
3142 tmp2 = mips_unspec_offset_high (NULL, tmp1, loc, SYMBOL_TPREL);
3143 dest = gen_rtx_LO_SUM (Pmode, tmp2, offset);
3144 }
3145 else
3146 dest = expand_binop (Pmode, add_optab, tmp1, offset,
3147 0, 0, OPTAB_DIRECT);
3148 break;
3149
3150 default:
3151 gcc_unreachable ();
3152 }
3153 return dest;
3154 }
3155 \f
3156 /* If X is not a valid address for mode MODE, force it into a register. */
3157
3158 static rtx
3159 mips_force_address (rtx x, enum machine_mode mode)
3160 {
3161 if (!mips_legitimate_address_p (mode, x, false))
3162 x = force_reg (Pmode, x);
3163 return x;
3164 }
3165
3166 /* This function is used to implement LEGITIMIZE_ADDRESS. If X can
3167 be legitimized in a way that the generic machinery might not expect,
3168 return a new address, otherwise return NULL. MODE is the mode of
3169 the memory being accessed. */
3170
3171 static rtx
3172 mips_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED,
3173 enum machine_mode mode)
3174 {
3175 rtx base, addr;
3176 HOST_WIDE_INT offset;
3177
3178 if (mips_tls_symbol_p (x))
3179 return mips_legitimize_tls_address (x);
3180
3181 /* See if the address can split into a high part and a LO_SUM. */
3182 if (mips_split_symbol (NULL, x, mode, &addr))
3183 return mips_force_address (addr, mode);
3184
3185 /* Handle BASE + OFFSET using mips_add_offset. */
3186 mips_split_plus (x, &base, &offset);
3187 if (offset != 0)
3188 {
3189 if (!mips_valid_base_register_p (base, mode, false))
3190 base = copy_to_mode_reg (Pmode, base);
3191 addr = mips_add_offset (NULL, base, offset);
3192 return mips_force_address (addr, mode);
3193 }
3194
3195 return x;
3196 }
3197
3198 /* Load VALUE into DEST. TEMP is as for mips_force_temporary. */
3199
3200 void
3201 mips_move_integer (rtx temp, rtx dest, unsigned HOST_WIDE_INT value)
3202 {
3203 struct mips_integer_op codes[MIPS_MAX_INTEGER_OPS];
3204 enum machine_mode mode;
3205 unsigned int i, num_ops;
3206 rtx x;
3207
3208 mode = GET_MODE (dest);
3209 num_ops = mips_build_integer (codes, value);
3210
3211 /* Apply each binary operation to X. Invariant: X is a legitimate
3212 source operand for a SET pattern. */
3213 x = GEN_INT (codes[0].value);
3214 for (i = 1; i < num_ops; i++)
3215 {
3216 if (!can_create_pseudo_p ())
3217 {
3218 emit_insn (gen_rtx_SET (VOIDmode, temp, x));
3219 x = temp;
3220 }
3221 else
3222 x = force_reg (mode, x);
3223 x = gen_rtx_fmt_ee (codes[i].code, mode, x, GEN_INT (codes[i].value));
3224 }
3225
3226 emit_insn (gen_rtx_SET (VOIDmode, dest, x));
3227 }
3228
3229 /* Subroutine of mips_legitimize_move. Move constant SRC into register
3230 DEST given that SRC satisfies immediate_operand but doesn't satisfy
3231 move_operand. */
3232
3233 static void
3234 mips_legitimize_const_move (enum machine_mode mode, rtx dest, rtx src)
3235 {
3236 rtx base, offset;
3237
3238 /* Split moves of big integers into smaller pieces. */
3239 if (splittable_const_int_operand (src, mode))
3240 {
3241 mips_move_integer (dest, dest, INTVAL (src));
3242 return;
3243 }
3244
3245 /* Split moves of symbolic constants into high/low pairs. */
3246 if (mips_split_symbol (dest, src, MAX_MACHINE_MODE, &src))
3247 {
3248 emit_insn (gen_rtx_SET (VOIDmode, dest, src));
3249 return;
3250 }
3251
3252 /* Generate the appropriate access sequences for TLS symbols. */
3253 if (mips_tls_symbol_p (src))
3254 {
3255 mips_emit_move (dest, mips_legitimize_tls_address (src));
3256 return;
3257 }
3258
3259 /* If we have (const (plus symbol offset)), and that expression cannot
3260 be forced into memory, load the symbol first and add in the offset.
3261 In non-MIPS16 mode, prefer to do this even if the constant _can_ be
3262 forced into memory, as it usually produces better code. */
3263 split_const (src, &base, &offset);
3264 if (offset != const0_rtx
3265 && (targetm.cannot_force_const_mem (mode, src)
3266 || (!TARGET_MIPS16 && can_create_pseudo_p ())))
3267 {
3268 base = mips_force_temporary (dest, base);
3269 mips_emit_move (dest, mips_add_offset (NULL, base, INTVAL (offset)));
3270 return;
3271 }
3272
3273 src = force_const_mem (mode, src);
3274
3275 /* When using explicit relocs, constant pool references are sometimes
3276 not legitimate addresses. */
3277 mips_split_symbol (dest, XEXP (src, 0), mode, &XEXP (src, 0));
3278 mips_emit_move (dest, src);
3279 }
3280
3281 /* If (set DEST SRC) is not a valid move instruction, emit an equivalent
3282 sequence that is valid. */
3283
3284 bool
3285 mips_legitimize_move (enum machine_mode mode, rtx dest, rtx src)
3286 {
3287 if (!register_operand (dest, mode) && !reg_or_0_operand (src, mode))
3288 {
3289 mips_emit_move (dest, force_reg (mode, src));
3290 return true;
3291 }
3292
3293 /* We need to deal with constants that would be legitimate
3294 immediate_operands but aren't legitimate move_operands. */
3295 if (CONSTANT_P (src) && !move_operand (src, mode))
3296 {
3297 mips_legitimize_const_move (mode, dest, src);
3298 set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (src));
3299 return true;
3300 }
3301 return false;
3302 }
3303 \f
3304 /* Return true if value X in context CONTEXT is a small-data address
3305 that can be rewritten as a LO_SUM. */
3306
3307 static bool
3308 mips_rewrite_small_data_p (rtx x, enum mips_symbol_context context)
3309 {
3310 enum mips_symbol_type symbol_type;
3311
3312 return (mips_lo_relocs[SYMBOL_GP_RELATIVE]
3313 && !mips_split_p[SYMBOL_GP_RELATIVE]
3314 && mips_symbolic_constant_p (x, context, &symbol_type)
3315 && symbol_type == SYMBOL_GP_RELATIVE);
3316 }
3317
3318 /* A for_each_rtx callback for mips_small_data_pattern_p. DATA is the
3319 containing MEM, or null if none. */
3320
3321 static int
3322 mips_small_data_pattern_1 (rtx *loc, void *data)
3323 {
3324 enum mips_symbol_context context;
3325
3326 /* Ignore things like "g" constraints in asms. We make no particular
3327 guarantee about which symbolic constants are acceptable as asm operands
3328 versus which must be forced into a GPR. */
3329 if (GET_CODE (*loc) == LO_SUM || GET_CODE (*loc) == ASM_OPERANDS)
3330 return -1;
3331
3332 if (MEM_P (*loc))
3333 {
3334 if (for_each_rtx (&XEXP (*loc, 0), mips_small_data_pattern_1, *loc))
3335 return 1;
3336 return -1;
3337 }
3338
3339 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3340 return mips_rewrite_small_data_p (*loc, context);
3341 }
3342
3343 /* Return true if OP refers to small data symbols directly, not through
3344 a LO_SUM. */
3345
3346 bool
3347 mips_small_data_pattern_p (rtx op)
3348 {
3349 return for_each_rtx (&op, mips_small_data_pattern_1, NULL);
3350 }
3351
3352 /* A for_each_rtx callback, used by mips_rewrite_small_data.
3353 DATA is the containing MEM, or null if none. */
3354
3355 static int
3356 mips_rewrite_small_data_1 (rtx *loc, void *data)
3357 {
3358 enum mips_symbol_context context;
3359
3360 if (MEM_P (*loc))
3361 {
3362 for_each_rtx (&XEXP (*loc, 0), mips_rewrite_small_data_1, *loc);
3363 return -1;
3364 }
3365
3366 context = data ? SYMBOL_CONTEXT_MEM : SYMBOL_CONTEXT_LEA;
3367 if (mips_rewrite_small_data_p (*loc, context))
3368 *loc = gen_rtx_LO_SUM (Pmode, pic_offset_table_rtx, *loc);
3369
3370 if (GET_CODE (*loc) == LO_SUM)
3371 return -1;
3372
3373 return 0;
3374 }
3375
3376 /* Rewrite instruction pattern PATTERN so that it refers to small data
3377 using explicit relocations. */
3378
3379 rtx
3380 mips_rewrite_small_data (rtx pattern)
3381 {
3382 pattern = copy_insn (pattern);
3383 for_each_rtx (&pattern, mips_rewrite_small_data_1, NULL);
3384 return pattern;
3385 }
3386 \f
3387 /* The cost of loading values from the constant pool. It should be
3388 larger than the cost of any constant we want to synthesize inline. */
3389 #define CONSTANT_POOL_COST COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 8)
3390
3391 /* Return the cost of X when used as an operand to the MIPS16 instruction
3392 that implements CODE. Return -1 if there is no such instruction, or if
3393 X is not a valid immediate operand for it. */
3394
3395 static int
3396 mips16_constant_cost (int code, HOST_WIDE_INT x)
3397 {
3398 switch (code)
3399 {
3400 case ASHIFT:
3401 case ASHIFTRT:
3402 case LSHIFTRT:
3403 /* Shifts by between 1 and 8 bits (inclusive) are unextended,
3404 other shifts are extended. The shift patterns truncate the shift
3405 count to the right size, so there are no out-of-range values. */
3406 if (IN_RANGE (x, 1, 8))
3407 return 0;
3408 return COSTS_N_INSNS (1);
3409
3410 case PLUS:
3411 if (IN_RANGE (x, -128, 127))
3412 return 0;
3413 if (SMALL_OPERAND (x))
3414 return COSTS_N_INSNS (1);
3415 return -1;
3416
3417 case LEU:
3418 /* Like LE, but reject the always-true case. */
3419 if (x == -1)
3420 return -1;
3421 case LE:
3422 /* We add 1 to the immediate and use SLT. */
3423 x += 1;
3424 case XOR:
3425 /* We can use CMPI for an xor with an unsigned 16-bit X. */
3426 case LT:
3427 case LTU:
3428 if (IN_RANGE (x, 0, 255))
3429 return 0;
3430 if (SMALL_OPERAND_UNSIGNED (x))
3431 return COSTS_N_INSNS (1);
3432 return -1;
3433
3434 case EQ:
3435 case NE:
3436 /* Equality comparisons with 0 are cheap. */
3437 if (x == 0)
3438 return 0;
3439 return -1;
3440
3441 default:
3442 return -1;
3443 }
3444 }
3445
3446 /* Return true if there is a non-MIPS16 instruction that implements CODE
3447 and if that instruction accepts X as an immediate operand. */
3448
3449 static int
3450 mips_immediate_operand_p (int code, HOST_WIDE_INT x)
3451 {
3452 switch (code)
3453 {
3454 case ASHIFT:
3455 case ASHIFTRT:
3456 case LSHIFTRT:
3457 /* All shift counts are truncated to a valid constant. */
3458 return true;
3459
3460 case ROTATE:
3461 case ROTATERT:
3462 /* Likewise rotates, if the target supports rotates at all. */
3463 return ISA_HAS_ROR;
3464
3465 case AND:
3466 case IOR:
3467 case XOR:
3468 /* These instructions take 16-bit unsigned immediates. */
3469 return SMALL_OPERAND_UNSIGNED (x);
3470
3471 case PLUS:
3472 case LT:
3473 case LTU:
3474 /* These instructions take 16-bit signed immediates. */
3475 return SMALL_OPERAND (x);
3476
3477 case EQ:
3478 case NE:
3479 case GT:
3480 case GTU:
3481 /* The "immediate" forms of these instructions are really
3482 implemented as comparisons with register 0. */
3483 return x == 0;
3484
3485 case GE:
3486 case GEU:
3487 /* Likewise, meaning that the only valid immediate operand is 1. */
3488 return x == 1;
3489
3490 case LE:
3491 /* We add 1 to the immediate and use SLT. */
3492 return SMALL_OPERAND (x + 1);
3493
3494 case LEU:
3495 /* Likewise SLTU, but reject the always-true case. */
3496 return SMALL_OPERAND (x + 1) && x + 1 != 0;
3497
3498 case SIGN_EXTRACT:
3499 case ZERO_EXTRACT:
3500 /* The bit position and size are immediate operands. */
3501 return ISA_HAS_EXT_INS;
3502
3503 default:
3504 /* By default assume that $0 can be used for 0. */
3505 return x == 0;
3506 }
3507 }
3508
3509 /* Return the cost of binary operation X, given that the instruction
3510 sequence for a word-sized or smaller operation has cost SINGLE_COST
3511 and that the sequence of a double-word operation has cost DOUBLE_COST.
3512 If SPEED is true, optimize for speed otherwise optimize for size. */
3513
3514 static int
3515 mips_binary_cost (rtx x, int single_cost, int double_cost, bool speed)
3516 {
3517 int cost;
3518
3519 if (GET_MODE_SIZE (GET_MODE (x)) == UNITS_PER_WORD * 2)
3520 cost = double_cost;
3521 else
3522 cost = single_cost;
3523 return (cost
3524 + set_src_cost (XEXP (x, 0), speed)
3525 + rtx_cost (XEXP (x, 1), GET_CODE (x), 1, speed));
3526 }
3527
3528 /* Return the cost of floating-point multiplications of mode MODE. */
3529
3530 static int
3531 mips_fp_mult_cost (enum machine_mode mode)
3532 {
3533 return mode == DFmode ? mips_cost->fp_mult_df : mips_cost->fp_mult_sf;
3534 }
3535
3536 /* Return the cost of floating-point divisions of mode MODE. */
3537
3538 static int
3539 mips_fp_div_cost (enum machine_mode mode)
3540 {
3541 return mode == DFmode ? mips_cost->fp_div_df : mips_cost->fp_div_sf;
3542 }
3543
3544 /* Return the cost of sign-extending OP to mode MODE, not including the
3545 cost of OP itself. */
3546
3547 static int
3548 mips_sign_extend_cost (enum machine_mode mode, rtx op)
3549 {
3550 if (MEM_P (op))
3551 /* Extended loads are as cheap as unextended ones. */
3552 return 0;
3553
3554 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3555 /* A sign extension from SImode to DImode in 64-bit mode is free. */
3556 return 0;
3557
3558 if (ISA_HAS_SEB_SEH || GENERATE_MIPS16E)
3559 /* We can use SEB or SEH. */
3560 return COSTS_N_INSNS (1);
3561
3562 /* We need to use a shift left and a shift right. */
3563 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3564 }
3565
3566 /* Return the cost of zero-extending OP to mode MODE, not including the
3567 cost of OP itself. */
3568
3569 static int
3570 mips_zero_extend_cost (enum machine_mode mode, rtx op)
3571 {
3572 if (MEM_P (op))
3573 /* Extended loads are as cheap as unextended ones. */
3574 return 0;
3575
3576 if (TARGET_64BIT && mode == DImode && GET_MODE (op) == SImode)
3577 /* We need a shift left by 32 bits and a shift right by 32 bits. */
3578 return COSTS_N_INSNS (TARGET_MIPS16 ? 4 : 2);
3579
3580 if (GENERATE_MIPS16E)
3581 /* We can use ZEB or ZEH. */
3582 return COSTS_N_INSNS (1);
3583
3584 if (TARGET_MIPS16)
3585 /* We need to load 0xff or 0xffff into a register and use AND. */
3586 return COSTS_N_INSNS (GET_MODE (op) == QImode ? 2 : 3);
3587
3588 /* We can use ANDI. */
3589 return COSTS_N_INSNS (1);
3590 }
3591
3592 /* Return the cost of moving between two registers of mode MODE,
3593 assuming that the move will be in pieces of at most UNITS bytes. */
3594
3595 static int
3596 mips_set_reg_reg_piece_cost (enum machine_mode mode, unsigned int units)
3597 {
3598 return COSTS_N_INSNS ((GET_MODE_SIZE (mode) + units - 1) / units);
3599 }
3600
3601 /* Return the cost of moving between two registers of mode MODE. */
3602
3603 static int
3604 mips_set_reg_reg_cost (enum machine_mode mode)
3605 {
3606 switch (GET_MODE_CLASS (mode))
3607 {
3608 case MODE_CC:
3609 return mips_set_reg_reg_piece_cost (mode, GET_MODE_SIZE (CCmode));
3610
3611 case MODE_FLOAT:
3612 case MODE_COMPLEX_FLOAT:
3613 case MODE_VECTOR_FLOAT:
3614 if (TARGET_HARD_FLOAT)
3615 return mips_set_reg_reg_piece_cost (mode, UNITS_PER_HWFPVALUE);
3616 /* Fall through */
3617
3618 default:
3619 return mips_set_reg_reg_piece_cost (mode, UNITS_PER_WORD);
3620 }
3621 }
3622
3623 /* Return the cost of an operand X that can be trucated for free.
3624 SPEED says whether we're optimizing for size or speed. */
3625
3626 static int
3627 mips_truncated_op_cost (rtx x, bool speed)
3628 {
3629 if (GET_CODE (x) == TRUNCATE)
3630 x = XEXP (x, 0);
3631 return set_src_cost (x, speed);
3632 }
3633
3634 /* Implement TARGET_RTX_COSTS. */
3635
3636 static bool
3637 mips_rtx_costs (rtx x, int code, int outer_code, int opno ATTRIBUTE_UNUSED,
3638 int *total, bool speed)
3639 {
3640 enum machine_mode mode = GET_MODE (x);
3641 bool float_mode_p = FLOAT_MODE_P (mode);
3642 int cost;
3643 rtx addr;
3644
3645 /* The cost of a COMPARE is hard to define for MIPS. COMPAREs don't
3646 appear in the instruction stream, and the cost of a comparison is
3647 really the cost of the branch or scc condition. At the time of
3648 writing, GCC only uses an explicit outer COMPARE code when optabs
3649 is testing whether a constant is expensive enough to force into a
3650 register. We want optabs to pass such constants through the MIPS
3651 expanders instead, so make all constants very cheap here. */
3652 if (outer_code == COMPARE)
3653 {
3654 gcc_assert (CONSTANT_P (x));
3655 *total = 0;
3656 return true;
3657 }
3658
3659 switch (code)
3660 {
3661 case CONST_INT:
3662 /* Treat *clear_upper32-style ANDs as having zero cost in the
3663 second operand. The cost is entirely in the first operand.
3664
3665 ??? This is needed because we would otherwise try to CSE
3666 the constant operand. Although that's the right thing for
3667 instructions that continue to be a register operation throughout
3668 compilation, it is disastrous for instructions that could
3669 later be converted into a memory operation. */
3670 if (TARGET_64BIT
3671 && outer_code == AND
3672 && UINTVAL (x) == 0xffffffff)
3673 {
3674 *total = 0;
3675 return true;
3676 }
3677
3678 if (TARGET_MIPS16)
3679 {
3680 cost = mips16_constant_cost (outer_code, INTVAL (x));
3681 if (cost >= 0)
3682 {
3683 *total = cost;
3684 return true;
3685 }
3686 }
3687 else
3688 {
3689 /* When not optimizing for size, we care more about the cost
3690 of hot code, and hot code is often in a loop. If a constant
3691 operand needs to be forced into a register, we will often be
3692 able to hoist the constant load out of the loop, so the load
3693 should not contribute to the cost. */
3694 if (speed || mips_immediate_operand_p (outer_code, INTVAL (x)))
3695 {
3696 *total = 0;
3697 return true;
3698 }
3699 }
3700 /* Fall through. */
3701
3702 case CONST:
3703 case SYMBOL_REF:
3704 case LABEL_REF:
3705 case CONST_DOUBLE:
3706 if (force_to_mem_operand (x, VOIDmode))
3707 {
3708 *total = COSTS_N_INSNS (1);
3709 return true;
3710 }
3711 cost = mips_const_insns (x);
3712 if (cost > 0)
3713 {
3714 /* If the constant is likely to be stored in a GPR, SETs of
3715 single-insn constants are as cheap as register sets; we
3716 never want to CSE them.
3717
3718 Don't reduce the cost of storing a floating-point zero in
3719 FPRs. If we have a zero in an FPR for other reasons, we
3720 can get better cfg-cleanup and delayed-branch results by
3721 using it consistently, rather than using $0 sometimes and
3722 an FPR at other times. Also, moves between floating-point
3723 registers are sometimes cheaper than (D)MTC1 $0. */
3724 if (cost == 1
3725 && outer_code == SET
3726 && !(float_mode_p && TARGET_HARD_FLOAT))
3727 cost = 0;
3728 /* When non-MIPS16 code loads a constant N>1 times, we rarely
3729 want to CSE the constant itself. It is usually better to
3730 have N copies of the last operation in the sequence and one
3731 shared copy of the other operations. (Note that this is
3732 not true for MIPS16 code, where the final operation in the
3733 sequence is often an extended instruction.)
3734
3735 Also, if we have a CONST_INT, we don't know whether it is
3736 for a word or doubleword operation, so we cannot rely on
3737 the result of mips_build_integer. */
3738 else if (!TARGET_MIPS16
3739 && (outer_code == SET || mode == VOIDmode))
3740 cost = 1;
3741 *total = COSTS_N_INSNS (cost);
3742 return true;
3743 }
3744 /* The value will need to be fetched from the constant pool. */
3745 *total = CONSTANT_POOL_COST;
3746 return true;
3747
3748 case MEM:
3749 /* If the address is legitimate, return the number of
3750 instructions it needs. */
3751 addr = XEXP (x, 0);
3752 cost = mips_address_insns (addr, mode, true);
3753 if (cost > 0)
3754 {
3755 *total = COSTS_N_INSNS (cost + 1);
3756 return true;
3757 }
3758 /* Check for a scaled indexed address. */
3759 if (mips_lwxs_address_p (addr)
3760 || mips_lx_address_p (addr, mode))
3761 {
3762 *total = COSTS_N_INSNS (2);
3763 return true;
3764 }
3765 /* Otherwise use the default handling. */
3766 return false;
3767
3768 case FFS:
3769 *total = COSTS_N_INSNS (6);
3770 return false;
3771
3772 case NOT:
3773 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 2 : 1);
3774 return false;
3775
3776 case AND:
3777 /* Check for a *clear_upper32 pattern and treat it like a zero
3778 extension. See the pattern's comment for details. */
3779 if (TARGET_64BIT
3780 && mode == DImode
3781 && CONST_INT_P (XEXP (x, 1))
3782 && UINTVAL (XEXP (x, 1)) == 0xffffffff)
3783 {
3784 *total = (mips_zero_extend_cost (mode, XEXP (x, 0))
3785 + set_src_cost (XEXP (x, 0), speed));
3786 return true;
3787 }
3788 if (ISA_HAS_CINS && CONST_INT_P (XEXP (x, 1)))
3789 {
3790 rtx op = XEXP (x, 0);
3791 if (GET_CODE (op) == ASHIFT
3792 && CONST_INT_P (XEXP (op, 1))
3793 && mask_low_and_shift_p (mode, XEXP (x, 1), XEXP (op, 1), 32))
3794 {
3795 *total = COSTS_N_INSNS (1) + set_src_cost (XEXP (op, 0), speed);
3796 return true;
3797 }
3798 }
3799
3800 /* Fall through. */
3801
3802 case IOR:
3803 case XOR:
3804 /* Double-word operations use two single-word operations. */
3805 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (2),
3806 speed);
3807 return true;
3808
3809 case ASHIFT:
3810 case ASHIFTRT:
3811 case LSHIFTRT:
3812 case ROTATE:
3813 case ROTATERT:
3814 if (CONSTANT_P (XEXP (x, 1)))
3815 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4),
3816 speed);
3817 else
3818 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (12),
3819 speed);
3820 return true;
3821
3822 case ABS:
3823 if (float_mode_p)
3824 *total = mips_cost->fp_add;
3825 else
3826 *total = COSTS_N_INSNS (4);
3827 return false;
3828
3829 case LO_SUM:
3830 /* Low-part immediates need an extended MIPS16 instruction. */
3831 *total = (COSTS_N_INSNS (TARGET_MIPS16 ? 2 : 1)
3832 + set_src_cost (XEXP (x, 0), speed));
3833 return true;
3834
3835 case LT:
3836 case LTU:
3837 case LE:
3838 case LEU:
3839 case GT:
3840 case GTU:
3841 case GE:
3842 case GEU:
3843 case EQ:
3844 case NE:
3845 case UNORDERED:
3846 case LTGT:
3847 /* Branch comparisons have VOIDmode, so use the first operand's
3848 mode instead. */
3849 mode = GET_MODE (XEXP (x, 0));
3850 if (FLOAT_MODE_P (mode))
3851 {
3852 *total = mips_cost->fp_add;
3853 return false;
3854 }
3855 *total = mips_binary_cost (x, COSTS_N_INSNS (1), COSTS_N_INSNS (4),
3856 speed);
3857 return true;
3858
3859 case MINUS:
3860 if (float_mode_p
3861 && (ISA_HAS_NMADD4_NMSUB4 || ISA_HAS_NMADD3_NMSUB3)
3862 && TARGET_FUSED_MADD
3863 && !HONOR_NANS (mode)
3864 && !HONOR_SIGNED_ZEROS (mode))
3865 {
3866 /* See if we can use NMADD or NMSUB. See mips.md for the
3867 associated patterns. */
3868 rtx op0 = XEXP (x, 0);
3869 rtx op1 = XEXP (x, 1);
3870 if (GET_CODE (op0) == MULT && GET_CODE (XEXP (op0, 0)) == NEG)
3871 {
3872 *total = (mips_fp_mult_cost (mode)
3873 + set_src_cost (XEXP (XEXP (op0, 0), 0), speed)
3874 + set_src_cost (XEXP (op0, 1), speed)
3875 + set_src_cost (op1, speed));
3876 return true;
3877 }
3878 if (GET_CODE (op1) == MULT)
3879 {
3880 *total = (mips_fp_mult_cost (mode)
3881 + set_src_cost (op0, speed)
3882 + set_src_cost (XEXP (op1, 0), speed)
3883 + set_src_cost (XEXP (op1, 1), speed));
3884 return true;
3885 }
3886 }
3887 /* Fall through. */
3888
3889 case PLUS:
3890 if (float_mode_p)
3891 {
3892 /* If this is part of a MADD or MSUB, treat the PLUS as
3893 being free. */
3894 if ((ISA_HAS_FP_MADD4_MSUB4 || ISA_HAS_FP_MADD3_MSUB3)
3895 && TARGET_FUSED_MADD
3896 && GET_CODE (XEXP (x, 0)) == MULT)
3897 *total = 0;
3898 else
3899 *total = mips_cost->fp_add;
3900 return false;
3901 }
3902
3903 /* Double-word operations require three single-word operations and
3904 an SLTU. The MIPS16 version then needs to move the result of
3905 the SLTU from $24 to a MIPS16 register. */
3906 *total = mips_binary_cost (x, COSTS_N_INSNS (1),
3907 COSTS_N_INSNS (TARGET_MIPS16 ? 5 : 4),
3908 speed);
3909 return true;
3910
3911 case NEG:
3912 if (float_mode_p
3913 && (ISA_HAS_NMADD4_NMSUB4 || ISA_HAS_NMADD3_NMSUB3)
3914 && TARGET_FUSED_MADD
3915 && !HONOR_NANS (mode)
3916 && HONOR_SIGNED_ZEROS (mode))
3917 {
3918 /* See if we can use NMADD or NMSUB. See mips.md for the
3919 associated patterns. */
3920 rtx op = XEXP (x, 0);
3921 if ((GET_CODE (op) == PLUS || GET_CODE (op) == MINUS)
3922 && GET_CODE (XEXP (op, 0)) == MULT)
3923 {
3924 *total = (mips_fp_mult_cost (mode)
3925 + set_src_cost (XEXP (XEXP (op, 0), 0), speed)
3926 + set_src_cost (XEXP (XEXP (op, 0), 1), speed)
3927 + set_src_cost (XEXP (op, 1), speed));
3928 return true;
3929 }
3930 }
3931
3932 if (float_mode_p)
3933 *total = mips_cost->fp_add;
3934 else
3935 *total = COSTS_N_INSNS (GET_MODE_SIZE (mode) > UNITS_PER_WORD ? 4 : 1);
3936 return false;
3937
3938 case MULT:
3939 if (float_mode_p)
3940 *total = mips_fp_mult_cost (mode);
3941 else if (mode == DImode && !TARGET_64BIT)
3942 /* Synthesized from 2 mulsi3s, 1 mulsidi3 and two additions,
3943 where the mulsidi3 always includes an MFHI and an MFLO. */
3944 *total = (speed
3945 ? mips_cost->int_mult_si * 3 + 6
3946 : COSTS_N_INSNS (ISA_HAS_MUL3 ? 7 : 9));
3947 else if (!speed)
3948 *total = COSTS_N_INSNS (ISA_HAS_MUL3 ? 1 : 2) + 1;
3949 else if (mode == DImode)
3950 *total = mips_cost->int_mult_di;
3951 else
3952 *total = mips_cost->int_mult_si;
3953 return false;
3954
3955 case DIV:
3956 /* Check for a reciprocal. */
3957 if (float_mode_p
3958 && ISA_HAS_FP4
3959 && flag_unsafe_math_optimizations
3960 && XEXP (x, 0) == CONST1_RTX (mode))
3961 {
3962 if (outer_code == SQRT || GET_CODE (XEXP (x, 1)) == SQRT)
3963 /* An rsqrt<mode>a or rsqrt<mode>b pattern. Count the
3964 division as being free. */
3965 *total = set_src_cost (XEXP (x, 1), speed);
3966 else
3967 *total = (mips_fp_div_cost (mode)
3968 + set_src_cost (XEXP (x, 1), speed));
3969 return true;
3970 }
3971 /* Fall through. */
3972
3973 case SQRT:
3974 case MOD:
3975 if (float_mode_p)
3976 {
3977 *total = mips_fp_div_cost (mode);
3978 return false;
3979 }
3980 /* Fall through. */
3981
3982 case UDIV:
3983 case UMOD:
3984 if (!speed)
3985 {
3986 /* It is our responsibility to make division by a power of 2
3987 as cheap as 2 register additions if we want the division
3988 expanders to be used for such operations; see the setting
3989 of sdiv_pow2_cheap in optabs.c. Using (D)DIV for MIPS16
3990 should always produce shorter code than using
3991 expand_sdiv2_pow2. */
3992 if (TARGET_MIPS16
3993 && CONST_INT_P (XEXP (x, 1))
3994 && exact_log2 (INTVAL (XEXP (x, 1))) >= 0)
3995 {
3996 *total = COSTS_N_INSNS (2) + set_src_cost (XEXP (x, 0), speed);
3997 return true;
3998 }
3999 *total = COSTS_N_INSNS (mips_idiv_insns ());
4000 }
4001 else if (mode == DImode)
4002 *total = mips_cost->int_div_di;
4003 else
4004 *total = mips_cost->int_div_si;
4005 return false;
4006
4007 case SIGN_EXTEND:
4008 *total = mips_sign_extend_cost (mode, XEXP (x, 0));
4009 return false;
4010
4011 case ZERO_EXTEND:
4012 if (outer_code == SET
4013 && ISA_HAS_BADDU
4014 && GET_MODE (XEXP (x, 0)) == QImode
4015 && GET_CODE (XEXP (x, 0)) == PLUS)
4016 {
4017 rtx plus = XEXP (x, 0);
4018 *total = (COSTS_N_INSNS (1)
4019 + mips_truncated_op_cost (XEXP (plus, 0), speed)
4020 + mips_truncated_op_cost (XEXP (plus, 1), speed));
4021 return true;
4022 }
4023 *total = mips_zero_extend_cost (mode, XEXP (x, 0));
4024 return false;
4025
4026 case FLOAT:
4027 case UNSIGNED_FLOAT:
4028 case FIX:
4029 case FLOAT_EXTEND:
4030 case FLOAT_TRUNCATE:
4031 *total = mips_cost->fp_add;
4032 return false;
4033
4034 case SET:
4035 if (register_operand (SET_DEST (x), VOIDmode)
4036 && reg_or_0_operand (SET_SRC (x), VOIDmode))
4037 {
4038 *total = mips_set_reg_reg_cost (GET_MODE (SET_DEST (x)));
4039 return true;
4040 }
4041 return false;
4042
4043 default:
4044 return false;
4045 }
4046 }
4047
4048 /* Implement TARGET_ADDRESS_COST. */
4049
4050 static int
4051 mips_address_cost (rtx addr, enum machine_mode mode,
4052 addr_space_t as ATTRIBUTE_UNUSED,
4053 bool speed ATTRIBUTE_UNUSED)
4054 {
4055 return mips_address_insns (addr, mode, false);
4056 }
4057 \f
4058 /* Information about a single instruction in a multi-instruction
4059 asm sequence. */
4060 struct mips_multi_member {
4061 /* True if this is a label, false if it is code. */
4062 bool is_label_p;
4063
4064 /* The output_asm_insn format of the instruction. */
4065 const char *format;
4066
4067 /* The operands to the instruction. */
4068 rtx operands[MAX_RECOG_OPERANDS];
4069 };
4070 typedef struct mips_multi_member mips_multi_member;
4071
4072 /* The instructions that make up the current multi-insn sequence. */
4073 static vec<mips_multi_member> mips_multi_members;
4074
4075 /* How many instructions (as opposed to labels) are in the current
4076 multi-insn sequence. */
4077 static unsigned int mips_multi_num_insns;
4078
4079 /* Start a new multi-insn sequence. */
4080
4081 static void
4082 mips_multi_start (void)
4083 {
4084 mips_multi_members.truncate (0);
4085 mips_multi_num_insns = 0;
4086 }
4087
4088 /* Add a new, uninitialized member to the current multi-insn sequence. */
4089
4090 static struct mips_multi_member *
4091 mips_multi_add (void)
4092 {
4093 mips_multi_member empty;
4094 return mips_multi_members.safe_push (empty);
4095 }
4096
4097 /* Add a normal insn with the given asm format to the current multi-insn
4098 sequence. The other arguments are a null-terminated list of operands. */
4099
4100 static void
4101 mips_multi_add_insn (const char *format, ...)
4102 {
4103 struct mips_multi_member *member;
4104 va_list ap;
4105 unsigned int i;
4106 rtx op;
4107
4108 member = mips_multi_add ();
4109 member->is_label_p = false;
4110 member->format = format;
4111 va_start (ap, format);
4112 i = 0;
4113 while ((op = va_arg (ap, rtx)))
4114 member->operands[i++] = op;
4115 va_end (ap);
4116 mips_multi_num_insns++;
4117 }
4118
4119 /* Add the given label definition to the current multi-insn sequence.
4120 The definition should include the colon. */
4121
4122 static void
4123 mips_multi_add_label (const char *label)
4124 {
4125 struct mips_multi_member *member;
4126
4127 member = mips_multi_add ();
4128 member->is_label_p = true;
4129 member->format = label;
4130 }
4131
4132 /* Return the index of the last member of the current multi-insn sequence. */
4133
4134 static unsigned int
4135 mips_multi_last_index (void)
4136 {
4137 return mips_multi_members.length () - 1;
4138 }
4139
4140 /* Add a copy of an existing instruction to the current multi-insn
4141 sequence. I is the index of the instruction that should be copied. */
4142
4143 static void
4144 mips_multi_copy_insn (unsigned int i)
4145 {
4146 struct mips_multi_member *member;
4147
4148 member = mips_multi_add ();
4149 memcpy (member, &mips_multi_members[i], sizeof (*member));
4150 gcc_assert (!member->is_label_p);
4151 }
4152
4153 /* Change the operand of an existing instruction in the current
4154 multi-insn sequence. I is the index of the instruction,
4155 OP is the index of the operand, and X is the new value. */
4156
4157 static void
4158 mips_multi_set_operand (unsigned int i, unsigned int op, rtx x)
4159 {
4160 mips_multi_members[i].operands[op] = x;
4161 }
4162
4163 /* Write out the asm code for the current multi-insn sequence. */
4164
4165 static void
4166 mips_multi_write (void)
4167 {
4168 struct mips_multi_member *member;
4169 unsigned int i;
4170
4171 FOR_EACH_VEC_ELT (mips_multi_members, i, member)
4172 if (member->is_label_p)
4173 fprintf (asm_out_file, "%s\n", member->format);
4174 else
4175 output_asm_insn (member->format, member->operands);
4176 }
4177 \f
4178 /* Return one word of double-word value OP, taking into account the fixed
4179 endianness of certain registers. HIGH_P is true to select the high part,
4180 false to select the low part. */
4181
4182 rtx
4183 mips_subword (rtx op, bool high_p)
4184 {
4185 unsigned int byte, offset;
4186 enum machine_mode mode;
4187
4188 mode = GET_MODE (op);
4189 if (mode == VOIDmode)
4190 mode = TARGET_64BIT ? TImode : DImode;
4191
4192 if (TARGET_BIG_ENDIAN ? !high_p : high_p)
4193 byte = UNITS_PER_WORD;
4194 else
4195 byte = 0;
4196
4197 if (FP_REG_RTX_P (op))
4198 {
4199 /* Paired FPRs are always ordered little-endian. */
4200 offset = (UNITS_PER_WORD < UNITS_PER_HWFPVALUE ? high_p : byte != 0);
4201 return gen_rtx_REG (word_mode, REGNO (op) + offset);
4202 }
4203
4204 if (MEM_P (op))
4205 return mips_rewrite_small_data (adjust_address (op, word_mode, byte));
4206
4207 return simplify_gen_subreg (word_mode, op, mode, byte);
4208 }
4209
4210 /* Return true if SRC should be moved into DEST using "MULT $0, $0".
4211 SPLIT_TYPE is the condition under which moves should be split. */
4212
4213 static bool
4214 mips_mult_move_p (rtx dest, rtx src, enum mips_split_type split_type)
4215 {
4216 return ((split_type != SPLIT_FOR_SPEED
4217 || mips_tuning_info.fast_mult_zero_zero_p)
4218 && src == const0_rtx
4219 && REG_P (dest)
4220 && GET_MODE_SIZE (GET_MODE (dest)) == 2 * UNITS_PER_WORD
4221 && (ISA_HAS_DSP_MULT
4222 ? ACC_REG_P (REGNO (dest))
4223 : MD_REG_P (REGNO (dest))));
4224 }
4225
4226 /* Return true if a move from SRC to DEST should be split into two.
4227 SPLIT_TYPE describes the split condition. */
4228
4229 bool
4230 mips_split_move_p (rtx dest, rtx src, enum mips_split_type split_type)
4231 {
4232 /* Check whether the move can be done using some variant of MULT $0,$0. */
4233 if (mips_mult_move_p (dest, src, split_type))
4234 return false;
4235
4236 /* FPR-to-FPR moves can be done in a single instruction, if they're
4237 allowed at all. */
4238 unsigned int size = GET_MODE_SIZE (GET_MODE (dest));
4239 if (size == 8 && FP_REG_RTX_P (src) && FP_REG_RTX_P (dest))
4240 return false;
4241
4242 /* Check for floating-point loads and stores. */
4243 if (size == 8 && ISA_HAS_LDC1_SDC1)
4244 {
4245 if (FP_REG_RTX_P (dest) && MEM_P (src))
4246 return false;
4247 if (FP_REG_RTX_P (src) && MEM_P (dest))
4248 return false;
4249 }
4250
4251 /* Otherwise split all multiword moves. */
4252 return size > UNITS_PER_WORD;
4253 }
4254
4255 /* Split a move from SRC to DEST, given that mips_split_move_p holds.
4256 SPLIT_TYPE describes the split condition. */
4257
4258 void
4259 mips_split_move (rtx dest, rtx src, enum mips_split_type split_type)
4260 {
4261 rtx low_dest;
4262
4263 gcc_checking_assert (mips_split_move_p (dest, src, split_type));
4264 if (FP_REG_RTX_P (dest) || FP_REG_RTX_P (src))
4265 {
4266 if (!TARGET_64BIT && GET_MODE (dest) == DImode)
4267 emit_insn (gen_move_doubleword_fprdi (dest, src));
4268 else if (!TARGET_64BIT && GET_MODE (dest) == DFmode)
4269 emit_insn (gen_move_doubleword_fprdf (dest, src));
4270 else if (!TARGET_64BIT && GET_MODE (dest) == V2SFmode)
4271 emit_insn (gen_move_doubleword_fprv2sf (dest, src));
4272 else if (!TARGET_64BIT && GET_MODE (dest) == V2SImode)
4273 emit_insn (gen_move_doubleword_fprv2si (dest, src));
4274 else if (!TARGET_64BIT && GET_MODE (dest) == V4HImode)
4275 emit_insn (gen_move_doubleword_fprv4hi (dest, src));
4276 else if (!TARGET_64BIT && GET_MODE (dest) == V8QImode)
4277 emit_insn (gen_move_doubleword_fprv8qi (dest, src));
4278 else if (TARGET_64BIT && GET_MODE (dest) == TFmode)
4279 emit_insn (gen_move_doubleword_fprtf (dest, src));
4280 else
4281 gcc_unreachable ();
4282 }
4283 else if (REG_P (dest) && REGNO (dest) == MD_REG_FIRST)
4284 {
4285 low_dest = mips_subword (dest, false);
4286 mips_emit_move (low_dest, mips_subword (src, false));
4287 if (TARGET_64BIT)
4288 emit_insn (gen_mthidi_ti (dest, mips_subword (src, true), low_dest));
4289 else
4290 emit_insn (gen_mthisi_di (dest, mips_subword (src, true), low_dest));
4291 }
4292 else if (REG_P (src) && REGNO (src) == MD_REG_FIRST)
4293 {
4294 mips_emit_move (mips_subword (dest, false), mips_subword (src, false));
4295 if (TARGET_64BIT)
4296 emit_insn (gen_mfhidi_ti (mips_subword (dest, true), src));
4297 else
4298 emit_insn (gen_mfhisi_di (mips_subword (dest, true), src));
4299 }
4300 else
4301 {
4302 /* The operation can be split into two normal moves. Decide in
4303 which order to do them. */
4304 low_dest = mips_subword (dest, false);
4305 if (REG_P (low_dest)
4306 && reg_overlap_mentioned_p (low_dest, src))
4307 {
4308 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
4309 mips_emit_move (low_dest, mips_subword (src, false));
4310 }
4311 else
4312 {
4313 mips_emit_move (low_dest, mips_subword (src, false));
4314 mips_emit_move (mips_subword (dest, true), mips_subword (src, true));
4315 }
4316 }
4317 }
4318
4319 /* Return the split type for instruction INSN. */
4320
4321 static enum mips_split_type
4322 mips_insn_split_type (rtx insn)
4323 {
4324 basic_block bb = BLOCK_FOR_INSN (insn);
4325 if (bb)
4326 {
4327 if (optimize_bb_for_speed_p (bb))
4328 return SPLIT_FOR_SPEED;
4329 else
4330 return SPLIT_FOR_SIZE;
4331 }
4332 /* Once CFG information has been removed, we should trust the optimization
4333 decisions made by previous passes and only split where necessary. */
4334 return SPLIT_IF_NECESSARY;
4335 }
4336
4337 /* Return true if a move from SRC to DEST in INSN should be split. */
4338
4339 bool
4340 mips_split_move_insn_p (rtx dest, rtx src, rtx insn)
4341 {
4342 return mips_split_move_p (dest, src, mips_insn_split_type (insn));
4343 }
4344
4345 /* Split a move from SRC to DEST in INSN, given that mips_split_move_insn_p
4346 holds. */
4347
4348 void
4349 mips_split_move_insn (rtx dest, rtx src, rtx insn)
4350 {
4351 mips_split_move (dest, src, mips_insn_split_type (insn));
4352 }
4353 \f
4354 /* Return the appropriate instructions to move SRC into DEST. Assume
4355 that SRC is operand 1 and DEST is operand 0. */
4356
4357 const char *
4358 mips_output_move (rtx dest, rtx src)
4359 {
4360 enum rtx_code dest_code, src_code;
4361 enum machine_mode mode;
4362 enum mips_symbol_type symbol_type;
4363 bool dbl_p;
4364
4365 dest_code = GET_CODE (dest);
4366 src_code = GET_CODE (src);
4367 mode = GET_MODE (dest);
4368 dbl_p = (GET_MODE_SIZE (mode) == 8);
4369
4370 if (mips_split_move_p (dest, src, SPLIT_IF_NECESSARY))
4371 return "#";
4372
4373 if ((src_code == REG && GP_REG_P (REGNO (src)))
4374 || (!TARGET_MIPS16 && src == CONST0_RTX (mode)))
4375 {
4376 if (dest_code == REG)
4377 {
4378 if (GP_REG_P (REGNO (dest)))
4379 return "move\t%0,%z1";
4380
4381 if (mips_mult_move_p (dest, src, SPLIT_IF_NECESSARY))
4382 {
4383 if (ISA_HAS_DSP_MULT)
4384 return "mult\t%q0,%.,%.";
4385 else
4386 return "mult\t%.,%.";
4387 }
4388
4389 /* Moves to HI are handled by special .md insns. */
4390 if (REGNO (dest) == LO_REGNUM)
4391 return "mtlo\t%z1";
4392
4393 if (DSP_ACC_REG_P (REGNO (dest)))
4394 {
4395 static char retval[] = "mt__\t%z1,%q0";
4396
4397 retval[2] = reg_names[REGNO (dest)][4];
4398 retval[3] = reg_names[REGNO (dest)][5];
4399 return retval;
4400 }
4401
4402 if (FP_REG_P (REGNO (dest)))
4403 return dbl_p ? "dmtc1\t%z1,%0" : "mtc1\t%z1,%0";
4404
4405 if (ALL_COP_REG_P (REGNO (dest)))
4406 {
4407 static char retval[] = "dmtc_\t%z1,%0";
4408
4409 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
4410 return dbl_p ? retval : retval + 1;
4411 }
4412 }
4413 if (dest_code == MEM)
4414 switch (GET_MODE_SIZE (mode))
4415 {
4416 case 1: return "sb\t%z1,%0";
4417 case 2: return "sh\t%z1,%0";
4418 case 4: return "sw\t%z1,%0";
4419 case 8: return "sd\t%z1,%0";
4420 }
4421 }
4422 if (dest_code == REG && GP_REG_P (REGNO (dest)))
4423 {
4424 if (src_code == REG)
4425 {
4426 /* Moves from HI are handled by special .md insns. */
4427 if (REGNO (src) == LO_REGNUM)
4428 {
4429 /* When generating VR4120 or VR4130 code, we use MACC and
4430 DMACC instead of MFLO. This avoids both the normal
4431 MIPS III HI/LO hazards and the errata related to
4432 -mfix-vr4130. */
4433 if (ISA_HAS_MACCHI)
4434 return dbl_p ? "dmacc\t%0,%.,%." : "macc\t%0,%.,%.";
4435 return "mflo\t%0";
4436 }
4437
4438 if (DSP_ACC_REG_P (REGNO (src)))
4439 {
4440 static char retval[] = "mf__\t%0,%q1";
4441
4442 retval[2] = reg_names[REGNO (src)][4];
4443 retval[3] = reg_names[REGNO (src)][5];
4444 return retval;
4445 }
4446
4447 if (FP_REG_P (REGNO (src)))
4448 return dbl_p ? "dmfc1\t%0,%1" : "mfc1\t%0,%1";
4449
4450 if (ALL_COP_REG_P (REGNO (src)))
4451 {
4452 static char retval[] = "dmfc_\t%0,%1";
4453
4454 retval[4] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
4455 return dbl_p ? retval : retval + 1;
4456 }
4457 }
4458
4459 if (src_code == MEM)
4460 switch (GET_MODE_SIZE (mode))
4461 {
4462 case 1: return "lbu\t%0,%1";
4463 case 2: return "lhu\t%0,%1";
4464 case 4: return "lw\t%0,%1";
4465 case 8: return "ld\t%0,%1";
4466 }
4467
4468 if (src_code == CONST_INT)
4469 {
4470 /* Don't use the X format for the operand itself, because that
4471 will give out-of-range numbers for 64-bit hosts and 32-bit
4472 targets. */
4473 if (!TARGET_MIPS16)
4474 return "li\t%0,%1\t\t\t# %X1";
4475
4476 if (SMALL_OPERAND_UNSIGNED (INTVAL (src)))
4477 return "li\t%0,%1";
4478
4479 if (SMALL_OPERAND_UNSIGNED (-INTVAL (src)))
4480 return "#";
4481 }
4482
4483 if (src_code == HIGH)
4484 return TARGET_MIPS16 ? "#" : "lui\t%0,%h1";
4485
4486 if (CONST_GP_P (src))
4487 return "move\t%0,%1";
4488
4489 if (mips_symbolic_constant_p (src, SYMBOL_CONTEXT_LEA, &symbol_type)
4490 && mips_lo_relocs[symbol_type] != 0)
4491 {
4492 /* A signed 16-bit constant formed by applying a relocation
4493 operator to a symbolic address. */
4494 gcc_assert (!mips_split_p[symbol_type]);
4495 return "li\t%0,%R1";
4496 }
4497
4498 if (symbolic_operand (src, VOIDmode))
4499 {
4500 gcc_assert (TARGET_MIPS16
4501 ? TARGET_MIPS16_TEXT_LOADS
4502 : !TARGET_EXPLICIT_RELOCS);
4503 return dbl_p ? "dla\t%0,%1" : "la\t%0,%1";
4504 }
4505 }
4506 if (src_code == REG && FP_REG_P (REGNO (src)))
4507 {
4508 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4509 {
4510 if (GET_MODE (dest) == V2SFmode)
4511 return "mov.ps\t%0,%1";
4512 else
4513 return dbl_p ? "mov.d\t%0,%1" : "mov.s\t%0,%1";
4514 }
4515
4516 if (dest_code == MEM)
4517 return dbl_p ? "sdc1\t%1,%0" : "swc1\t%1,%0";
4518 }
4519 if (dest_code == REG && FP_REG_P (REGNO (dest)))
4520 {
4521 if (src_code == MEM)
4522 return dbl_p ? "ldc1\t%0,%1" : "lwc1\t%0,%1";
4523 }
4524 if (dest_code == REG && ALL_COP_REG_P (REGNO (dest)) && src_code == MEM)
4525 {
4526 static char retval[] = "l_c_\t%0,%1";
4527
4528 retval[1] = (dbl_p ? 'd' : 'w');
4529 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (dest));
4530 return retval;
4531 }
4532 if (dest_code == MEM && src_code == REG && ALL_COP_REG_P (REGNO (src)))
4533 {
4534 static char retval[] = "s_c_\t%1,%0";
4535
4536 retval[1] = (dbl_p ? 'd' : 'w');
4537 retval[3] = COPNUM_AS_CHAR_FROM_REGNUM (REGNO (src));
4538 return retval;
4539 }
4540 gcc_unreachable ();
4541 }
4542 \f
4543 /* Return true if CMP1 is a suitable second operand for integer ordering
4544 test CODE. See also the *sCC patterns in mips.md. */
4545
4546 static bool
4547 mips_int_order_operand_ok_p (enum rtx_code code, rtx cmp1)
4548 {
4549 switch (code)
4550 {
4551 case GT:
4552 case GTU:
4553 return reg_or_0_operand (cmp1, VOIDmode);
4554
4555 case GE:
4556 case GEU:
4557 return !TARGET_MIPS16 && cmp1 == const1_rtx;
4558
4559 case LT:
4560 case LTU:
4561 return arith_operand (cmp1, VOIDmode);
4562
4563 case LE:
4564 return sle_operand (cmp1, VOIDmode);
4565
4566 case LEU:
4567 return sleu_operand (cmp1, VOIDmode);
4568
4569 default:
4570 gcc_unreachable ();
4571 }
4572 }
4573
4574 /* Return true if *CMP1 (of mode MODE) is a valid second operand for
4575 integer ordering test *CODE, or if an equivalent combination can
4576 be formed by adjusting *CODE and *CMP1. When returning true, update
4577 *CODE and *CMP1 with the chosen code and operand, otherwise leave
4578 them alone. */
4579
4580 static bool
4581 mips_canonicalize_int_order_test (enum rtx_code *code, rtx *cmp1,
4582 enum machine_mode mode)
4583 {
4584 HOST_WIDE_INT plus_one;
4585
4586 if (mips_int_order_operand_ok_p (*code, *cmp1))
4587 return true;
4588
4589 if (CONST_INT_P (*cmp1))
4590 switch (*code)
4591 {
4592 case LE:
4593 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4594 if (INTVAL (*cmp1) < plus_one)
4595 {
4596 *code = LT;
4597 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4598 return true;
4599 }
4600 break;
4601
4602 case LEU:
4603 plus_one = trunc_int_for_mode (UINTVAL (*cmp1) + 1, mode);
4604 if (plus_one != 0)
4605 {
4606 *code = LTU;
4607 *cmp1 = force_reg (mode, GEN_INT (plus_one));
4608 return true;
4609 }
4610 break;
4611
4612 default:
4613 break;
4614 }
4615 return false;
4616 }
4617
4618 /* Compare CMP0 and CMP1 using ordering test CODE and store the result
4619 in TARGET. CMP0 and TARGET are register_operands. If INVERT_PTR
4620 is nonnull, it's OK to set TARGET to the inverse of the result and
4621 flip *INVERT_PTR instead. */
4622
4623 static void
4624 mips_emit_int_order_test (enum rtx_code code, bool *invert_ptr,
4625 rtx target, rtx cmp0, rtx cmp1)
4626 {
4627 enum machine_mode mode;
4628
4629 /* First see if there is a MIPS instruction that can do this operation.
4630 If not, try doing the same for the inverse operation. If that also
4631 fails, force CMP1 into a register and try again. */
4632 mode = GET_MODE (cmp0);
4633 if (mips_canonicalize_int_order_test (&code, &cmp1, mode))
4634 mips_emit_binary (code, target, cmp0, cmp1);
4635 else
4636 {
4637 enum rtx_code inv_code = reverse_condition (code);
4638 if (!mips_canonicalize_int_order_test (&inv_code, &cmp1, mode))
4639 {
4640 cmp1 = force_reg (mode, cmp1);
4641 mips_emit_int_order_test (code, invert_ptr, target, cmp0, cmp1);
4642 }
4643 else if (invert_ptr == 0)
4644 {
4645 rtx inv_target;
4646
4647 inv_target = mips_force_binary (GET_MODE (target),
4648 inv_code, cmp0, cmp1);
4649 mips_emit_binary (XOR, target, inv_target, const1_rtx);
4650 }
4651 else
4652 {
4653 *invert_ptr = !*invert_ptr;
4654 mips_emit_binary (inv_code, target, cmp0, cmp1);
4655 }
4656 }
4657 }
4658
4659 /* Return a register that is zero iff CMP0 and CMP1 are equal.
4660 The register will have the same mode as CMP0. */
4661
4662 static rtx
4663 mips_zero_if_equal (rtx cmp0, rtx cmp1)
4664 {
4665 if (cmp1 == const0_rtx)
4666 return cmp0;
4667
4668 if (uns_arith_operand (cmp1, VOIDmode))
4669 return expand_binop (GET_MODE (cmp0), xor_optab,
4670 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4671
4672 return expand_binop (GET_MODE (cmp0), sub_optab,
4673 cmp0, cmp1, 0, 0, OPTAB_DIRECT);
4674 }
4675
4676 /* Convert *CODE into a code that can be used in a floating-point
4677 scc instruction (C.cond.fmt). Return true if the values of
4678 the condition code registers will be inverted, with 0 indicating
4679 that the condition holds. */
4680
4681 static bool
4682 mips_reversed_fp_cond (enum rtx_code *code)
4683 {
4684 switch (*code)
4685 {
4686 case NE:
4687 case LTGT:
4688 case ORDERED:
4689 *code = reverse_condition_maybe_unordered (*code);
4690 return true;
4691
4692 default:
4693 return false;
4694 }
4695 }
4696
4697 /* Allocate a floating-point condition-code register of mode MODE.
4698
4699 These condition code registers are used for certain kinds
4700 of compound operation, such as compare and branches, vconds,
4701 and built-in functions. At expand time, their use is entirely
4702 controlled by MIPS-specific code and is entirely internal
4703 to these compound operations.
4704
4705 We could (and did in the past) expose condition-code values
4706 as pseudo registers and leave the register allocator to pick
4707 appropriate registers. The problem is that it is not practically
4708 possible for the rtl optimizers to guarantee that no spills will
4709 be needed, even when AVOID_CCMODE_COPIES is defined. We would
4710 therefore need spill and reload sequences to handle the worst case.
4711
4712 Although such sequences do exist, they are very expensive and are
4713 not something we'd want to use. This is especially true of CCV2 and
4714 CCV4, where all the shuffling would greatly outweigh whatever benefit
4715 the vectorization itself provides.
4716
4717 The main benefit of having more than one condition-code register
4718 is to allow the pipelining of operations, especially those involving
4719 comparisons and conditional moves. We don't really expect the
4720 registers to be live for long periods, and certainly never want
4721 them to be live across calls.
4722
4723 Also, there should be no penalty attached to using all the available
4724 registers. They are simply bits in the same underlying FPU control
4725 register.
4726
4727 We therefore expose the hardware registers from the outset and use
4728 a simple round-robin allocation scheme. */
4729
4730 static rtx
4731 mips_allocate_fcc (enum machine_mode mode)
4732 {
4733 unsigned int regno, count;
4734
4735 gcc_assert (TARGET_HARD_FLOAT && ISA_HAS_8CC);
4736
4737 if (mode == CCmode)
4738 count = 1;
4739 else if (mode == CCV2mode)
4740 count = 2;
4741 else if (mode == CCV4mode)
4742 count = 4;
4743 else
4744 gcc_unreachable ();
4745
4746 cfun->machine->next_fcc += -cfun->machine->next_fcc & (count - 1);
4747 if (cfun->machine->next_fcc > ST_REG_LAST - ST_REG_FIRST)
4748 cfun->machine->next_fcc = 0;
4749 regno = ST_REG_FIRST + cfun->machine->next_fcc;
4750 cfun->machine->next_fcc += count;
4751 return gen_rtx_REG (mode, regno);
4752 }
4753
4754 /* Convert a comparison into something that can be used in a branch or
4755 conditional move. On entry, *OP0 and *OP1 are the values being
4756 compared and *CODE is the code used to compare them.
4757
4758 Update *CODE, *OP0 and *OP1 so that they describe the final comparison.
4759 If NEED_EQ_NE_P, then only EQ or NE comparisons against zero are possible,
4760 otherwise any standard branch condition can be used. The standard branch
4761 conditions are:
4762
4763 - EQ or NE between two registers.
4764 - any comparison between a register and zero. */
4765
4766 static void
4767 mips_emit_compare (enum rtx_code *code, rtx *op0, rtx *op1, bool need_eq_ne_p)
4768 {
4769 rtx cmp_op0 = *op0;
4770 rtx cmp_op1 = *op1;
4771
4772 if (GET_MODE_CLASS (GET_MODE (*op0)) == MODE_INT)
4773 {
4774 if (!need_eq_ne_p && *op1 == const0_rtx)
4775 ;
4776 else if (*code == EQ || *code == NE)
4777 {
4778 if (need_eq_ne_p)
4779 {
4780 *op0 = mips_zero_if_equal (cmp_op0, cmp_op1);
4781 *op1 = const0_rtx;
4782 }
4783 else
4784 *op1 = force_reg (GET_MODE (cmp_op0), cmp_op1);
4785 }
4786 else
4787 {
4788 /* The comparison needs a separate scc instruction. Store the
4789 result of the scc in *OP0 and compare it against zero. */
4790 bool invert = false;
4791 *op0 = gen_reg_rtx (GET_MODE (cmp_op0));
4792 mips_emit_int_order_test (*code, &invert, *op0, cmp_op0, cmp_op1);
4793 *code = (invert ? EQ : NE);
4794 *op1 = const0_rtx;
4795 }
4796 }
4797 else if (ALL_FIXED_POINT_MODE_P (GET_MODE (cmp_op0)))
4798 {
4799 *op0 = gen_rtx_REG (CCDSPmode, CCDSP_CC_REGNUM);
4800 mips_emit_binary (*code, *op0, cmp_op0, cmp_op1);
4801 *code = NE;
4802 *op1 = const0_rtx;
4803 }
4804 else
4805 {
4806 enum rtx_code cmp_code;
4807
4808 /* Floating-point tests use a separate C.cond.fmt comparison to
4809 set a condition code register. The branch or conditional move
4810 will then compare that register against zero.
4811
4812 Set CMP_CODE to the code of the comparison instruction and
4813 *CODE to the code that the branch or move should use. */
4814 cmp_code = *code;
4815 *code = mips_reversed_fp_cond (&cmp_code) ? EQ : NE;
4816 *op0 = (ISA_HAS_8CC
4817 ? mips_allocate_fcc (CCmode)
4818 : gen_rtx_REG (CCmode, FPSW_REGNUM));
4819 *op1 = const0_rtx;
4820 mips_emit_binary (cmp_code, *op0, cmp_op0, cmp_op1);
4821 }
4822 }
4823 \f
4824 /* Try performing the comparison in OPERANDS[1], whose arms are OPERANDS[2]
4825 and OPERAND[3]. Store the result in OPERANDS[0].
4826
4827 On 64-bit targets, the mode of the comparison and target will always be
4828 SImode, thus possibly narrower than that of the comparison's operands. */
4829
4830 void
4831 mips_expand_scc (rtx operands[])
4832 {
4833 rtx target = operands[0];
4834 enum rtx_code code = GET_CODE (operands[1]);
4835 rtx op0 = operands[2];
4836 rtx op1 = operands[3];
4837
4838 gcc_assert (GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT);
4839
4840 if (code == EQ || code == NE)
4841 {
4842 if (ISA_HAS_SEQ_SNE
4843 && reg_imm10_operand (op1, GET_MODE (op1)))
4844 mips_emit_binary (code, target, op0, op1);
4845 else
4846 {
4847 rtx zie = mips_zero_if_equal (op0, op1);
4848 mips_emit_binary (code, target, zie, const0_rtx);
4849 }
4850 }
4851 else
4852 mips_emit_int_order_test (code, 0, target, op0, op1);
4853 }
4854
4855 /* Compare OPERANDS[1] with OPERANDS[2] using comparison code
4856 CODE and jump to OPERANDS[3] if the condition holds. */
4857
4858 void
4859 mips_expand_conditional_branch (rtx *operands)
4860 {
4861 enum rtx_code code = GET_CODE (operands[0]);
4862 rtx op0 = operands[1];
4863 rtx op1 = operands[2];
4864 rtx condition;
4865
4866 mips_emit_compare (&code, &op0, &op1, TARGET_MIPS16);
4867 condition = gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
4868 emit_jump_insn (gen_condjump (condition, operands[3]));
4869 }
4870
4871 /* Implement:
4872
4873 (set temp (COND:CCV2 CMP_OP0 CMP_OP1))
4874 (set DEST (unspec [TRUE_SRC FALSE_SRC temp] UNSPEC_MOVE_TF_PS)) */
4875
4876 void
4877 mips_expand_vcondv2sf (rtx dest, rtx true_src, rtx false_src,
4878 enum rtx_code cond, rtx cmp_op0, rtx cmp_op1)
4879 {
4880 rtx cmp_result;
4881 bool reversed_p;
4882
4883 reversed_p = mips_reversed_fp_cond (&cond);
4884 cmp_result = mips_allocate_fcc (CCV2mode);
4885 emit_insn (gen_scc_ps (cmp_result,
4886 gen_rtx_fmt_ee (cond, VOIDmode, cmp_op0, cmp_op1)));
4887 if (reversed_p)
4888 emit_insn (gen_mips_cond_move_tf_ps (dest, false_src, true_src,
4889 cmp_result));
4890 else
4891 emit_insn (gen_mips_cond_move_tf_ps (dest, true_src, false_src,
4892 cmp_result));
4893 }
4894
4895 /* Perform the comparison in OPERANDS[1]. Move OPERANDS[2] into OPERANDS[0]
4896 if the condition holds, otherwise move OPERANDS[3] into OPERANDS[0]. */
4897
4898 void
4899 mips_expand_conditional_move (rtx *operands)
4900 {
4901 rtx cond;
4902 enum rtx_code code = GET_CODE (operands[1]);
4903 rtx op0 = XEXP (operands[1], 0);
4904 rtx op1 = XEXP (operands[1], 1);
4905
4906 mips_emit_compare (&code, &op0, &op1, true);
4907 cond = gen_rtx_fmt_ee (code, GET_MODE (op0), op0, op1);
4908 emit_insn (gen_rtx_SET (VOIDmode, operands[0],
4909 gen_rtx_IF_THEN_ELSE (GET_MODE (operands[0]), cond,
4910 operands[2], operands[3])));
4911 }
4912
4913 /* Perform the comparison in COMPARISON, then trap if the condition holds. */
4914
4915 void
4916 mips_expand_conditional_trap (rtx comparison)
4917 {
4918 rtx op0, op1;
4919 enum machine_mode mode;
4920 enum rtx_code code;
4921
4922 /* MIPS conditional trap instructions don't have GT or LE flavors,
4923 so we must swap the operands and convert to LT and GE respectively. */
4924 code = GET_CODE (comparison);
4925 switch (code)
4926 {
4927 case GT:
4928 case LE:
4929 case GTU:
4930 case LEU:
4931 code = swap_condition (code);
4932 op0 = XEXP (comparison, 1);
4933 op1 = XEXP (comparison, 0);
4934 break;
4935
4936 default:
4937 op0 = XEXP (comparison, 0);
4938 op1 = XEXP (comparison, 1);
4939 break;
4940 }
4941
4942 mode = GET_MODE (XEXP (comparison, 0));
4943 op0 = force_reg (mode, op0);
4944 if (!arith_operand (op1, mode))
4945 op1 = force_reg (mode, op1);
4946
4947 emit_insn (gen_rtx_TRAP_IF (VOIDmode,
4948 gen_rtx_fmt_ee (code, mode, op0, op1),
4949 const0_rtx));
4950 }
4951 \f
4952 /* Initialize *CUM for a call to a function of type FNTYPE. */
4953
4954 void
4955 mips_init_cumulative_args (CUMULATIVE_ARGS *cum, tree fntype)
4956 {
4957 memset (cum, 0, sizeof (*cum));
4958 cum->prototype = (fntype && prototype_p (fntype));
4959 cum->gp_reg_found = (cum->prototype && stdarg_p (fntype));
4960 }
4961
4962 /* Fill INFO with information about a single argument. CUM is the
4963 cumulative state for earlier arguments. MODE is the mode of this
4964 argument and TYPE is its type (if known). NAMED is true if this
4965 is a named (fixed) argument rather than a variable one. */
4966
4967 static void
4968 mips_get_arg_info (struct mips_arg_info *info, const CUMULATIVE_ARGS *cum,
4969 enum machine_mode mode, const_tree type, bool named)
4970 {
4971 bool doubleword_aligned_p;
4972 unsigned int num_bytes, num_words, max_regs;
4973
4974 /* Work out the size of the argument. */
4975 num_bytes = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
4976 num_words = (num_bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
4977
4978 /* Decide whether it should go in a floating-point register, assuming
4979 one is free. Later code checks for availability.
4980
4981 The checks against UNITS_PER_FPVALUE handle the soft-float and
4982 single-float cases. */
4983 switch (mips_abi)
4984 {
4985 case ABI_EABI:
4986 /* The EABI conventions have traditionally been defined in terms
4987 of TYPE_MODE, regardless of the actual type. */
4988 info->fpr_p = ((GET_MODE_CLASS (mode) == MODE_FLOAT
4989 || mode == V2SFmode)
4990 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
4991 break;
4992
4993 case ABI_32:
4994 case ABI_O64:
4995 /* Only leading floating-point scalars are passed in
4996 floating-point registers. We also handle vector floats the same
4997 say, which is OK because they are not covered by the standard ABI. */
4998 info->fpr_p = (!cum->gp_reg_found
4999 && cum->arg_number < 2
5000 && (type == 0
5001 || SCALAR_FLOAT_TYPE_P (type)
5002 || VECTOR_FLOAT_TYPE_P (type))
5003 && (GET_MODE_CLASS (mode) == MODE_FLOAT
5004 || mode == V2SFmode)
5005 && GET_MODE_SIZE (mode) <= UNITS_PER_FPVALUE);
5006 break;
5007
5008 case ABI_N32:
5009 case ABI_64:
5010 /* Scalar, complex and vector floating-point types are passed in
5011 floating-point registers, as long as this is a named rather
5012 than a variable argument. */
5013 info->fpr_p = (named
5014 && (type == 0 || FLOAT_TYPE_P (type))
5015 && (GET_MODE_CLASS (mode) == MODE_FLOAT
5016 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
5017 || mode == V2SFmode)
5018 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_FPVALUE);
5019
5020 /* ??? According to the ABI documentation, the real and imaginary
5021 parts of complex floats should be passed in individual registers.
5022 The real and imaginary parts of stack arguments are supposed
5023 to be contiguous and there should be an extra word of padding
5024 at the end.
5025
5026 This has two problems. First, it makes it impossible to use a
5027 single "void *" va_list type, since register and stack arguments
5028 are passed differently. (At the time of writing, MIPSpro cannot
5029 handle complex float varargs correctly.) Second, it's unclear
5030 what should happen when there is only one register free.
5031
5032 For now, we assume that named complex floats should go into FPRs
5033 if there are two FPRs free, otherwise they should be passed in the
5034 same way as a struct containing two floats. */
5035 if (info->fpr_p
5036 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
5037 && GET_MODE_UNIT_SIZE (mode) < UNITS_PER_FPVALUE)
5038 {
5039 if (cum->num_gprs >= MAX_ARGS_IN_REGISTERS - 1)
5040 info->fpr_p = false;
5041 else
5042 num_words = 2;
5043 }
5044 break;
5045
5046 default:
5047 gcc_unreachable ();
5048 }
5049
5050 /* See whether the argument has doubleword alignment. */
5051 doubleword_aligned_p = (mips_function_arg_boundary (mode, type)
5052 > BITS_PER_WORD);
5053
5054 /* Set REG_OFFSET to the register count we're interested in.
5055 The EABI allocates the floating-point registers separately,
5056 but the other ABIs allocate them like integer registers. */
5057 info->reg_offset = (mips_abi == ABI_EABI && info->fpr_p
5058 ? cum->num_fprs
5059 : cum->num_gprs);
5060
5061 /* Advance to an even register if the argument is doubleword-aligned. */
5062 if (doubleword_aligned_p)
5063 info->reg_offset += info->reg_offset & 1;
5064
5065 /* Work out the offset of a stack argument. */
5066 info->stack_offset = cum->stack_words;
5067 if (doubleword_aligned_p)
5068 info->stack_offset += info->stack_offset & 1;
5069
5070 max_regs = MAX_ARGS_IN_REGISTERS - info->reg_offset;
5071
5072 /* Partition the argument between registers and stack. */
5073 info->reg_words = MIN (num_words, max_regs);
5074 info->stack_words = num_words - info->reg_words;
5075 }
5076
5077 /* INFO describes a register argument that has the normal format for the
5078 argument's mode. Return the register it uses, assuming that FPRs are
5079 available if HARD_FLOAT_P. */
5080
5081 static unsigned int
5082 mips_arg_regno (const struct mips_arg_info *info, bool hard_float_p)
5083 {
5084 if (!info->fpr_p || !hard_float_p)
5085 return GP_ARG_FIRST + info->reg_offset;
5086 else if (mips_abi == ABI_32 && TARGET_DOUBLE_FLOAT && info->reg_offset > 0)
5087 /* In o32, the second argument is always passed in $f14
5088 for TARGET_DOUBLE_FLOAT, regardless of whether the
5089 first argument was a word or doubleword. */
5090 return FP_ARG_FIRST + 2;
5091 else
5092 return FP_ARG_FIRST + info->reg_offset;
5093 }
5094
5095 /* Implement TARGET_STRICT_ARGUMENT_NAMING. */
5096
5097 static bool
5098 mips_strict_argument_naming (cumulative_args_t ca ATTRIBUTE_UNUSED)
5099 {
5100 return !TARGET_OLDABI;
5101 }
5102
5103 /* Implement TARGET_FUNCTION_ARG. */
5104
5105 static rtx
5106 mips_function_arg (cumulative_args_t cum_v, enum machine_mode mode,
5107 const_tree type, bool named)
5108 {
5109 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
5110 struct mips_arg_info info;
5111
5112 /* We will be called with a mode of VOIDmode after the last argument
5113 has been seen. Whatever we return will be passed to the call expander.
5114 If we need a MIPS16 fp_code, return a REG with the code stored as
5115 the mode. */
5116 if (mode == VOIDmode)
5117 {
5118 if (TARGET_MIPS16 && cum->fp_code != 0)
5119 return gen_rtx_REG ((enum machine_mode) cum->fp_code, 0);
5120 else
5121 return NULL;
5122 }
5123
5124 mips_get_arg_info (&info, cum, mode, type, named);
5125
5126 /* Return straight away if the whole argument is passed on the stack. */
5127 if (info.reg_offset == MAX_ARGS_IN_REGISTERS)
5128 return NULL;
5129
5130 /* The n32 and n64 ABIs say that if any 64-bit chunk of the structure
5131 contains a double in its entirety, then that 64-bit chunk is passed
5132 in a floating-point register. */
5133 if (TARGET_NEWABI
5134 && TARGET_HARD_FLOAT
5135 && named
5136 && type != 0
5137 && TREE_CODE (type) == RECORD_TYPE
5138 && TYPE_SIZE_UNIT (type)
5139 && host_integerp (TYPE_SIZE_UNIT (type), 1))
5140 {
5141 tree field;
5142
5143 /* First check to see if there is any such field. */
5144 for (field = TYPE_FIELDS (type); field; field = DECL_CHAIN (field))
5145 if (TREE_CODE (field) == FIELD_DECL
5146 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
5147 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD
5148 && host_integerp (bit_position (field), 0)
5149 && int_bit_position (field) % BITS_PER_WORD == 0)
5150 break;
5151
5152 if (field != 0)
5153 {
5154 /* Now handle the special case by returning a PARALLEL
5155 indicating where each 64-bit chunk goes. INFO.REG_WORDS
5156 chunks are passed in registers. */
5157 unsigned int i;
5158 HOST_WIDE_INT bitpos;
5159 rtx ret;
5160
5161 /* assign_parms checks the mode of ENTRY_PARM, so we must
5162 use the actual mode here. */
5163 ret = gen_rtx_PARALLEL (mode, rtvec_alloc (info.reg_words));
5164
5165 bitpos = 0;
5166 field = TYPE_FIELDS (type);
5167 for (i = 0; i < info.reg_words; i++)
5168 {
5169 rtx reg;
5170
5171 for (; field; field = DECL_CHAIN (field))
5172 if (TREE_CODE (field) == FIELD_DECL
5173 && int_bit_position (field) >= bitpos)
5174 break;
5175
5176 if (field
5177 && int_bit_position (field) == bitpos
5178 && SCALAR_FLOAT_TYPE_P (TREE_TYPE (field))
5179 && TYPE_PRECISION (TREE_TYPE (field)) == BITS_PER_WORD)
5180 reg = gen_rtx_REG (DFmode, FP_ARG_FIRST + info.reg_offset + i);
5181 else
5182 reg = gen_rtx_REG (DImode, GP_ARG_FIRST + info.reg_offset + i);
5183
5184 XVECEXP (ret, 0, i)
5185 = gen_rtx_EXPR_LIST (VOIDmode, reg,
5186 GEN_INT (bitpos / BITS_PER_UNIT));
5187
5188 bitpos += BITS_PER_WORD;
5189 }
5190 return ret;
5191 }
5192 }
5193
5194 /* Handle the n32/n64 conventions for passing complex floating-point
5195 arguments in FPR pairs. The real part goes in the lower register
5196 and the imaginary part goes in the upper register. */
5197 if (TARGET_NEWABI
5198 && info.fpr_p
5199 && GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5200 {
5201 rtx real, imag;
5202 enum machine_mode inner;
5203 unsigned int regno;
5204
5205 inner = GET_MODE_INNER (mode);
5206 regno = FP_ARG_FIRST + info.reg_offset;
5207 if (info.reg_words * UNITS_PER_WORD == GET_MODE_SIZE (inner))
5208 {
5209 /* Real part in registers, imaginary part on stack. */
5210 gcc_assert (info.stack_words == info.reg_words);
5211 return gen_rtx_REG (inner, regno);
5212 }
5213 else
5214 {
5215 gcc_assert (info.stack_words == 0);
5216 real = gen_rtx_EXPR_LIST (VOIDmode,
5217 gen_rtx_REG (inner, regno),
5218 const0_rtx);
5219 imag = gen_rtx_EXPR_LIST (VOIDmode,
5220 gen_rtx_REG (inner,
5221 regno + info.reg_words / 2),
5222 GEN_INT (GET_MODE_SIZE (inner)));
5223 return gen_rtx_PARALLEL (mode, gen_rtvec (2, real, imag));
5224 }
5225 }
5226
5227 return gen_rtx_REG (mode, mips_arg_regno (&info, TARGET_HARD_FLOAT));
5228 }
5229
5230 /* Implement TARGET_FUNCTION_ARG_ADVANCE. */
5231
5232 static void
5233 mips_function_arg_advance (cumulative_args_t cum_v, enum machine_mode mode,
5234 const_tree type, bool named)
5235 {
5236 CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
5237 struct mips_arg_info info;
5238
5239 mips_get_arg_info (&info, cum, mode, type, named);
5240
5241 if (!info.fpr_p)
5242 cum->gp_reg_found = true;
5243
5244 /* See the comment above the CUMULATIVE_ARGS structure in mips.h for
5245 an explanation of what this code does. It assumes that we're using
5246 either the o32 or the o64 ABI, both of which pass at most 2 arguments
5247 in FPRs. */
5248 if (cum->arg_number < 2 && info.fpr_p)
5249 cum->fp_code += (mode == SFmode ? 1 : 2) << (cum->arg_number * 2);
5250
5251 /* Advance the register count. This has the effect of setting
5252 num_gprs to MAX_ARGS_IN_REGISTERS if a doubleword-aligned
5253 argument required us to skip the final GPR and pass the whole
5254 argument on the stack. */
5255 if (mips_abi != ABI_EABI || !info.fpr_p)
5256 cum->num_gprs = info.reg_offset + info.reg_words;
5257 else if (info.reg_words > 0)
5258 cum->num_fprs += MAX_FPRS_PER_FMT;
5259
5260 /* Advance the stack word count. */
5261 if (info.stack_words > 0)
5262 cum->stack_words = info.stack_offset + info.stack_words;
5263
5264 cum->arg_number++;
5265 }
5266
5267 /* Implement TARGET_ARG_PARTIAL_BYTES. */
5268
5269 static int
5270 mips_arg_partial_bytes (cumulative_args_t cum,
5271 enum machine_mode mode, tree type, bool named)
5272 {
5273 struct mips_arg_info info;
5274
5275 mips_get_arg_info (&info, get_cumulative_args (cum), mode, type, named);
5276 return info.stack_words > 0 ? info.reg_words * UNITS_PER_WORD : 0;
5277 }
5278
5279 /* Implement TARGET_FUNCTION_ARG_BOUNDARY. Every parameter gets at
5280 least PARM_BOUNDARY bits of alignment, but will be given anything up
5281 to STACK_BOUNDARY bits if the type requires it. */
5282
5283 static unsigned int
5284 mips_function_arg_boundary (enum machine_mode mode, const_tree type)
5285 {
5286 unsigned int alignment;
5287
5288 alignment = type ? TYPE_ALIGN (type) : GET_MODE_ALIGNMENT (mode);
5289 if (alignment < PARM_BOUNDARY)
5290 alignment = PARM_BOUNDARY;
5291 if (alignment > STACK_BOUNDARY)
5292 alignment = STACK_BOUNDARY;
5293 return alignment;
5294 }
5295
5296 /* Return true if FUNCTION_ARG_PADDING (MODE, TYPE) should return
5297 upward rather than downward. In other words, return true if the
5298 first byte of the stack slot has useful data, false if the last
5299 byte does. */
5300
5301 bool
5302 mips_pad_arg_upward (enum machine_mode mode, const_tree type)
5303 {
5304 /* On little-endian targets, the first byte of every stack argument
5305 is passed in the first byte of the stack slot. */
5306 if (!BYTES_BIG_ENDIAN)
5307 return true;
5308
5309 /* Otherwise, integral types are padded downward: the last byte of a
5310 stack argument is passed in the last byte of the stack slot. */
5311 if (type != 0
5312 ? (INTEGRAL_TYPE_P (type)
5313 || POINTER_TYPE_P (type)
5314 || FIXED_POINT_TYPE_P (type))
5315 : (SCALAR_INT_MODE_P (mode)
5316 || ALL_SCALAR_FIXED_POINT_MODE_P (mode)))
5317 return false;
5318
5319 /* Big-endian o64 pads floating-point arguments downward. */
5320 if (mips_abi == ABI_O64)
5321 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
5322 return false;
5323
5324 /* Other types are padded upward for o32, o64, n32 and n64. */
5325 if (mips_abi != ABI_EABI)
5326 return true;
5327
5328 /* Arguments smaller than a stack slot are padded downward. */
5329 if (mode != BLKmode)
5330 return GET_MODE_BITSIZE (mode) >= PARM_BOUNDARY;
5331 else
5332 return int_size_in_bytes (type) >= (PARM_BOUNDARY / BITS_PER_UNIT);
5333 }
5334
5335 /* Likewise BLOCK_REG_PADDING (MODE, TYPE, ...). Return !BYTES_BIG_ENDIAN
5336 if the least significant byte of the register has useful data. Return
5337 the opposite if the most significant byte does. */
5338
5339 bool
5340 mips_pad_reg_upward (enum machine_mode mode, tree type)
5341 {
5342 /* No shifting is required for floating-point arguments. */
5343 if (type != 0 ? FLOAT_TYPE_P (type) : GET_MODE_CLASS (mode) == MODE_FLOAT)
5344 return !BYTES_BIG_ENDIAN;
5345
5346 /* Otherwise, apply the same padding to register arguments as we do
5347 to stack arguments. */
5348 return mips_pad_arg_upward (mode, type);
5349 }
5350
5351 /* Return nonzero when an argument must be passed by reference. */
5352
5353 static bool
5354 mips_pass_by_reference (cumulative_args_t cum ATTRIBUTE_UNUSED,
5355 enum machine_mode mode, const_tree type,
5356 bool named ATTRIBUTE_UNUSED)
5357 {
5358 if (mips_abi == ABI_EABI)
5359 {
5360 int size;
5361
5362 /* ??? How should SCmode be handled? */
5363 if (mode == DImode || mode == DFmode
5364 || mode == DQmode || mode == UDQmode
5365 || mode == DAmode || mode == UDAmode)
5366 return 0;
5367
5368 size = type ? int_size_in_bytes (type) : GET_MODE_SIZE (mode);
5369 return size == -1 || size > UNITS_PER_WORD;
5370 }
5371 else
5372 {
5373 /* If we have a variable-sized parameter, we have no choice. */
5374 return targetm.calls.must_pass_in_stack (mode, type);
5375 }
5376 }
5377
5378 /* Implement TARGET_CALLEE_COPIES. */
5379
5380 static bool
5381 mips_callee_copies (cumulative_args_t cum ATTRIBUTE_UNUSED,
5382 enum machine_mode mode ATTRIBUTE_UNUSED,
5383 const_tree type ATTRIBUTE_UNUSED, bool named)
5384 {
5385 return mips_abi == ABI_EABI && named;
5386 }
5387 \f
5388 /* See whether VALTYPE is a record whose fields should be returned in
5389 floating-point registers. If so, return the number of fields and
5390 list them in FIELDS (which should have two elements). Return 0
5391 otherwise.
5392
5393 For n32 & n64, a structure with one or two fields is returned in
5394 floating-point registers as long as every field has a floating-point
5395 type. */
5396
5397 static int
5398 mips_fpr_return_fields (const_tree valtype, tree *fields)
5399 {
5400 tree field;
5401 int i;
5402
5403 if (!TARGET_NEWABI)
5404 return 0;
5405
5406 if (TREE_CODE (valtype) != RECORD_TYPE)
5407 return 0;
5408
5409 i = 0;
5410 for (field = TYPE_FIELDS (valtype); field != 0; field = DECL_CHAIN (field))
5411 {
5412 if (TREE_CODE (field) != FIELD_DECL)
5413 continue;
5414
5415 if (!SCALAR_FLOAT_TYPE_P (TREE_TYPE (field)))
5416 return 0;
5417
5418 if (i == 2)
5419 return 0;
5420
5421 fields[i++] = field;
5422 }
5423 return i;
5424 }
5425
5426 /* Implement TARGET_RETURN_IN_MSB. For n32 & n64, we should return
5427 a value in the most significant part of $2/$3 if:
5428
5429 - the target is big-endian;
5430
5431 - the value has a structure or union type (we generalize this to
5432 cover aggregates from other languages too); and
5433
5434 - the structure is not returned in floating-point registers. */
5435
5436 static bool
5437 mips_return_in_msb (const_tree valtype)
5438 {
5439 tree fields[2];
5440
5441 return (TARGET_NEWABI
5442 && TARGET_BIG_ENDIAN
5443 && AGGREGATE_TYPE_P (valtype)
5444 && mips_fpr_return_fields (valtype, fields) == 0);
5445 }
5446
5447 /* Return true if the function return value MODE will get returned in a
5448 floating-point register. */
5449
5450 static bool
5451 mips_return_mode_in_fpr_p (enum machine_mode mode)
5452 {
5453 return ((GET_MODE_CLASS (mode) == MODE_FLOAT
5454 || mode == V2SFmode
5455 || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5456 && GET_MODE_UNIT_SIZE (mode) <= UNITS_PER_HWFPVALUE);
5457 }
5458
5459 /* Return the representation of an FPR return register when the
5460 value being returned in FP_RETURN has mode VALUE_MODE and the
5461 return type itself has mode TYPE_MODE. On NewABI targets,
5462 the two modes may be different for structures like:
5463
5464 struct __attribute__((packed)) foo { float f; }
5465
5466 where we return the SFmode value of "f" in FP_RETURN, but where
5467 the structure itself has mode BLKmode. */
5468
5469 static rtx
5470 mips_return_fpr_single (enum machine_mode type_mode,
5471 enum machine_mode value_mode)
5472 {
5473 rtx x;
5474
5475 x = gen_rtx_REG (value_mode, FP_RETURN);
5476 if (type_mode != value_mode)
5477 {
5478 x = gen_rtx_EXPR_LIST (VOIDmode, x, const0_rtx);
5479 x = gen_rtx_PARALLEL (type_mode, gen_rtvec (1, x));
5480 }
5481 return x;
5482 }
5483
5484 /* Return a composite value in a pair of floating-point registers.
5485 MODE1 and OFFSET1 are the mode and byte offset for the first value,
5486 likewise MODE2 and OFFSET2 for the second. MODE is the mode of the
5487 complete value.
5488
5489 For n32 & n64, $f0 always holds the first value and $f2 the second.
5490 Otherwise the values are packed together as closely as possible. */
5491
5492 static rtx
5493 mips_return_fpr_pair (enum machine_mode mode,
5494 enum machine_mode mode1, HOST_WIDE_INT offset1,
5495 enum machine_mode mode2, HOST_WIDE_INT offset2)
5496 {
5497 int inc;
5498
5499 inc = (TARGET_NEWABI ? 2 : MAX_FPRS_PER_FMT);
5500 return gen_rtx_PARALLEL
5501 (mode,
5502 gen_rtvec (2,
5503 gen_rtx_EXPR_LIST (VOIDmode,
5504 gen_rtx_REG (mode1, FP_RETURN),
5505 GEN_INT (offset1)),
5506 gen_rtx_EXPR_LIST (VOIDmode,
5507 gen_rtx_REG (mode2, FP_RETURN + inc),
5508 GEN_INT (offset2))));
5509
5510 }
5511
5512 /* Implement TARGET_FUNCTION_VALUE and TARGET_LIBCALL_VALUE.
5513 For normal calls, VALTYPE is the return type and MODE is VOIDmode.
5514 For libcalls, VALTYPE is null and MODE is the mode of the return value. */
5515
5516 static rtx
5517 mips_function_value_1 (const_tree valtype, const_tree fn_decl_or_type,
5518 enum machine_mode mode)
5519 {
5520 if (valtype)
5521 {
5522 tree fields[2];
5523 int unsigned_p;
5524 const_tree func;
5525
5526 if (fn_decl_or_type && DECL_P (fn_decl_or_type))
5527 func = fn_decl_or_type;
5528 else
5529 func = NULL;
5530
5531 mode = TYPE_MODE (valtype);
5532 unsigned_p = TYPE_UNSIGNED (valtype);
5533
5534 /* Since TARGET_PROMOTE_FUNCTION_MODE unconditionally promotes,
5535 return values, promote the mode here too. */
5536 mode = promote_function_mode (valtype, mode, &unsigned_p, func, 1);
5537
5538 /* Handle structures whose fields are returned in $f0/$f2. */
5539 switch (mips_fpr_return_fields (valtype, fields))
5540 {
5541 case 1:
5542 return mips_return_fpr_single (mode,
5543 TYPE_MODE (TREE_TYPE (fields[0])));
5544
5545 case 2:
5546 return mips_return_fpr_pair (mode,
5547 TYPE_MODE (TREE_TYPE (fields[0])),
5548 int_byte_position (fields[0]),
5549 TYPE_MODE (TREE_TYPE (fields[1])),
5550 int_byte_position (fields[1]));
5551 }
5552
5553 /* If a value is passed in the most significant part of a register, see
5554 whether we have to round the mode up to a whole number of words. */
5555 if (mips_return_in_msb (valtype))
5556 {
5557 HOST_WIDE_INT size = int_size_in_bytes (valtype);
5558 if (size % UNITS_PER_WORD != 0)
5559 {
5560 size += UNITS_PER_WORD - size % UNITS_PER_WORD;
5561 mode = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0);
5562 }
5563 }
5564
5565 /* For EABI, the class of return register depends entirely on MODE.
5566 For example, "struct { some_type x; }" and "union { some_type x; }"
5567 are returned in the same way as a bare "some_type" would be.
5568 Other ABIs only use FPRs for scalar, complex or vector types. */
5569 if (mips_abi != ABI_EABI && !FLOAT_TYPE_P (valtype))
5570 return gen_rtx_REG (mode, GP_RETURN);
5571 }
5572
5573 if (!TARGET_MIPS16)
5574 {
5575 /* Handle long doubles for n32 & n64. */
5576 if (mode == TFmode)
5577 return mips_return_fpr_pair (mode,
5578 DImode, 0,
5579 DImode, GET_MODE_SIZE (mode) / 2);
5580
5581 if (mips_return_mode_in_fpr_p (mode))
5582 {
5583 if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
5584 return mips_return_fpr_pair (mode,
5585 GET_MODE_INNER (mode), 0,
5586 GET_MODE_INNER (mode),
5587 GET_MODE_SIZE (mode) / 2);
5588 else
5589 return gen_rtx_REG (mode, FP_RETURN);
5590 }
5591 }
5592
5593 return gen_rtx_REG (mode, GP_RETURN);
5594 }
5595
5596 /* Implement TARGET_FUNCTION_VALUE. */
5597
5598 static rtx
5599 mips_function_value (const_tree valtype, const_tree fn_decl_or_type,
5600 bool outgoing ATTRIBUTE_UNUSED)
5601 {
5602 return mips_function_value_1 (valtype, fn_decl_or_type, VOIDmode);
5603 }
5604
5605 /* Implement TARGET_LIBCALL_VALUE. */
5606
5607 static rtx
5608 mips_libcall_value (enum machine_mode mode, const_rtx fun ATTRIBUTE_UNUSED)
5609 {
5610 return mips_function_value_1 (NULL_TREE, NULL_TREE, mode);
5611 }
5612
5613 /* Implement TARGET_FUNCTION_VALUE_REGNO_P.
5614
5615 On the MIPS, R2 R3 and F0 F2 are the only register thus used.
5616 Currently, R2 and F0 are only implemented here (C has no complex type). */
5617
5618 static bool
5619 mips_function_value_regno_p (const unsigned int regno)
5620 {
5621 if (regno == GP_RETURN
5622 || regno == FP_RETURN
5623 || (LONG_DOUBLE_TYPE_SIZE == 128
5624 && FP_RETURN != GP_RETURN
5625 && regno == FP_RETURN + 2))
5626 return true;
5627
5628 return false;
5629 }
5630
5631 /* Implement TARGET_RETURN_IN_MEMORY. Under the o32 and o64 ABIs,
5632 all BLKmode objects are returned in memory. Under the n32, n64
5633 and embedded ABIs, small structures are returned in a register.
5634 Objects with varying size must still be returned in memory, of
5635 course. */
5636
5637 static bool
5638 mips_return_in_memory (const_tree type, const_tree fndecl ATTRIBUTE_UNUSED)
5639 {
5640 return (TARGET_OLDABI
5641 ? TYPE_MODE (type) == BLKmode
5642 : !IN_RANGE (int_size_in_bytes (type), 0, 2 * UNITS_PER_WORD));
5643 }
5644 \f
5645 /* Implement TARGET_SETUP_INCOMING_VARARGS. */
5646
5647 static void
5648 mips_setup_incoming_varargs (cumulative_args_t cum, enum machine_mode mode,
5649 tree type, int *pretend_size ATTRIBUTE_UNUSED,
5650 int no_rtl)
5651 {
5652 CUMULATIVE_ARGS local_cum;
5653 int gp_saved, fp_saved;
5654
5655 /* The caller has advanced CUM up to, but not beyond, the last named
5656 argument. Advance a local copy of CUM past the last "real" named
5657 argument, to find out how many registers are left over. */
5658 local_cum = *get_cumulative_args (cum);
5659 mips_function_arg_advance (pack_cumulative_args (&local_cum), mode, type,
5660 true);
5661
5662 /* Found out how many registers we need to save. */
5663 gp_saved = MAX_ARGS_IN_REGISTERS - local_cum.num_gprs;
5664 fp_saved = (EABI_FLOAT_VARARGS_P
5665 ? MAX_ARGS_IN_REGISTERS - local_cum.num_fprs
5666 : 0);
5667
5668 if (!no_rtl)
5669 {
5670 if (gp_saved > 0)
5671 {
5672 rtx ptr, mem;
5673
5674 ptr = plus_constant (Pmode, virtual_incoming_args_rtx,
5675 REG_PARM_STACK_SPACE (cfun->decl)
5676 - gp_saved * UNITS_PER_WORD);
5677 mem = gen_frame_mem (BLKmode, ptr);
5678 set_mem_alias_set (mem, get_varargs_alias_set ());
5679
5680 move_block_from_reg (local_cum.num_gprs + GP_ARG_FIRST,
5681 mem, gp_saved);
5682 }
5683 if (fp_saved > 0)
5684 {
5685 /* We can't use move_block_from_reg, because it will use
5686 the wrong mode. */
5687 enum machine_mode mode;
5688 int off, i;
5689
5690 /* Set OFF to the offset from virtual_incoming_args_rtx of
5691 the first float register. The FP save area lies below
5692 the integer one, and is aligned to UNITS_PER_FPVALUE bytes. */
5693 off = (-gp_saved * UNITS_PER_WORD) & -UNITS_PER_FPVALUE;
5694 off -= fp_saved * UNITS_PER_FPREG;
5695
5696 mode = TARGET_SINGLE_FLOAT ? SFmode : DFmode;
5697
5698 for (i = local_cum.num_fprs; i < MAX_ARGS_IN_REGISTERS;
5699 i += MAX_FPRS_PER_FMT)
5700 {
5701 rtx ptr, mem;
5702
5703 ptr = plus_constant (Pmode, virtual_incoming_args_rtx, off);
5704 mem = gen_frame_mem (mode, ptr);
5705 set_mem_alias_set (mem, get_varargs_alias_set ());
5706 mips_emit_move (mem, gen_rtx_REG (mode, FP_ARG_FIRST + i));
5707 off += UNITS_PER_HWFPVALUE;
5708 }
5709 }
5710 }
5711 if (REG_PARM_STACK_SPACE (cfun->decl) == 0)
5712 cfun->machine->varargs_size = (gp_saved * UNITS_PER_WORD
5713 + fp_saved * UNITS_PER_FPREG);
5714 }
5715
5716 /* Implement TARGET_BUILTIN_VA_LIST. */
5717
5718 static tree
5719 mips_build_builtin_va_list (void)
5720 {
5721 if (EABI_FLOAT_VARARGS_P)
5722 {
5723 /* We keep 3 pointers, and two offsets.
5724
5725 Two pointers are to the overflow area, which starts at the CFA.
5726 One of these is constant, for addressing into the GPR save area
5727 below it. The other is advanced up the stack through the
5728 overflow region.
5729
5730 The third pointer is to the bottom of the GPR save area.
5731 Since the FPR save area is just below it, we can address
5732 FPR slots off this pointer.
5733
5734 We also keep two one-byte offsets, which are to be subtracted
5735 from the constant pointers to yield addresses in the GPR and
5736 FPR save areas. These are downcounted as float or non-float
5737 arguments are used, and when they get to zero, the argument
5738 must be obtained from the overflow region. */
5739 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff, f_res, record;
5740 tree array, index;
5741
5742 record = lang_hooks.types.make_type (RECORD_TYPE);
5743
5744 f_ovfl = build_decl (BUILTINS_LOCATION,
5745 FIELD_DECL, get_identifier ("__overflow_argptr"),
5746 ptr_type_node);
5747 f_gtop = build_decl (BUILTINS_LOCATION,
5748 FIELD_DECL, get_identifier ("__gpr_top"),
5749 ptr_type_node);
5750 f_ftop = build_decl (BUILTINS_LOCATION,
5751 FIELD_DECL, get_identifier ("__fpr_top"),
5752 ptr_type_node);
5753 f_goff = build_decl (BUILTINS_LOCATION,
5754 FIELD_DECL, get_identifier ("__gpr_offset"),
5755 unsigned_char_type_node);
5756 f_foff = build_decl (BUILTINS_LOCATION,
5757 FIELD_DECL, get_identifier ("__fpr_offset"),
5758 unsigned_char_type_node);
5759 /* Explicitly pad to the size of a pointer, so that -Wpadded won't
5760 warn on every user file. */
5761 index = build_int_cst (NULL_TREE, GET_MODE_SIZE (ptr_mode) - 2 - 1);
5762 array = build_array_type (unsigned_char_type_node,
5763 build_index_type (index));
5764 f_res = build_decl (BUILTINS_LOCATION,
5765 FIELD_DECL, get_identifier ("__reserved"), array);
5766
5767 DECL_FIELD_CONTEXT (f_ovfl) = record;
5768 DECL_FIELD_CONTEXT (f_gtop) = record;
5769 DECL_FIELD_CONTEXT (f_ftop) = record;
5770 DECL_FIELD_CONTEXT (f_goff) = record;
5771 DECL_FIELD_CONTEXT (f_foff) = record;
5772 DECL_FIELD_CONTEXT (f_res) = record;
5773
5774 TYPE_FIELDS (record) = f_ovfl;
5775 DECL_CHAIN (f_ovfl) = f_gtop;
5776 DECL_CHAIN (f_gtop) = f_ftop;
5777 DECL_CHAIN (f_ftop) = f_goff;
5778 DECL_CHAIN (f_goff) = f_foff;
5779 DECL_CHAIN (f_foff) = f_res;
5780
5781 layout_type (record);
5782 return record;
5783 }
5784 else
5785 /* Otherwise, we use 'void *'. */
5786 return ptr_type_node;
5787 }
5788
5789 /* Implement TARGET_EXPAND_BUILTIN_VA_START. */
5790
5791 static void
5792 mips_va_start (tree valist, rtx nextarg)
5793 {
5794 if (EABI_FLOAT_VARARGS_P)
5795 {
5796 const CUMULATIVE_ARGS *cum;
5797 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
5798 tree ovfl, gtop, ftop, goff, foff;
5799 tree t;
5800 int gpr_save_area_size;
5801 int fpr_save_area_size;
5802 int fpr_offset;
5803
5804 cum = &crtl->args.info;
5805 gpr_save_area_size
5806 = (MAX_ARGS_IN_REGISTERS - cum->num_gprs) * UNITS_PER_WORD;
5807 fpr_save_area_size
5808 = (MAX_ARGS_IN_REGISTERS - cum->num_fprs) * UNITS_PER_FPREG;
5809
5810 f_ovfl = TYPE_FIELDS (va_list_type_node);
5811 f_gtop = DECL_CHAIN (f_ovfl);
5812 f_ftop = DECL_CHAIN (f_gtop);
5813 f_goff = DECL_CHAIN (f_ftop);
5814 f_foff = DECL_CHAIN (f_goff);
5815
5816 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
5817 NULL_TREE);
5818 gtop = build3 (COMPONENT_REF, TREE_TYPE (f_gtop), valist, f_gtop,
5819 NULL_TREE);
5820 ftop = build3 (COMPONENT_REF, TREE_TYPE (f_ftop), valist, f_ftop,
5821 NULL_TREE);
5822 goff = build3 (COMPONENT_REF, TREE_TYPE (f_goff), valist, f_goff,
5823 NULL_TREE);
5824 foff = build3 (COMPONENT_REF, TREE_TYPE (f_foff), valist, f_foff,
5825 NULL_TREE);
5826
5827 /* Emit code to initialize OVFL, which points to the next varargs
5828 stack argument. CUM->STACK_WORDS gives the number of stack
5829 words used by named arguments. */
5830 t = make_tree (TREE_TYPE (ovfl), virtual_incoming_args_rtx);
5831 if (cum->stack_words > 0)
5832 t = fold_build_pointer_plus_hwi (t, cum->stack_words * UNITS_PER_WORD);
5833 t = build2 (MODIFY_EXPR, TREE_TYPE (ovfl), ovfl, t);
5834 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5835
5836 /* Emit code to initialize GTOP, the top of the GPR save area. */
5837 t = make_tree (TREE_TYPE (gtop), virtual_incoming_args_rtx);
5838 t = build2 (MODIFY_EXPR, TREE_TYPE (gtop), gtop, t);
5839 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5840
5841 /* Emit code to initialize FTOP, the top of the FPR save area.
5842 This address is gpr_save_area_bytes below GTOP, rounded
5843 down to the next fp-aligned boundary. */
5844 t = make_tree (TREE_TYPE (ftop), virtual_incoming_args_rtx);
5845 fpr_offset = gpr_save_area_size + UNITS_PER_FPVALUE - 1;
5846 fpr_offset &= -UNITS_PER_FPVALUE;
5847 if (fpr_offset)
5848 t = fold_build_pointer_plus_hwi (t, -fpr_offset);
5849 t = build2 (MODIFY_EXPR, TREE_TYPE (ftop), ftop, t);
5850 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5851
5852 /* Emit code to initialize GOFF, the offset from GTOP of the
5853 next GPR argument. */
5854 t = build2 (MODIFY_EXPR, TREE_TYPE (goff), goff,
5855 build_int_cst (TREE_TYPE (goff), gpr_save_area_size));
5856 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5857
5858 /* Likewise emit code to initialize FOFF, the offset from FTOP
5859 of the next FPR argument. */
5860 t = build2 (MODIFY_EXPR, TREE_TYPE (foff), foff,
5861 build_int_cst (TREE_TYPE (foff), fpr_save_area_size));
5862 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
5863 }
5864 else
5865 {
5866 nextarg = plus_constant (Pmode, nextarg, -cfun->machine->varargs_size);
5867 std_expand_builtin_va_start (valist, nextarg);
5868 }
5869 }
5870
5871 /* Like std_gimplify_va_arg_expr, but apply alignment to zero-sized
5872 types as well. */
5873
5874 static tree
5875 mips_std_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p,
5876 gimple_seq *post_p)
5877 {
5878 tree addr, t, type_size, rounded_size, valist_tmp;
5879 unsigned HOST_WIDE_INT align, boundary;
5880 bool indirect;
5881
5882 indirect = pass_by_reference (NULL, TYPE_MODE (type), type, false);
5883 if (indirect)
5884 type = build_pointer_type (type);
5885
5886 align = PARM_BOUNDARY / BITS_PER_UNIT;
5887 boundary = targetm.calls.function_arg_boundary (TYPE_MODE (type), type);
5888
5889 /* When we align parameter on stack for caller, if the parameter
5890 alignment is beyond MAX_SUPPORTED_STACK_ALIGNMENT, it will be
5891 aligned at MAX_SUPPORTED_STACK_ALIGNMENT. We will match callee
5892 here with caller. */
5893 if (boundary > MAX_SUPPORTED_STACK_ALIGNMENT)
5894 boundary = MAX_SUPPORTED_STACK_ALIGNMENT;
5895
5896 boundary /= BITS_PER_UNIT;
5897
5898 /* Hoist the valist value into a temporary for the moment. */
5899 valist_tmp = get_initialized_tmp_var (valist, pre_p, NULL);
5900
5901 /* va_list pointer is aligned to PARM_BOUNDARY. If argument actually
5902 requires greater alignment, we must perform dynamic alignment. */
5903 if (boundary > align)
5904 {
5905 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist_tmp,
5906 fold_build_pointer_plus_hwi (valist_tmp, boundary - 1));
5907 gimplify_and_add (t, pre_p);
5908
5909 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist_tmp,
5910 fold_build2 (BIT_AND_EXPR, TREE_TYPE (valist),
5911 valist_tmp,
5912 build_int_cst (TREE_TYPE (valist), -boundary)));
5913 gimplify_and_add (t, pre_p);
5914 }
5915 else
5916 boundary = align;
5917
5918 /* If the actual alignment is less than the alignment of the type,
5919 adjust the type accordingly so that we don't assume strict alignment
5920 when dereferencing the pointer. */
5921 boundary *= BITS_PER_UNIT;
5922 if (boundary < TYPE_ALIGN (type))
5923 {
5924 type = build_variant_type_copy (type);
5925 TYPE_ALIGN (type) = boundary;
5926 }
5927
5928 /* Compute the rounded size of the type. */
5929 type_size = size_in_bytes (type);
5930 rounded_size = round_up (type_size, align);
5931
5932 /* Reduce rounded_size so it's sharable with the postqueue. */
5933 gimplify_expr (&rounded_size, pre_p, post_p, is_gimple_val, fb_rvalue);
5934
5935 /* Get AP. */
5936 addr = valist_tmp;
5937 if (PAD_VARARGS_DOWN && !integer_zerop (rounded_size))
5938 {
5939 /* Small args are padded downward. */
5940 t = fold_build2_loc (input_location, GT_EXPR, sizetype,
5941 rounded_size, size_int (align));
5942 t = fold_build3 (COND_EXPR, sizetype, t, size_zero_node,
5943 size_binop (MINUS_EXPR, rounded_size, type_size));
5944 addr = fold_build_pointer_plus (addr, t);
5945 }
5946
5947 /* Compute new value for AP. */
5948 t = fold_build_pointer_plus (valist_tmp, rounded_size);
5949 t = build2 (MODIFY_EXPR, TREE_TYPE (valist), valist, t);
5950 gimplify_and_add (t, pre_p);
5951
5952 addr = fold_convert (build_pointer_type (type), addr);
5953
5954 if (indirect)
5955 addr = build_va_arg_indirect_ref (addr);
5956
5957 return build_va_arg_indirect_ref (addr);
5958 }
5959
5960 /* Implement TARGET_GIMPLIFY_VA_ARG_EXPR. */
5961
5962 static tree
5963 mips_gimplify_va_arg_expr (tree valist, tree type, gimple_seq *pre_p,
5964 gimple_seq *post_p)
5965 {
5966 tree addr;
5967 bool indirect_p;
5968
5969 indirect_p = pass_by_reference (NULL, TYPE_MODE (type), type, 0);
5970 if (indirect_p)
5971 type = build_pointer_type (type);
5972
5973 if (!EABI_FLOAT_VARARGS_P)
5974 addr = mips_std_gimplify_va_arg_expr (valist, type, pre_p, post_p);
5975 else
5976 {
5977 tree f_ovfl, f_gtop, f_ftop, f_goff, f_foff;
5978 tree ovfl, top, off, align;
5979 HOST_WIDE_INT size, rsize, osize;
5980 tree t, u;
5981
5982 f_ovfl = TYPE_FIELDS (va_list_type_node);
5983 f_gtop = DECL_CHAIN (f_ovfl);
5984 f_ftop = DECL_CHAIN (f_gtop);
5985 f_goff = DECL_CHAIN (f_ftop);
5986 f_foff = DECL_CHAIN (f_goff);
5987
5988 /* Let:
5989
5990 TOP be the top of the GPR or FPR save area;
5991 OFF be the offset from TOP of the next register;
5992 ADDR_RTX be the address of the argument;
5993 SIZE be the number of bytes in the argument type;
5994 RSIZE be the number of bytes used to store the argument
5995 when it's in the register save area; and
5996 OSIZE be the number of bytes used to store it when it's
5997 in the stack overflow area.
5998
5999 The code we want is:
6000
6001 1: off &= -rsize; // round down
6002 2: if (off != 0)
6003 3: {
6004 4: addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0);
6005 5: off -= rsize;
6006 6: }
6007 7: else
6008 8: {
6009 9: ovfl = ((intptr_t) ovfl + osize - 1) & -osize;
6010 10: addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0);
6011 11: ovfl += osize;
6012 14: }
6013
6014 [1] and [9] can sometimes be optimized away. */
6015
6016 ovfl = build3 (COMPONENT_REF, TREE_TYPE (f_ovfl), valist, f_ovfl,
6017 NULL_TREE);
6018 size = int_size_in_bytes (type);
6019
6020 if (GET_MODE_CLASS (TYPE_MODE (type)) == MODE_FLOAT
6021 && GET_MODE_SIZE (TYPE_MODE (type)) <= UNITS_PER_FPVALUE)
6022 {
6023 top = build3 (COMPONENT_REF, TREE_TYPE (f_ftop),
6024 unshare_expr (valist), f_ftop, NULL_TREE);
6025 off = build3 (COMPONENT_REF, TREE_TYPE (f_foff),
6026 unshare_expr (valist), f_foff, NULL_TREE);
6027
6028 /* When va_start saves FPR arguments to the stack, each slot
6029 takes up UNITS_PER_HWFPVALUE bytes, regardless of the
6030 argument's precision. */
6031 rsize = UNITS_PER_HWFPVALUE;
6032
6033 /* Overflow arguments are padded to UNITS_PER_WORD bytes
6034 (= PARM_BOUNDARY bits). This can be different from RSIZE
6035 in two cases:
6036
6037 (1) On 32-bit targets when TYPE is a structure such as:
6038
6039 struct s { float f; };
6040
6041 Such structures are passed in paired FPRs, so RSIZE
6042 will be 8 bytes. However, the structure only takes
6043 up 4 bytes of memory, so OSIZE will only be 4.
6044
6045 (2) In combinations such as -mgp64 -msingle-float
6046 -fshort-double. Doubles passed in registers will then take
6047 up 4 (UNITS_PER_HWFPVALUE) bytes, but those passed on the
6048 stack take up UNITS_PER_WORD bytes. */
6049 osize = MAX (GET_MODE_SIZE (TYPE_MODE (type)), UNITS_PER_WORD);
6050 }
6051 else
6052 {
6053 top = build3 (COMPONENT_REF, TREE_TYPE (f_gtop),
6054 unshare_expr (valist), f_gtop, NULL_TREE);
6055 off = build3 (COMPONENT_REF, TREE_TYPE (f_goff),
6056 unshare_expr (valist), f_goff, NULL_TREE);
6057 rsize = (size + UNITS_PER_WORD - 1) & -UNITS_PER_WORD;
6058 if (rsize > UNITS_PER_WORD)
6059 {
6060 /* [1] Emit code for: off &= -rsize. */
6061 t = build2 (BIT_AND_EXPR, TREE_TYPE (off), unshare_expr (off),
6062 build_int_cst (TREE_TYPE (off), -rsize));
6063 gimplify_assign (unshare_expr (off), t, pre_p);
6064 }
6065 osize = rsize;
6066 }
6067
6068 /* [2] Emit code to branch if off == 0. */
6069 t = build2 (NE_EXPR, boolean_type_node, unshare_expr (off),
6070 build_int_cst (TREE_TYPE (off), 0));
6071 addr = build3 (COND_EXPR, ptr_type_node, t, NULL_TREE, NULL_TREE);
6072
6073 /* [5] Emit code for: off -= rsize. We do this as a form of
6074 post-decrement not available to C. */
6075 t = fold_convert (TREE_TYPE (off), build_int_cst (NULL_TREE, rsize));
6076 t = build2 (POSTDECREMENT_EXPR, TREE_TYPE (off), off, t);
6077
6078 /* [4] Emit code for:
6079 addr_rtx = top - off + (BYTES_BIG_ENDIAN ? RSIZE - SIZE : 0). */
6080 t = fold_convert (sizetype, t);
6081 t = fold_build1 (NEGATE_EXPR, sizetype, t);
6082 t = fold_build_pointer_plus (top, t);
6083 if (BYTES_BIG_ENDIAN && rsize > size)
6084 t = fold_build_pointer_plus_hwi (t, rsize - size);
6085 COND_EXPR_THEN (addr) = t;
6086
6087 if (osize > UNITS_PER_WORD)
6088 {
6089 /* [9] Emit: ovfl = ((intptr_t) ovfl + osize - 1) & -osize. */
6090 t = fold_build_pointer_plus_hwi (unshare_expr (ovfl), osize - 1);
6091 u = build_int_cst (TREE_TYPE (t), -osize);
6092 t = build2 (BIT_AND_EXPR, TREE_TYPE (t), t, u);
6093 align = build2 (MODIFY_EXPR, TREE_TYPE (ovfl),
6094 unshare_expr (ovfl), t);
6095 }
6096 else
6097 align = NULL;
6098
6099 /* [10, 11] Emit code for:
6100 addr_rtx = ovfl + (BYTES_BIG_ENDIAN ? OSIZE - SIZE : 0)
6101 ovfl += osize. */
6102 u = fold_convert (TREE_TYPE (ovfl), build_int_cst (NULL_TREE, osize));
6103 t = build2 (POSTINCREMENT_EXPR, TREE_TYPE (ovfl), ovfl, u);
6104 if (BYTES_BIG_ENDIAN && osize > size)
6105 t = fold_build_pointer_plus_hwi (t, osize - size);
6106
6107 /* String [9] and [10, 11] together. */
6108 if (align)
6109 t = build2 (COMPOUND_EXPR, TREE_TYPE (t), align, t);
6110 COND_EXPR_ELSE (addr) = t;
6111
6112 addr = fold_convert (build_pointer_type (type), addr);
6113 addr = build_va_arg_indirect_ref (addr);
6114 }
6115
6116 if (indirect_p)
6117 addr = build_va_arg_indirect_ref (addr);
6118
6119 return addr;
6120 }
6121 \f
6122 /* Declare a unique, locally-binding function called NAME, then start
6123 its definition. */
6124
6125 static void
6126 mips_start_unique_function (const char *name)
6127 {
6128 tree decl;
6129
6130 decl = build_decl (BUILTINS_LOCATION, FUNCTION_DECL,
6131 get_identifier (name),
6132 build_function_type_list (void_type_node, NULL_TREE));
6133 DECL_RESULT (decl) = build_decl (BUILTINS_LOCATION, RESULT_DECL,
6134 NULL_TREE, void_type_node);
6135 TREE_PUBLIC (decl) = 1;
6136 TREE_STATIC (decl) = 1;
6137
6138 DECL_COMDAT_GROUP (decl) = DECL_ASSEMBLER_NAME (decl);
6139
6140 targetm.asm_out.unique_section (decl, 0);
6141 switch_to_section (get_named_section (decl, NULL, 0));
6142
6143 targetm.asm_out.globalize_label (asm_out_file, name);
6144 fputs ("\t.hidden\t", asm_out_file);
6145 assemble_name (asm_out_file, name);
6146 putc ('\n', asm_out_file);
6147 }
6148
6149 /* Start a definition of function NAME. MIPS16_P indicates whether the
6150 function contains MIPS16 code. */
6151
6152 static void
6153 mips_start_function_definition (const char *name, bool mips16_p)
6154 {
6155 if (mips16_p)
6156 fprintf (asm_out_file, "\t.set\tmips16\n");
6157 else
6158 fprintf (asm_out_file, "\t.set\tnomips16\n");
6159
6160 if (TARGET_MICROMIPS)
6161 fprintf (asm_out_file, "\t.set\tmicromips\n");
6162 #ifdef HAVE_GAS_MICROMIPS
6163 else
6164 fprintf (asm_out_file, "\t.set\tnomicromips\n");
6165 #endif
6166
6167 if (!flag_inhibit_size_directive)
6168 {
6169 fputs ("\t.ent\t", asm_out_file);
6170 assemble_name (asm_out_file, name);
6171 fputs ("\n", asm_out_file);
6172 }
6173
6174 ASM_OUTPUT_TYPE_DIRECTIVE (asm_out_file, name, "function");
6175
6176 /* Start the definition proper. */
6177 assemble_name (asm_out_file, name);
6178 fputs (":\n", asm_out_file);
6179 }
6180
6181 /* End a function definition started by mips_start_function_definition. */
6182
6183 static void
6184 mips_end_function_definition (const char *name)
6185 {
6186 if (!flag_inhibit_size_directive)
6187 {
6188 fputs ("\t.end\t", asm_out_file);
6189 assemble_name (asm_out_file, name);
6190 fputs ("\n", asm_out_file);
6191 }
6192 }
6193 \f
6194 /* Output a definition of the __mips16_rdhwr function. */
6195
6196 static void
6197 mips_output_mips16_rdhwr (void)
6198 {
6199 const char *name;
6200
6201 name = "__mips16_rdhwr";
6202 mips_start_unique_function (name);
6203 mips_start_function_definition (name, false);
6204 fprintf (asm_out_file,
6205 "\t.set\tpush\n"
6206 "\t.set\tmips32r2\n"
6207 "\t.set\tnoreorder\n"
6208 "\trdhwr\t$3,$29\n"
6209 "\t.set\tpop\n"
6210 "\tj\t$31\n");
6211 mips_end_function_definition (name);
6212 }
6213 \f
6214 /* Return true if calls to X can use R_MIPS_CALL* relocations. */
6215
6216 static bool
6217 mips_ok_for_lazy_binding_p (rtx x)
6218 {
6219 return (TARGET_USE_GOT
6220 && GET_CODE (x) == SYMBOL_REF
6221 && !SYMBOL_REF_BIND_NOW_P (x)
6222 && !mips_symbol_binds_local_p (x));
6223 }
6224
6225 /* Load function address ADDR into register DEST. TYPE is as for
6226 mips_expand_call. Return true if we used an explicit lazy-binding
6227 sequence. */
6228
6229 static bool
6230 mips_load_call_address (enum mips_call_type type, rtx dest, rtx addr)
6231 {
6232 /* If we're generating PIC, and this call is to a global function,
6233 try to allow its address to be resolved lazily. This isn't
6234 possible for sibcalls when $gp is call-saved because the value
6235 of $gp on entry to the stub would be our caller's gp, not ours. */
6236 if (TARGET_EXPLICIT_RELOCS
6237 && !(type == MIPS_CALL_SIBCALL && TARGET_CALL_SAVED_GP)
6238 && mips_ok_for_lazy_binding_p (addr))
6239 {
6240 addr = mips_got_load (dest, addr, SYMBOL_GOTOFF_CALL);
6241 emit_insn (gen_rtx_SET (VOIDmode, dest, addr));
6242 return true;
6243 }
6244 else
6245 {
6246 mips_emit_move (dest, addr);
6247 return false;
6248 }
6249 }
6250 \f
6251 /* Each locally-defined hard-float MIPS16 function has a local symbol
6252 associated with it. This hash table maps the function symbol (FUNC)
6253 to the local symbol (LOCAL). */
6254 struct GTY(()) mips16_local_alias {
6255 rtx func;
6256 rtx local;
6257 };
6258 static GTY ((param_is (struct mips16_local_alias))) htab_t mips16_local_aliases;
6259
6260 /* Hash table callbacks for mips16_local_aliases. */
6261
6262 static hashval_t
6263 mips16_local_aliases_hash (const void *entry)
6264 {
6265 const struct mips16_local_alias *alias;
6266
6267 alias = (const struct mips16_local_alias *) entry;
6268 return htab_hash_string (XSTR (alias->func, 0));
6269 }
6270
6271 static int
6272 mips16_local_aliases_eq (const void *entry1, const void *entry2)
6273 {
6274 const struct mips16_local_alias *alias1, *alias2;
6275
6276 alias1 = (const struct mips16_local_alias *) entry1;
6277 alias2 = (const struct mips16_local_alias *) entry2;
6278 return rtx_equal_p (alias1->func, alias2->func);
6279 }
6280
6281 /* FUNC is the symbol for a locally-defined hard-float MIPS16 function.
6282 Return a local alias for it, creating a new one if necessary. */
6283
6284 static rtx
6285 mips16_local_alias (rtx func)
6286 {
6287 struct mips16_local_alias *alias, tmp_alias;
6288 void **slot;
6289
6290 /* Create the hash table if this is the first call. */
6291 if (mips16_local_aliases == NULL)
6292 mips16_local_aliases = htab_create_ggc (37, mips16_local_aliases_hash,
6293 mips16_local_aliases_eq, NULL);
6294
6295 /* Look up the function symbol, creating a new entry if need be. */
6296 tmp_alias.func = func;
6297 slot = htab_find_slot (mips16_local_aliases, &tmp_alias, INSERT);
6298 gcc_assert (slot != NULL);
6299
6300 alias = (struct mips16_local_alias *) *slot;
6301 if (alias == NULL)
6302 {
6303 const char *func_name, *local_name;
6304 rtx local;
6305
6306 /* Create a new SYMBOL_REF for the local symbol. The choice of
6307 __fn_local_* is based on the __fn_stub_* names that we've
6308 traditionally used for the non-MIPS16 stub. */
6309 func_name = targetm.strip_name_encoding (XSTR (func, 0));
6310 local_name = ACONCAT (("__fn_local_", func_name, NULL));
6311 local = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (local_name));
6312 SYMBOL_REF_FLAGS (local) = SYMBOL_REF_FLAGS (func) | SYMBOL_FLAG_LOCAL;
6313
6314 /* Create a new structure to represent the mapping. */
6315 alias = ggc_alloc_mips16_local_alias ();
6316 alias->func = func;
6317 alias->local = local;
6318 *slot = alias;
6319 }
6320 return alias->local;
6321 }
6322 \f
6323 /* A chained list of functions for which mips16_build_call_stub has already
6324 generated a stub. NAME is the name of the function and FP_RET_P is true
6325 if the function returns a value in floating-point registers. */
6326 struct mips16_stub {
6327 struct mips16_stub *next;
6328 char *name;
6329 bool fp_ret_p;
6330 };
6331 static struct mips16_stub *mips16_stubs;
6332
6333 /* Return the two-character string that identifies floating-point
6334 return mode MODE in the name of a MIPS16 function stub. */
6335
6336 static const char *
6337 mips16_call_stub_mode_suffix (enum machine_mode mode)
6338 {
6339 if (mode == SFmode)
6340 return "sf";
6341 else if (mode == DFmode)
6342 return "df";
6343 else if (mode == SCmode)
6344 return "sc";
6345 else if (mode == DCmode)
6346 return "dc";
6347 else if (mode == V2SFmode)
6348 return "df";
6349 else
6350 gcc_unreachable ();
6351 }
6352
6353 /* Write instructions to move a 32-bit value between general register
6354 GPREG and floating-point register FPREG. DIRECTION is 't' to move
6355 from GPREG to FPREG and 'f' to move in the opposite direction. */
6356
6357 static void
6358 mips_output_32bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
6359 {
6360 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6361 reg_names[gpreg], reg_names[fpreg]);
6362 }
6363
6364 /* Likewise for 64-bit values. */
6365
6366 static void
6367 mips_output_64bit_xfer (char direction, unsigned int gpreg, unsigned int fpreg)
6368 {
6369 if (TARGET_64BIT)
6370 fprintf (asm_out_file, "\tdm%cc1\t%s,%s\n", direction,
6371 reg_names[gpreg], reg_names[fpreg]);
6372 else if (TARGET_FLOAT64)
6373 {
6374 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6375 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
6376 fprintf (asm_out_file, "\tm%chc1\t%s,%s\n", direction,
6377 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg]);
6378 }
6379 else
6380 {
6381 /* Move the least-significant word. */
6382 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6383 reg_names[gpreg + TARGET_BIG_ENDIAN], reg_names[fpreg]);
6384 /* ...then the most significant word. */
6385 fprintf (asm_out_file, "\tm%cc1\t%s,%s\n", direction,
6386 reg_names[gpreg + TARGET_LITTLE_ENDIAN], reg_names[fpreg + 1]);
6387 }
6388 }
6389
6390 /* Write out code to move floating-point arguments into or out of
6391 general registers. FP_CODE is the code describing which arguments
6392 are present (see the comment above the definition of CUMULATIVE_ARGS
6393 in mips.h). DIRECTION is as for mips_output_32bit_xfer. */
6394
6395 static void
6396 mips_output_args_xfer (int fp_code, char direction)
6397 {
6398 unsigned int gparg, fparg, f;
6399 CUMULATIVE_ARGS cum;
6400
6401 /* This code only works for o32 and o64. */
6402 gcc_assert (TARGET_OLDABI);
6403
6404 mips_init_cumulative_args (&cum, NULL);
6405
6406 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
6407 {
6408 enum machine_mode mode;
6409 struct mips_arg_info info;
6410
6411 if ((f & 3) == 1)
6412 mode = SFmode;
6413 else if ((f & 3) == 2)
6414 mode = DFmode;
6415 else
6416 gcc_unreachable ();
6417
6418 mips_get_arg_info (&info, &cum, mode, NULL, true);
6419 gparg = mips_arg_regno (&info, false);
6420 fparg = mips_arg_regno (&info, true);
6421
6422 if (mode == SFmode)
6423 mips_output_32bit_xfer (direction, gparg, fparg);
6424 else
6425 mips_output_64bit_xfer (direction, gparg, fparg);
6426
6427 mips_function_arg_advance (pack_cumulative_args (&cum), mode, NULL, true);
6428 }
6429 }
6430
6431 /* Write a MIPS16 stub for the current function. This stub is used
6432 for functions which take arguments in the floating-point registers.
6433 It is normal-mode code that moves the floating-point arguments
6434 into the general registers and then jumps to the MIPS16 code. */
6435
6436 static void
6437 mips16_build_function_stub (void)
6438 {
6439 const char *fnname, *alias_name, *separator;
6440 char *secname, *stubname;
6441 tree stubdecl;
6442 unsigned int f;
6443 rtx symbol, alias;
6444
6445 /* Create the name of the stub, and its unique section. */
6446 symbol = XEXP (DECL_RTL (current_function_decl), 0);
6447 alias = mips16_local_alias (symbol);
6448
6449 fnname = targetm.strip_name_encoding (XSTR (symbol, 0));
6450 alias_name = targetm.strip_name_encoding (XSTR (alias, 0));
6451 secname = ACONCAT ((".mips16.fn.", fnname, NULL));
6452 stubname = ACONCAT (("__fn_stub_", fnname, NULL));
6453
6454 /* Build a decl for the stub. */
6455 stubdecl = build_decl (BUILTINS_LOCATION,
6456 FUNCTION_DECL, get_identifier (stubname),
6457 build_function_type_list (void_type_node, NULL_TREE));
6458 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname);
6459 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION,
6460 RESULT_DECL, NULL_TREE, void_type_node);
6461
6462 /* Output a comment. */
6463 fprintf (asm_out_file, "\t# Stub function for %s (",
6464 current_function_name ());
6465 separator = "";
6466 for (f = (unsigned int) crtl->args.info.fp_code; f != 0; f >>= 2)
6467 {
6468 fprintf (asm_out_file, "%s%s", separator,
6469 (f & 3) == 1 ? "float" : "double");
6470 separator = ", ";
6471 }
6472 fprintf (asm_out_file, ")\n");
6473
6474 /* Start the function definition. */
6475 assemble_start_function (stubdecl, stubname);
6476 mips_start_function_definition (stubname, false);
6477
6478 /* If generating pic2 code, either set up the global pointer or
6479 switch to pic0. */
6480 if (TARGET_ABICALLS_PIC2)
6481 {
6482 if (TARGET_ABSOLUTE_ABICALLS)
6483 fprintf (asm_out_file, "\t.option\tpic0\n");
6484 else
6485 {
6486 output_asm_insn ("%(.cpload\t%^%)", NULL);
6487 /* Emit an R_MIPS_NONE relocation to tell the linker what the
6488 target function is. Use a local GOT access when loading the
6489 symbol, to cut down on the number of unnecessary GOT entries
6490 for stubs that aren't needed. */
6491 output_asm_insn (".reloc\t0,R_MIPS_NONE,%0", &symbol);
6492 symbol = alias;
6493 }
6494 }
6495
6496 /* Load the address of the MIPS16 function into $25. Do this first so
6497 that targets with coprocessor interlocks can use an MFC1 to fill the
6498 delay slot. */
6499 output_asm_insn ("la\t%^,%0", &symbol);
6500
6501 /* Move the arguments from floating-point registers to general registers. */
6502 mips_output_args_xfer (crtl->args.info.fp_code, 'f');
6503
6504 /* Jump to the MIPS16 function. */
6505 output_asm_insn ("jr\t%^", NULL);
6506
6507 if (TARGET_ABICALLS_PIC2 && TARGET_ABSOLUTE_ABICALLS)
6508 fprintf (asm_out_file, "\t.option\tpic2\n");
6509
6510 mips_end_function_definition (stubname);
6511
6512 /* If the linker needs to create a dynamic symbol for the target
6513 function, it will associate the symbol with the stub (which,
6514 unlike the target function, follows the proper calling conventions).
6515 It is therefore useful to have a local alias for the target function,
6516 so that it can still be identified as MIPS16 code. As an optimization,
6517 this symbol can also be used for indirect MIPS16 references from
6518 within this file. */
6519 ASM_OUTPUT_DEF (asm_out_file, alias_name, fnname);
6520
6521 switch_to_section (function_section (current_function_decl));
6522 }
6523
6524 /* The current function is a MIPS16 function that returns a value in an FPR.
6525 Copy the return value from its soft-float to its hard-float location.
6526 libgcc2 has special non-MIPS16 helper functions for each case. */
6527
6528 static void
6529 mips16_copy_fpr_return_value (void)
6530 {
6531 rtx fn, insn, retval;
6532 tree return_type;
6533 enum machine_mode return_mode;
6534 const char *name;
6535
6536 return_type = DECL_RESULT (current_function_decl);
6537 return_mode = DECL_MODE (return_type);
6538
6539 name = ACONCAT (("__mips16_ret_",
6540 mips16_call_stub_mode_suffix (return_mode),
6541 NULL));
6542 fn = mips16_stub_function (name);
6543
6544 /* The function takes arguments in $2 (and possibly $3), so calls
6545 to it cannot be lazily bound. */
6546 SYMBOL_REF_FLAGS (fn) |= SYMBOL_FLAG_BIND_NOW;
6547
6548 /* Model the call as something that takes the GPR return value as
6549 argument and returns an "updated" value. */
6550 retval = gen_rtx_REG (return_mode, GP_RETURN);
6551 insn = mips_expand_call (MIPS_CALL_EPILOGUE, retval, fn,
6552 const0_rtx, NULL_RTX, false);
6553 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), retval);
6554 }
6555
6556 /* Consider building a stub for a MIPS16 call to function *FN_PTR.
6557 RETVAL is the location of the return value, or null if this is
6558 a "call" rather than a "call_value". ARGS_SIZE is the size of the
6559 arguments and FP_CODE is the code built by mips_function_arg;
6560 see the comment before the fp_code field in CUMULATIVE_ARGS for details.
6561
6562 There are three alternatives:
6563
6564 - If a stub was needed, emit the call and return the call insn itself.
6565
6566 - If we can avoid using a stub by redirecting the call, set *FN_PTR
6567 to the new target and return null.
6568
6569 - If *FN_PTR doesn't need a stub, return null and leave *FN_PTR
6570 unmodified.
6571
6572 A stub is needed for calls to functions that, in normal mode,
6573 receive arguments in FPRs or return values in FPRs. The stub
6574 copies the arguments from their soft-float positions to their
6575 hard-float positions, calls the real function, then copies the
6576 return value from its hard-float position to its soft-float
6577 position.
6578
6579 We can emit a JAL to *FN_PTR even when *FN_PTR might need a stub.
6580 If *FN_PTR turns out to be to a non-MIPS16 function, the linker
6581 automatically redirects the JAL to the stub, otherwise the JAL
6582 continues to call FN directly. */
6583
6584 static rtx
6585 mips16_build_call_stub (rtx retval, rtx *fn_ptr, rtx args_size, int fp_code)
6586 {
6587 const char *fnname;
6588 bool fp_ret_p;
6589 struct mips16_stub *l;
6590 rtx insn, fn;
6591
6592 /* We don't need to do anything if we aren't in MIPS16 mode, or if
6593 we were invoked with the -msoft-float option. */
6594 if (!TARGET_MIPS16 || TARGET_SOFT_FLOAT_ABI)
6595 return NULL_RTX;
6596
6597 /* Figure out whether the value might come back in a floating-point
6598 register. */
6599 fp_ret_p = retval && mips_return_mode_in_fpr_p (GET_MODE (retval));
6600
6601 /* We don't need to do anything if there were no floating-point
6602 arguments and the value will not be returned in a floating-point
6603 register. */
6604 if (fp_code == 0 && !fp_ret_p)
6605 return NULL_RTX;
6606
6607 /* We don't need to do anything if this is a call to a special
6608 MIPS16 support function. */
6609 fn = *fn_ptr;
6610 if (mips16_stub_function_p (fn))
6611 return NULL_RTX;
6612
6613 /* If we're calling a locally-defined MIPS16 function, we know that
6614 it will return values in both the "soft-float" and "hard-float"
6615 registers. There is no need to use a stub to move the latter
6616 to the former. */
6617 if (fp_code == 0 && mips16_local_function_p (fn))
6618 return NULL_RTX;
6619
6620 /* This code will only work for o32 and o64 abis. The other ABI's
6621 require more sophisticated support. */
6622 gcc_assert (TARGET_OLDABI);
6623
6624 /* If we're calling via a function pointer, use one of the magic
6625 libgcc.a stubs provided for each (FP_CODE, FP_RET_P) combination.
6626 Each stub expects the function address to arrive in register $2. */
6627 if (GET_CODE (fn) != SYMBOL_REF
6628 || !call_insn_operand (fn, VOIDmode))
6629 {
6630 char buf[30];
6631 rtx stub_fn, insn, addr;
6632 bool lazy_p;
6633
6634 /* If this is a locally-defined and locally-binding function,
6635 avoid the stub by calling the local alias directly. */
6636 if (mips16_local_function_p (fn))
6637 {
6638 *fn_ptr = mips16_local_alias (fn);
6639 return NULL_RTX;
6640 }
6641
6642 /* Create a SYMBOL_REF for the libgcc.a function. */
6643 if (fp_ret_p)
6644 sprintf (buf, "__mips16_call_stub_%s_%d",
6645 mips16_call_stub_mode_suffix (GET_MODE (retval)),
6646 fp_code);
6647 else
6648 sprintf (buf, "__mips16_call_stub_%d", fp_code);
6649 stub_fn = mips16_stub_function (buf);
6650
6651 /* The function uses $2 as an argument, so calls to it
6652 cannot be lazily bound. */
6653 SYMBOL_REF_FLAGS (stub_fn) |= SYMBOL_FLAG_BIND_NOW;
6654
6655 /* Load the target function into $2. */
6656 addr = gen_rtx_REG (Pmode, GP_REG_FIRST + 2);
6657 lazy_p = mips_load_call_address (MIPS_CALL_NORMAL, addr, fn);
6658
6659 /* Emit the call. */
6660 insn = mips_expand_call (MIPS_CALL_NORMAL, retval, stub_fn,
6661 args_size, NULL_RTX, lazy_p);
6662
6663 /* Tell GCC that this call does indeed use the value of $2. */
6664 use_reg (&CALL_INSN_FUNCTION_USAGE (insn), addr);
6665
6666 /* If we are handling a floating-point return value, we need to
6667 save $18 in the function prologue. Putting a note on the
6668 call will mean that df_regs_ever_live_p ($18) will be true if the
6669 call is not eliminated, and we can check that in the prologue
6670 code. */
6671 if (fp_ret_p)
6672 CALL_INSN_FUNCTION_USAGE (insn) =
6673 gen_rtx_EXPR_LIST (VOIDmode,
6674 gen_rtx_CLOBBER (VOIDmode,
6675 gen_rtx_REG (word_mode, 18)),
6676 CALL_INSN_FUNCTION_USAGE (insn));
6677
6678 return insn;
6679 }
6680
6681 /* We know the function we are going to call. If we have already
6682 built a stub, we don't need to do anything further. */
6683 fnname = targetm.strip_name_encoding (XSTR (fn, 0));
6684 for (l = mips16_stubs; l != NULL; l = l->next)
6685 if (strcmp (l->name, fnname) == 0)
6686 break;
6687
6688 if (l == NULL)
6689 {
6690 const char *separator;
6691 char *secname, *stubname;
6692 tree stubid, stubdecl;
6693 unsigned int f;
6694
6695 /* If the function does not return in FPRs, the special stub
6696 section is named
6697 .mips16.call.FNNAME
6698
6699 If the function does return in FPRs, the stub section is named
6700 .mips16.call.fp.FNNAME
6701
6702 Build a decl for the stub. */
6703 secname = ACONCAT ((".mips16.call.", fp_ret_p ? "fp." : "",
6704 fnname, NULL));
6705 stubname = ACONCAT (("__call_stub_", fp_ret_p ? "fp_" : "",
6706 fnname, NULL));
6707 stubid = get_identifier (stubname);
6708 stubdecl = build_decl (BUILTINS_LOCATION,
6709 FUNCTION_DECL, stubid,
6710 build_function_type_list (void_type_node,
6711 NULL_TREE));
6712 DECL_SECTION_NAME (stubdecl) = build_string (strlen (secname), secname);
6713 DECL_RESULT (stubdecl) = build_decl (BUILTINS_LOCATION,
6714 RESULT_DECL, NULL_TREE,
6715 void_type_node);
6716
6717 /* Output a comment. */
6718 fprintf (asm_out_file, "\t# Stub function to call %s%s (",
6719 (fp_ret_p
6720 ? (GET_MODE (retval) == SFmode ? "float " : "double ")
6721 : ""),
6722 fnname);
6723 separator = "";
6724 for (f = (unsigned int) fp_code; f != 0; f >>= 2)
6725 {
6726 fprintf (asm_out_file, "%s%s", separator,
6727 (f & 3) == 1 ? "float" : "double");
6728 separator = ", ";
6729 }
6730 fprintf (asm_out_file, ")\n");
6731
6732 /* Start the function definition. */
6733 assemble_start_function (stubdecl, stubname);
6734 mips_start_function_definition (stubname, false);
6735
6736 if (fp_ret_p)
6737 {
6738 fprintf (asm_out_file, "\t.cfi_startproc\n");
6739
6740 /* Create a fake CFA 4 bytes below the stack pointer.
6741 This works around unwinders (like libgcc's) that expect
6742 the CFA for non-signal frames to be unique. */
6743 fprintf (asm_out_file, "\t.cfi_def_cfa 29,-4\n");
6744
6745 /* "Save" $sp in itself so we don't use the fake CFA.
6746 This is: DW_CFA_val_expression r29, { DW_OP_reg29 }. */
6747 fprintf (asm_out_file, "\t.cfi_escape 0x16,29,1,0x6d\n");
6748 }
6749 else
6750 {
6751 /* Load the address of the MIPS16 function into $25. Do this
6752 first so that targets with coprocessor interlocks can use
6753 an MFC1 to fill the delay slot. */
6754 if (TARGET_EXPLICIT_RELOCS)
6755 {
6756 output_asm_insn ("lui\t%^,%%hi(%0)", &fn);
6757 output_asm_insn ("addiu\t%^,%^,%%lo(%0)", &fn);
6758 }
6759 else
6760 output_asm_insn ("la\t%^,%0", &fn);
6761 }
6762
6763 /* Move the arguments from general registers to floating-point
6764 registers. */
6765 mips_output_args_xfer (fp_code, 't');
6766
6767 if (fp_ret_p)
6768 {
6769 /* Save the return address in $18 and call the non-MIPS16 function.
6770 The stub's caller knows that $18 might be clobbered, even though
6771 $18 is usually a call-saved register. */
6772 fprintf (asm_out_file, "\tmove\t%s,%s\n",
6773 reg_names[GP_REG_FIRST + 18], reg_names[RETURN_ADDR_REGNUM]);
6774 output_asm_insn (MIPS_CALL ("jal", &fn, 0, -1), &fn);
6775 fprintf (asm_out_file, "\t.cfi_register 31,18\n");
6776
6777 /* Move the result from floating-point registers to
6778 general registers. */
6779 switch (GET_MODE (retval))
6780 {
6781 case SCmode:
6782 mips_output_32bit_xfer ('f', GP_RETURN + TARGET_BIG_ENDIAN,
6783 TARGET_BIG_ENDIAN
6784 ? FP_REG_FIRST + MAX_FPRS_PER_FMT
6785 : FP_REG_FIRST);
6786 mips_output_32bit_xfer ('f', GP_RETURN + TARGET_LITTLE_ENDIAN,
6787 TARGET_LITTLE_ENDIAN
6788 ? FP_REG_FIRST + MAX_FPRS_PER_FMT
6789 : FP_REG_FIRST);
6790 if (GET_MODE (retval) == SCmode && TARGET_64BIT)
6791 {
6792 /* On 64-bit targets, complex floats are returned in
6793 a single GPR, such that "sd" on a suitably-aligned
6794 target would store the value correctly. */
6795 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n",
6796 reg_names[GP_RETURN + TARGET_BIG_ENDIAN],
6797 reg_names[GP_RETURN + TARGET_BIG_ENDIAN]);
6798 fprintf (asm_out_file, "\tdsll\t%s,%s,32\n",
6799 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN],
6800 reg_names[GP_RETURN + TARGET_LITTLE_ENDIAN]);
6801 fprintf (asm_out_file, "\tdsrl\t%s,%s,32\n",
6802 reg_names[GP_RETURN + TARGET_BIG_ENDIAN],
6803 reg_names[GP_RETURN + TARGET_BIG_ENDIAN]);
6804 fprintf (asm_out_file, "\tor\t%s,%s,%s\n",
6805 reg_names[GP_RETURN],
6806 reg_names[GP_RETURN],
6807 reg_names[GP_RETURN + 1]);
6808 }
6809 break;
6810
6811 case SFmode:
6812 mips_output_32bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6813 break;
6814
6815 case DCmode:
6816 mips_output_64bit_xfer ('f', GP_RETURN + (8 / UNITS_PER_WORD),
6817 FP_REG_FIRST + MAX_FPRS_PER_FMT);
6818 /* Fall though. */
6819 case DFmode:
6820 case V2SFmode:
6821 mips_output_64bit_xfer ('f', GP_RETURN, FP_REG_FIRST);
6822 break;
6823
6824 default:
6825 gcc_unreachable ();
6826 }
6827 fprintf (asm_out_file, "\tjr\t%s\n", reg_names[GP_REG_FIRST + 18]);
6828 fprintf (asm_out_file, "\t.cfi_endproc\n");
6829 }
6830 else
6831 {
6832 /* Jump to the previously-loaded address. */
6833 output_asm_insn ("jr\t%^", NULL);
6834 }
6835
6836 #ifdef ASM_DECLARE_FUNCTION_SIZE
6837 ASM_DECLARE_FUNCTION_SIZE (asm_out_file, stubname, stubdecl);
6838 #endif
6839
6840 mips_end_function_definition (stubname);
6841
6842 /* Record this stub. */
6843 l = XNEW (struct mips16_stub);
6844 l->name = xstrdup (fnname);
6845 l->fp_ret_p = fp_ret_p;
6846 l->next = mips16_stubs;
6847 mips16_stubs = l;
6848 }
6849
6850 /* If we expect a floating-point return value, but we've built a
6851 stub which does not expect one, then we're in trouble. We can't
6852 use the existing stub, because it won't handle the floating-point
6853 value. We can't build a new stub, because the linker won't know
6854 which stub to use for the various calls in this object file.
6855 Fortunately, this case is illegal, since it means that a function
6856 was declared in two different ways in a single compilation. */
6857 if (fp_ret_p && !l->fp_ret_p)
6858 error ("cannot handle inconsistent calls to %qs", fnname);
6859
6860 if (retval == NULL_RTX)
6861 insn = gen_call_internal_direct (fn, args_size);
6862 else
6863 insn = gen_call_value_internal_direct (retval, fn, args_size);
6864 insn = mips_emit_call_insn (insn, fn, fn, false);
6865
6866 /* If we are calling a stub which handles a floating-point return
6867 value, we need to arrange to save $18 in the prologue. We do this
6868 by marking the function call as using the register. The prologue
6869 will later see that it is used, and emit code to save it. */
6870 if (fp_ret_p)
6871 CALL_INSN_FUNCTION_USAGE (insn) =
6872 gen_rtx_EXPR_LIST (VOIDmode,
6873 gen_rtx_CLOBBER (VOIDmode,
6874 gen_rtx_REG (word_mode, 18)),
6875 CALL_INSN_FUNCTION_USAGE (insn));
6876
6877 return insn;
6878 }
6879 \f
6880 /* Expand a call of type TYPE. RESULT is where the result will go (null
6881 for "call"s and "sibcall"s), ADDR is the address of the function,
6882 ARGS_SIZE is the size of the arguments and AUX is the value passed
6883 to us by mips_function_arg. LAZY_P is true if this call already
6884 involves a lazily-bound function address (such as when calling
6885 functions through a MIPS16 hard-float stub).
6886
6887 Return the call itself. */
6888
6889 rtx
6890 mips_expand_call (enum mips_call_type type, rtx result, rtx addr,
6891 rtx args_size, rtx aux, bool lazy_p)
6892 {
6893 rtx orig_addr, pattern, insn;
6894 int fp_code;
6895
6896 fp_code = aux == 0 ? 0 : (int) GET_MODE (aux);
6897 insn = mips16_build_call_stub (result, &addr, args_size, fp_code);
6898 if (insn)
6899 {
6900 gcc_assert (!lazy_p && type == MIPS_CALL_NORMAL);
6901 return insn;
6902 }
6903
6904 orig_addr = addr;
6905 if (!call_insn_operand (addr, VOIDmode))
6906 {
6907 if (type == MIPS_CALL_EPILOGUE)
6908 addr = MIPS_EPILOGUE_TEMP (Pmode);
6909 else
6910 addr = gen_reg_rtx (Pmode);
6911 lazy_p |= mips_load_call_address (type, addr, orig_addr);
6912 }
6913
6914 if (result == 0)
6915 {
6916 rtx (*fn) (rtx, rtx);
6917
6918 if (type == MIPS_CALL_SIBCALL)
6919 fn = gen_sibcall_internal;
6920 else
6921 fn = gen_call_internal;
6922
6923 pattern = fn (addr, args_size);
6924 }
6925 else if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 2)
6926 {
6927 /* Handle return values created by mips_return_fpr_pair. */
6928 rtx (*fn) (rtx, rtx, rtx, rtx);
6929 rtx reg1, reg2;
6930
6931 if (type == MIPS_CALL_SIBCALL)
6932 fn = gen_sibcall_value_multiple_internal;
6933 else
6934 fn = gen_call_value_multiple_internal;
6935
6936 reg1 = XEXP (XVECEXP (result, 0, 0), 0);
6937 reg2 = XEXP (XVECEXP (result, 0, 1), 0);
6938 pattern = fn (reg1, addr, args_size, reg2);
6939 }
6940 else
6941 {
6942 rtx (*fn) (rtx, rtx, rtx);
6943
6944 if (type == MIPS_CALL_SIBCALL)
6945 fn = gen_sibcall_value_internal;
6946 else
6947 fn = gen_call_value_internal;
6948
6949 /* Handle return values created by mips_return_fpr_single. */
6950 if (GET_CODE (result) == PARALLEL && XVECLEN (result, 0) == 1)
6951 result = XEXP (XVECEXP (result, 0, 0), 0);
6952 pattern = fn (result, addr, args_size);
6953 }
6954
6955 return mips_emit_call_insn (pattern, orig_addr, addr, lazy_p);
6956 }
6957
6958 /* Split call instruction INSN into a $gp-clobbering call and
6959 (where necessary) an instruction to restore $gp from its save slot.
6960 CALL_PATTERN is the pattern of the new call. */
6961
6962 void
6963 mips_split_call (rtx insn, rtx call_pattern)
6964 {
6965 emit_call_insn (call_pattern);
6966 if (!find_reg_note (insn, REG_NORETURN, 0))
6967 /* Pick a temporary register that is suitable for both MIPS16 and
6968 non-MIPS16 code. $4 and $5 are used for returning complex double
6969 values in soft-float code, so $6 is the first suitable candidate. */
6970 mips_restore_gp_from_cprestore_slot (gen_rtx_REG (Pmode, GP_ARG_FIRST + 2));
6971 }
6972
6973 /* Return true if a call to DECL may need to use JALX. */
6974
6975 static bool
6976 mips_call_may_need_jalx_p (tree decl)
6977 {
6978 /* If the current translation unit would use a different mode for DECL,
6979 assume that the call needs JALX. */
6980 if (mips_get_compress_mode (decl) != TARGET_COMPRESSION)
6981 return true;
6982
6983 /* mips_get_compress_mode is always accurate for locally-binding
6984 functions in the current translation unit. */
6985 if (!DECL_EXTERNAL (decl) && targetm.binds_local_p (decl))
6986 return false;
6987
6988 /* When -minterlink-compressed is in effect, assume that functions
6989 could use a different encoding mode unless an attribute explicitly
6990 tells us otherwise. */
6991 if (TARGET_INTERLINK_COMPRESSED)
6992 {
6993 if (!TARGET_COMPRESSION
6994 && mips_get_compress_off_flags (DECL_ATTRIBUTES (decl)) ==0)
6995 return true;
6996 if (TARGET_COMPRESSION
6997 && mips_get_compress_on_flags (DECL_ATTRIBUTES (decl)) == 0)
6998 return true;
6999 }
7000
7001 return false;
7002 }
7003
7004 /* Implement TARGET_FUNCTION_OK_FOR_SIBCALL. */
7005
7006 static bool
7007 mips_function_ok_for_sibcall (tree decl, tree exp ATTRIBUTE_UNUSED)
7008 {
7009 if (!TARGET_SIBCALLS)
7010 return false;
7011
7012 /* Interrupt handlers need special epilogue code and therefore can't
7013 use sibcalls. */
7014 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
7015 return false;
7016
7017 /* Direct Js are only possible to functions that use the same ISA encoding.
7018 There is no JX counterpoart of JALX. */
7019 if (decl
7020 && const_call_insn_operand (XEXP (DECL_RTL (decl), 0), VOIDmode)
7021 && mips_call_may_need_jalx_p (decl))
7022 return false;
7023
7024 /* Sibling calls should not prevent lazy binding. Lazy-binding stubs
7025 require $gp to be valid on entry, so sibcalls can only use stubs
7026 if $gp is call-clobbered. */
7027 if (decl
7028 && TARGET_CALL_SAVED_GP
7029 && !TARGET_ABICALLS_PIC0
7030 && !targetm.binds_local_p (decl))
7031 return false;
7032
7033 /* Otherwise OK. */
7034 return true;
7035 }
7036 \f
7037 /* Emit code to move general operand SRC into condition-code
7038 register DEST given that SCRATCH is a scratch TFmode FPR.
7039 The sequence is:
7040
7041 FP1 = SRC
7042 FP2 = 0.0f
7043 DEST = FP2 < FP1
7044
7045 where FP1 and FP2 are single-precision FPRs taken from SCRATCH. */
7046
7047 void
7048 mips_expand_fcc_reload (rtx dest, rtx src, rtx scratch)
7049 {
7050 rtx fp1, fp2;
7051
7052 /* Change the source to SFmode. */
7053 if (MEM_P (src))
7054 src = adjust_address (src, SFmode, 0);
7055 else if (REG_P (src) || GET_CODE (src) == SUBREG)
7056 src = gen_rtx_REG (SFmode, true_regnum (src));
7057
7058 fp1 = gen_rtx_REG (SFmode, REGNO (scratch));
7059 fp2 = gen_rtx_REG (SFmode, REGNO (scratch) + MAX_FPRS_PER_FMT);
7060
7061 mips_emit_move (copy_rtx (fp1), src);
7062 mips_emit_move (copy_rtx (fp2), CONST0_RTX (SFmode));
7063 emit_insn (gen_slt_sf (dest, fp2, fp1));
7064 }
7065 \f
7066 /* Implement MOVE_BY_PIECES_P. */
7067
7068 bool
7069 mips_move_by_pieces_p (unsigned HOST_WIDE_INT size, unsigned int align)
7070 {
7071 if (HAVE_movmemsi)
7072 {
7073 /* movmemsi is meant to generate code that is at least as good as
7074 move_by_pieces. However, movmemsi effectively uses a by-pieces
7075 implementation both for moves smaller than a word and for
7076 word-aligned moves of no more than MIPS_MAX_MOVE_BYTES_STRAIGHT
7077 bytes. We should allow the tree-level optimisers to do such
7078 moves by pieces, as it often exposes other optimization
7079 opportunities. We might as well continue to use movmemsi at
7080 the rtl level though, as it produces better code when
7081 scheduling is disabled (such as at -O). */
7082 if (currently_expanding_to_rtl)
7083 return false;
7084 if (align < BITS_PER_WORD)
7085 return size < UNITS_PER_WORD;
7086 return size <= MIPS_MAX_MOVE_BYTES_STRAIGHT;
7087 }
7088 /* The default value. If this becomes a target hook, we should
7089 call the default definition instead. */
7090 return (move_by_pieces_ninsns (size, align, MOVE_MAX_PIECES + 1)
7091 < (unsigned int) MOVE_RATIO (optimize_insn_for_speed_p ()));
7092 }
7093
7094 /* Implement STORE_BY_PIECES_P. */
7095
7096 bool
7097 mips_store_by_pieces_p (unsigned HOST_WIDE_INT size, unsigned int align)
7098 {
7099 /* Storing by pieces involves moving constants into registers
7100 of size MIN (ALIGN, BITS_PER_WORD), then storing them.
7101 We need to decide whether it is cheaper to load the address of
7102 constant data into a register and use a block move instead. */
7103
7104 /* If the data is only byte aligned, then:
7105
7106 (a1) A block move of less than 4 bytes would involve three 3 LBs and
7107 3 SBs. We might as well use 3 single-instruction LIs and 3 SBs
7108 instead.
7109
7110 (a2) A block move of 4 bytes from aligned source data can use an
7111 LW/SWL/SWR sequence. This is often better than the 4 LIs and
7112 4 SBs that we would generate when storing by pieces. */
7113 if (align <= BITS_PER_UNIT)
7114 return size < 4;
7115
7116 /* If the data is 2-byte aligned, then:
7117
7118 (b1) A block move of less than 4 bytes would use a combination of LBs,
7119 LHs, SBs and SHs. We get better code by using single-instruction
7120 LIs, SBs and SHs instead.
7121
7122 (b2) A block move of 4 bytes from aligned source data would again use
7123 an LW/SWL/SWR sequence. In most cases, loading the address of
7124 the source data would require at least one extra instruction.
7125 It is often more efficient to use 2 single-instruction LIs and
7126 2 SHs instead.
7127
7128 (b3) A block move of up to 3 additional bytes would be like (b1).
7129
7130 (b4) A block move of 8 bytes from aligned source data can use two
7131 LW/SWL/SWR sequences or a single LD/SDL/SDR sequence. Both
7132 sequences are better than the 4 LIs and 4 SHs that we'd generate
7133 when storing by pieces.
7134
7135 The reasoning for higher alignments is similar:
7136
7137 (c1) A block move of less than 4 bytes would be the same as (b1).
7138
7139 (c2) A block move of 4 bytes would use an LW/SW sequence. Again,
7140 loading the address of the source data would typically require
7141 at least one extra instruction. It is generally better to use
7142 LUI/ORI/SW instead.
7143
7144 (c3) A block move of up to 3 additional bytes would be like (b1).
7145
7146 (c4) A block move of 8 bytes can use two LW/SW sequences or a single
7147 LD/SD sequence, and in these cases we've traditionally preferred
7148 the memory copy over the more bulky constant moves. */
7149 return size < 8;
7150 }
7151
7152 /* Emit straight-line code to move LENGTH bytes from SRC to DEST.
7153 Assume that the areas do not overlap. */
7154
7155 static void
7156 mips_block_move_straight (rtx dest, rtx src, HOST_WIDE_INT length)
7157 {
7158 HOST_WIDE_INT offset, delta;
7159 unsigned HOST_WIDE_INT bits;
7160 int i;
7161 enum machine_mode mode;
7162 rtx *regs;
7163
7164 /* Work out how many bits to move at a time. If both operands have
7165 half-word alignment, it is usually better to move in half words.
7166 For instance, lh/lh/sh/sh is usually better than lwl/lwr/swl/swr
7167 and lw/lw/sw/sw is usually better than ldl/ldr/sdl/sdr.
7168 Otherwise move word-sized chunks. */
7169 if (MEM_ALIGN (src) == BITS_PER_WORD / 2
7170 && MEM_ALIGN (dest) == BITS_PER_WORD / 2)
7171 bits = BITS_PER_WORD / 2;
7172 else
7173 bits = BITS_PER_WORD;
7174
7175 mode = mode_for_size (bits, MODE_INT, 0);
7176 delta = bits / BITS_PER_UNIT;
7177
7178 /* Allocate a buffer for the temporary registers. */
7179 regs = XALLOCAVEC (rtx, length / delta);
7180
7181 /* Load as many BITS-sized chunks as possible. Use a normal load if
7182 the source has enough alignment, otherwise use left/right pairs. */
7183 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
7184 {
7185 regs[i] = gen_reg_rtx (mode);
7186 if (MEM_ALIGN (src) >= bits)
7187 mips_emit_move (regs[i], adjust_address (src, mode, offset));
7188 else
7189 {
7190 rtx part = adjust_address (src, BLKmode, offset);
7191 set_mem_size (part, delta);
7192 if (!mips_expand_ext_as_unaligned_load (regs[i], part, bits, 0, 0))
7193 gcc_unreachable ();
7194 }
7195 }
7196
7197 /* Copy the chunks to the destination. */
7198 for (offset = 0, i = 0; offset + delta <= length; offset += delta, i++)
7199 if (MEM_ALIGN (dest) >= bits)
7200 mips_emit_move (adjust_address (dest, mode, offset), regs[i]);
7201 else
7202 {
7203 rtx part = adjust_address (dest, BLKmode, offset);
7204 set_mem_size (part, delta);
7205 if (!mips_expand_ins_as_unaligned_store (part, regs[i], bits, 0))
7206 gcc_unreachable ();
7207 }
7208
7209 /* Mop up any left-over bytes. */
7210 if (offset < length)
7211 {
7212 src = adjust_address (src, BLKmode, offset);
7213 dest = adjust_address (dest, BLKmode, offset);
7214 move_by_pieces (dest, src, length - offset,
7215 MIN (MEM_ALIGN (src), MEM_ALIGN (dest)), 0);
7216 }
7217 }
7218
7219 /* Helper function for doing a loop-based block operation on memory
7220 reference MEM. Each iteration of the loop will operate on LENGTH
7221 bytes of MEM.
7222
7223 Create a new base register for use within the loop and point it to
7224 the start of MEM. Create a new memory reference that uses this
7225 register. Store them in *LOOP_REG and *LOOP_MEM respectively. */
7226
7227 static void
7228 mips_adjust_block_mem (rtx mem, HOST_WIDE_INT length,
7229 rtx *loop_reg, rtx *loop_mem)
7230 {
7231 *loop_reg = copy_addr_to_reg (XEXP (mem, 0));
7232
7233 /* Although the new mem does not refer to a known location,
7234 it does keep up to LENGTH bytes of alignment. */
7235 *loop_mem = change_address (mem, BLKmode, *loop_reg);
7236 set_mem_align (*loop_mem, MIN (MEM_ALIGN (mem), length * BITS_PER_UNIT));
7237 }
7238
7239 /* Move LENGTH bytes from SRC to DEST using a loop that moves BYTES_PER_ITER
7240 bytes at a time. LENGTH must be at least BYTES_PER_ITER. Assume that
7241 the memory regions do not overlap. */
7242
7243 static void
7244 mips_block_move_loop (rtx dest, rtx src, HOST_WIDE_INT length,
7245 HOST_WIDE_INT bytes_per_iter)
7246 {
7247 rtx label, src_reg, dest_reg, final_src, test;
7248 HOST_WIDE_INT leftover;
7249
7250 leftover = length % bytes_per_iter;
7251 length -= leftover;
7252
7253 /* Create registers and memory references for use within the loop. */
7254 mips_adjust_block_mem (src, bytes_per_iter, &src_reg, &src);
7255 mips_adjust_block_mem (dest, bytes_per_iter, &dest_reg, &dest);
7256
7257 /* Calculate the value that SRC_REG should have after the last iteration
7258 of the loop. */
7259 final_src = expand_simple_binop (Pmode, PLUS, src_reg, GEN_INT (length),
7260 0, 0, OPTAB_WIDEN);
7261
7262 /* Emit the start of the loop. */
7263 label = gen_label_rtx ();
7264 emit_label (label);
7265
7266 /* Emit the loop body. */
7267 mips_block_move_straight (dest, src, bytes_per_iter);
7268
7269 /* Move on to the next block. */
7270 mips_emit_move (src_reg, plus_constant (Pmode, src_reg, bytes_per_iter));
7271 mips_emit_move (dest_reg, plus_constant (Pmode, dest_reg, bytes_per_iter));
7272
7273 /* Emit the loop condition. */
7274 test = gen_rtx_NE (VOIDmode, src_reg, final_src);
7275 if (Pmode == DImode)
7276 emit_jump_insn (gen_cbranchdi4 (test, src_reg, final_src, label));
7277 else
7278 emit_jump_insn (gen_cbranchsi4 (test, src_reg, final_src, label));
7279
7280 /* Mop up any left-over bytes. */
7281 if (leftover)
7282 mips_block_move_straight (dest, src, leftover);
7283 }
7284
7285 /* Expand a movmemsi instruction, which copies LENGTH bytes from
7286 memory reference SRC to memory reference DEST. */
7287
7288 bool
7289 mips_expand_block_move (rtx dest, rtx src, rtx length)
7290 {
7291 if (CONST_INT_P (length))
7292 {
7293 if (INTVAL (length) <= MIPS_MAX_MOVE_BYTES_STRAIGHT)
7294 {
7295 mips_block_move_straight (dest, src, INTVAL (length));
7296 return true;
7297 }
7298 else if (optimize)
7299 {
7300 mips_block_move_loop (dest, src, INTVAL (length),
7301 MIPS_MAX_MOVE_BYTES_PER_LOOP_ITER);
7302 return true;
7303 }
7304 }
7305 return false;
7306 }
7307 \f
7308 /* Expand a loop of synci insns for the address range [BEGIN, END). */
7309
7310 void
7311 mips_expand_synci_loop (rtx begin, rtx end)
7312 {
7313 rtx inc, label, end_label, cmp_result, mask, length;
7314
7315 /* Create end_label. */
7316 end_label = gen_label_rtx ();
7317
7318 /* Check if begin equals end. */
7319 cmp_result = gen_rtx_EQ (VOIDmode, begin, end);
7320 emit_jump_insn (gen_condjump (cmp_result, end_label));
7321
7322 /* Load INC with the cache line size (rdhwr INC,$1). */
7323 inc = gen_reg_rtx (Pmode);
7324 emit_insn (PMODE_INSN (gen_rdhwr_synci_step, (inc)));
7325
7326 /* Check if inc is 0. */
7327 cmp_result = gen_rtx_EQ (VOIDmode, inc, const0_rtx);
7328 emit_jump_insn (gen_condjump (cmp_result, end_label));
7329
7330 /* Calculate mask. */
7331 mask = mips_force_unary (Pmode, NEG, inc);
7332
7333 /* Mask out begin by mask. */
7334 begin = mips_force_binary (Pmode, AND, begin, mask);
7335
7336 /* Calculate length. */
7337 length = mips_force_binary (Pmode, MINUS, end, begin);
7338
7339 /* Loop back to here. */
7340 label = gen_label_rtx ();
7341 emit_label (label);
7342
7343 emit_insn (gen_synci (begin));
7344
7345 /* Update length. */
7346 mips_emit_binary (MINUS, length, length, inc);
7347
7348 /* Update begin. */
7349 mips_emit_binary (PLUS, begin, begin, inc);
7350
7351 /* Check if length is greater than 0. */
7352 cmp_result = gen_rtx_GT (VOIDmode, length, const0_rtx);
7353 emit_jump_insn (gen_condjump (cmp_result, label));
7354
7355 emit_label (end_label);
7356 }
7357 \f
7358 /* Expand a QI or HI mode atomic memory operation.
7359
7360 GENERATOR contains a pointer to the gen_* function that generates
7361 the SI mode underlying atomic operation using masks that we
7362 calculate.
7363
7364 RESULT is the return register for the operation. Its value is NULL
7365 if unused.
7366
7367 MEM is the location of the atomic access.
7368
7369 OLDVAL is the first operand for the operation.
7370
7371 NEWVAL is the optional second operand for the operation. Its value
7372 is NULL if unused. */
7373
7374 void
7375 mips_expand_atomic_qihi (union mips_gen_fn_ptrs generator,
7376 rtx result, rtx mem, rtx oldval, rtx newval)
7377 {
7378 rtx orig_addr, memsi_addr, memsi, shift, shiftsi, unshifted_mask;
7379 rtx unshifted_mask_reg, mask, inverted_mask, si_op;
7380 rtx res = NULL;
7381 enum machine_mode mode;
7382
7383 mode = GET_MODE (mem);
7384
7385 /* Compute the address of the containing SImode value. */
7386 orig_addr = force_reg (Pmode, XEXP (mem, 0));
7387 memsi_addr = mips_force_binary (Pmode, AND, orig_addr,
7388 force_reg (Pmode, GEN_INT (-4)));
7389
7390 /* Create a memory reference for it. */
7391 memsi = gen_rtx_MEM (SImode, memsi_addr);
7392 set_mem_alias_set (memsi, ALIAS_SET_MEMORY_BARRIER);
7393 MEM_VOLATILE_P (memsi) = MEM_VOLATILE_P (mem);
7394
7395 /* Work out the byte offset of the QImode or HImode value,
7396 counting from the least significant byte. */
7397 shift = mips_force_binary (Pmode, AND, orig_addr, GEN_INT (3));
7398 if (TARGET_BIG_ENDIAN)
7399 mips_emit_binary (XOR, shift, shift, GEN_INT (mode == QImode ? 3 : 2));
7400
7401 /* Multiply by eight to convert the shift value from bytes to bits. */
7402 mips_emit_binary (ASHIFT, shift, shift, GEN_INT (3));
7403
7404 /* Make the final shift an SImode value, so that it can be used in
7405 SImode operations. */
7406 shiftsi = force_reg (SImode, gen_lowpart (SImode, shift));
7407
7408 /* Set MASK to an inclusive mask of the QImode or HImode value. */
7409 unshifted_mask = GEN_INT (GET_MODE_MASK (mode));
7410 unshifted_mask_reg = force_reg (SImode, unshifted_mask);
7411 mask = mips_force_binary (SImode, ASHIFT, unshifted_mask_reg, shiftsi);
7412
7413 /* Compute the equivalent exclusive mask. */
7414 inverted_mask = gen_reg_rtx (SImode);
7415 emit_insn (gen_rtx_SET (VOIDmode, inverted_mask,
7416 gen_rtx_NOT (SImode, mask)));
7417
7418 /* Shift the old value into place. */
7419 if (oldval != const0_rtx)
7420 {
7421 oldval = convert_modes (SImode, mode, oldval, true);
7422 oldval = force_reg (SImode, oldval);
7423 oldval = mips_force_binary (SImode, ASHIFT, oldval, shiftsi);
7424 }
7425
7426 /* Do the same for the new value. */
7427 if (newval && newval != const0_rtx)
7428 {
7429 newval = convert_modes (SImode, mode, newval, true);
7430 newval = force_reg (SImode, newval);
7431 newval = mips_force_binary (SImode, ASHIFT, newval, shiftsi);
7432 }
7433
7434 /* Do the SImode atomic access. */
7435 if (result)
7436 res = gen_reg_rtx (SImode);
7437 if (newval)
7438 si_op = generator.fn_6 (res, memsi, mask, inverted_mask, oldval, newval);
7439 else if (result)
7440 si_op = generator.fn_5 (res, memsi, mask, inverted_mask, oldval);
7441 else
7442 si_op = generator.fn_4 (memsi, mask, inverted_mask, oldval);
7443
7444 emit_insn (si_op);
7445
7446 if (result)
7447 {
7448 /* Shift and convert the result. */
7449 mips_emit_binary (AND, res, res, mask);
7450 mips_emit_binary (LSHIFTRT, res, res, shiftsi);
7451 mips_emit_move (result, gen_lowpart (GET_MODE (result), res));
7452 }
7453 }
7454
7455 /* Return true if it is possible to use left/right accesses for a
7456 bitfield of WIDTH bits starting BITPOS bits into BLKmode memory OP.
7457 When returning true, update *LEFT and *RIGHT as follows:
7458
7459 *LEFT is a QImode reference to the first byte if big endian or
7460 the last byte if little endian. This address can be used in the
7461 left-side instructions (LWL, SWL, LDL, SDL).
7462
7463 *RIGHT is a QImode reference to the opposite end of the field and
7464 can be used in the patterning right-side instruction. */
7465
7466 static bool
7467 mips_get_unaligned_mem (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos,
7468 rtx *left, rtx *right)
7469 {
7470 rtx first, last;
7471
7472 /* Check that the size is valid. */
7473 if (width != 32 && (!TARGET_64BIT || width != 64))
7474 return false;
7475
7476 /* We can only access byte-aligned values. Since we are always passed
7477 a reference to the first byte of the field, it is not necessary to
7478 do anything with BITPOS after this check. */
7479 if (bitpos % BITS_PER_UNIT != 0)
7480 return false;
7481
7482 /* Reject aligned bitfields: we want to use a normal load or store
7483 instead of a left/right pair. */
7484 if (MEM_ALIGN (op) >= width)
7485 return false;
7486
7487 /* Get references to both ends of the field. */
7488 first = adjust_address (op, QImode, 0);
7489 last = adjust_address (op, QImode, width / BITS_PER_UNIT - 1);
7490
7491 /* Allocate to LEFT and RIGHT according to endianness. LEFT should
7492 correspond to the MSB and RIGHT to the LSB. */
7493 if (TARGET_BIG_ENDIAN)
7494 *left = first, *right = last;
7495 else
7496 *left = last, *right = first;
7497
7498 return true;
7499 }
7500
7501 /* Try to use left/right loads to expand an "extv" or "extzv" pattern.
7502 DEST, SRC, WIDTH and BITPOS are the operands passed to the expander;
7503 the operation is the equivalent of:
7504
7505 (set DEST (*_extract SRC WIDTH BITPOS))
7506
7507 Return true on success. */
7508
7509 bool
7510 mips_expand_ext_as_unaligned_load (rtx dest, rtx src, HOST_WIDE_INT width,
7511 HOST_WIDE_INT bitpos, bool unsigned_p)
7512 {
7513 rtx left, right, temp;
7514 rtx dest1 = NULL_RTX;
7515
7516 /* If TARGET_64BIT, the destination of a 32-bit "extz" or "extzv" will
7517 be a DImode, create a new temp and emit a zero extend at the end. */
7518 if (GET_MODE (dest) == DImode
7519 && REG_P (dest)
7520 && GET_MODE_BITSIZE (SImode) == width)
7521 {
7522 dest1 = dest;
7523 dest = gen_reg_rtx (SImode);
7524 }
7525
7526 if (!mips_get_unaligned_mem (src, width, bitpos, &left, &right))
7527 return false;
7528
7529 temp = gen_reg_rtx (GET_MODE (dest));
7530 if (GET_MODE (dest) == DImode)
7531 {
7532 emit_insn (gen_mov_ldl (temp, src, left));
7533 emit_insn (gen_mov_ldr (dest, copy_rtx (src), right, temp));
7534 }
7535 else
7536 {
7537 emit_insn (gen_mov_lwl (temp, src, left));
7538 emit_insn (gen_mov_lwr (dest, copy_rtx (src), right, temp));
7539 }
7540
7541 /* If we were loading 32bits and the original register was DI then
7542 sign/zero extend into the orignal dest. */
7543 if (dest1)
7544 {
7545 if (unsigned_p)
7546 emit_insn (gen_zero_extendsidi2 (dest1, dest));
7547 else
7548 emit_insn (gen_extendsidi2 (dest1, dest));
7549 }
7550 return true;
7551 }
7552
7553 /* Try to use left/right stores to expand an "ins" pattern. DEST, WIDTH,
7554 BITPOS and SRC are the operands passed to the expander; the operation
7555 is the equivalent of:
7556
7557 (set (zero_extract DEST WIDTH BITPOS) SRC)
7558
7559 Return true on success. */
7560
7561 bool
7562 mips_expand_ins_as_unaligned_store (rtx dest, rtx src, HOST_WIDE_INT width,
7563 HOST_WIDE_INT bitpos)
7564 {
7565 rtx left, right;
7566 enum machine_mode mode;
7567
7568 if (!mips_get_unaligned_mem (dest, width, bitpos, &left, &right))
7569 return false;
7570
7571 mode = mode_for_size (width, MODE_INT, 0);
7572 src = gen_lowpart (mode, src);
7573 if (mode == DImode)
7574 {
7575 emit_insn (gen_mov_sdl (dest, src, left));
7576 emit_insn (gen_mov_sdr (copy_rtx (dest), copy_rtx (src), right));
7577 }
7578 else
7579 {
7580 emit_insn (gen_mov_swl (dest, src, left));
7581 emit_insn (gen_mov_swr (copy_rtx (dest), copy_rtx (src), right));
7582 }
7583 return true;
7584 }
7585
7586 /* Return true if X is a MEM with the same size as MODE. */
7587
7588 bool
7589 mips_mem_fits_mode_p (enum machine_mode mode, rtx x)
7590 {
7591 return (MEM_P (x)
7592 && MEM_SIZE_KNOWN_P (x)
7593 && MEM_SIZE (x) == GET_MODE_SIZE (mode));
7594 }
7595
7596 /* Return true if (zero_extract OP WIDTH BITPOS) can be used as the
7597 source of an "ext" instruction or the destination of an "ins"
7598 instruction. OP must be a register operand and the following
7599 conditions must hold:
7600
7601 0 <= BITPOS < GET_MODE_BITSIZE (GET_MODE (op))
7602 0 < WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
7603 0 < BITPOS + WIDTH <= GET_MODE_BITSIZE (GET_MODE (op))
7604
7605 Also reject lengths equal to a word as they are better handled
7606 by the move patterns. */
7607
7608 bool
7609 mips_use_ins_ext_p (rtx op, HOST_WIDE_INT width, HOST_WIDE_INT bitpos)
7610 {
7611 if (!ISA_HAS_EXT_INS
7612 || !register_operand (op, VOIDmode)
7613 || GET_MODE_BITSIZE (GET_MODE (op)) > BITS_PER_WORD)
7614 return false;
7615
7616 if (!IN_RANGE (width, 1, GET_MODE_BITSIZE (GET_MODE (op)) - 1))
7617 return false;
7618
7619 if (bitpos < 0 || bitpos + width > GET_MODE_BITSIZE (GET_MODE (op)))
7620 return false;
7621
7622 return true;
7623 }
7624
7625 /* Check if MASK and SHIFT are valid in mask-low-and-shift-left
7626 operation if MAXLEN is the maxium length of consecutive bits that
7627 can make up MASK. MODE is the mode of the operation. See
7628 mask_low_and_shift_len for the actual definition. */
7629
7630 bool
7631 mask_low_and_shift_p (enum machine_mode mode, rtx mask, rtx shift, int maxlen)
7632 {
7633 return IN_RANGE (mask_low_and_shift_len (mode, mask, shift), 1, maxlen);
7634 }
7635
7636 /* Return true iff OP1 and OP2 are valid operands together for the
7637 *and<MODE>3 and *and<MODE>3_mips16 patterns. For the cases to consider,
7638 see the table in the comment before the pattern. */
7639
7640 bool
7641 and_operands_ok (enum machine_mode mode, rtx op1, rtx op2)
7642 {
7643 return (memory_operand (op1, mode)
7644 ? and_load_operand (op2, mode)
7645 : and_reg_operand (op2, mode));
7646 }
7647
7648 /* The canonical form of a mask-low-and-shift-left operation is
7649 (and (ashift X SHIFT) MASK) where MASK has the lower SHIFT number of bits
7650 cleared. Thus we need to shift MASK to the right before checking if it
7651 is a valid mask value. MODE is the mode of the operation. If true
7652 return the length of the mask, otherwise return -1. */
7653
7654 int
7655 mask_low_and_shift_len (enum machine_mode mode, rtx mask, rtx shift)
7656 {
7657 HOST_WIDE_INT shval;
7658
7659 shval = INTVAL (shift) & (GET_MODE_BITSIZE (mode) - 1);
7660 return exact_log2 ((UINTVAL (mask) >> shval) + 1);
7661 }
7662 \f
7663 /* Return true if -msplit-addresses is selected and should be honored.
7664
7665 -msplit-addresses is a half-way house between explicit relocations
7666 and the traditional assembler macros. It can split absolute 32-bit
7667 symbolic constants into a high/lo_sum pair but uses macros for other
7668 sorts of access.
7669
7670 Like explicit relocation support for REL targets, it relies
7671 on GNU extensions in the assembler and the linker.
7672
7673 Although this code should work for -O0, it has traditionally
7674 been treated as an optimization. */
7675
7676 static bool
7677 mips_split_addresses_p (void)
7678 {
7679 return (TARGET_SPLIT_ADDRESSES
7680 && optimize
7681 && !TARGET_MIPS16
7682 && !flag_pic
7683 && !ABI_HAS_64BIT_SYMBOLS);
7684 }
7685
7686 /* (Re-)Initialize mips_split_p, mips_lo_relocs and mips_hi_relocs. */
7687
7688 static void
7689 mips_init_relocs (void)
7690 {
7691 memset (mips_split_p, '\0', sizeof (mips_split_p));
7692 memset (mips_split_hi_p, '\0', sizeof (mips_split_hi_p));
7693 memset (mips_use_pcrel_pool_p, '\0', sizeof (mips_use_pcrel_pool_p));
7694 memset (mips_hi_relocs, '\0', sizeof (mips_hi_relocs));
7695 memset (mips_lo_relocs, '\0', sizeof (mips_lo_relocs));
7696
7697 if (TARGET_MIPS16_PCREL_LOADS)
7698 mips_use_pcrel_pool_p[SYMBOL_ABSOLUTE] = true;
7699 else
7700 {
7701 if (ABI_HAS_64BIT_SYMBOLS)
7702 {
7703 if (TARGET_EXPLICIT_RELOCS)
7704 {
7705 mips_split_p[SYMBOL_64_HIGH] = true;
7706 mips_hi_relocs[SYMBOL_64_HIGH] = "%highest(";
7707 mips_lo_relocs[SYMBOL_64_HIGH] = "%higher(";
7708
7709 mips_split_p[SYMBOL_64_MID] = true;
7710 mips_hi_relocs[SYMBOL_64_MID] = "%higher(";
7711 mips_lo_relocs[SYMBOL_64_MID] = "%hi(";
7712
7713 mips_split_p[SYMBOL_64_LOW] = true;
7714 mips_hi_relocs[SYMBOL_64_LOW] = "%hi(";
7715 mips_lo_relocs[SYMBOL_64_LOW] = "%lo(";
7716
7717 mips_split_p[SYMBOL_ABSOLUTE] = true;
7718 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
7719 }
7720 }
7721 else
7722 {
7723 if (TARGET_EXPLICIT_RELOCS
7724 || mips_split_addresses_p ()
7725 || TARGET_MIPS16)
7726 {
7727 mips_split_p[SYMBOL_ABSOLUTE] = true;
7728 mips_hi_relocs[SYMBOL_ABSOLUTE] = "%hi(";
7729 mips_lo_relocs[SYMBOL_ABSOLUTE] = "%lo(";
7730 }
7731 }
7732 }
7733
7734 if (TARGET_MIPS16)
7735 {
7736 /* The high part is provided by a pseudo copy of $gp. */
7737 mips_split_p[SYMBOL_GP_RELATIVE] = true;
7738 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gprel(";
7739 }
7740 else if (TARGET_EXPLICIT_RELOCS)
7741 /* Small data constants are kept whole until after reload,
7742 then lowered by mips_rewrite_small_data. */
7743 mips_lo_relocs[SYMBOL_GP_RELATIVE] = "%gp_rel(";
7744
7745 if (TARGET_EXPLICIT_RELOCS)
7746 {
7747 mips_split_p[SYMBOL_GOT_PAGE_OFST] = true;
7748 if (TARGET_NEWABI)
7749 {
7750 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got_page(";
7751 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%got_ofst(";
7752 }
7753 else
7754 {
7755 mips_lo_relocs[SYMBOL_GOTOFF_PAGE] = "%got(";
7756 mips_lo_relocs[SYMBOL_GOT_PAGE_OFST] = "%lo(";
7757 }
7758 if (TARGET_MIPS16)
7759 /* Expose the use of $28 as soon as possible. */
7760 mips_split_hi_p[SYMBOL_GOT_PAGE_OFST] = true;
7761
7762 if (TARGET_XGOT)
7763 {
7764 /* The HIGH and LO_SUM are matched by special .md patterns. */
7765 mips_split_p[SYMBOL_GOT_DISP] = true;
7766
7767 mips_split_p[SYMBOL_GOTOFF_DISP] = true;
7768 mips_hi_relocs[SYMBOL_GOTOFF_DISP] = "%got_hi(";
7769 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_lo(";
7770
7771 mips_split_p[SYMBOL_GOTOFF_CALL] = true;
7772 mips_hi_relocs[SYMBOL_GOTOFF_CALL] = "%call_hi(";
7773 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call_lo(";
7774 }
7775 else
7776 {
7777 if (TARGET_NEWABI)
7778 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got_disp(";
7779 else
7780 mips_lo_relocs[SYMBOL_GOTOFF_DISP] = "%got(";
7781 mips_lo_relocs[SYMBOL_GOTOFF_CALL] = "%call16(";
7782 if (TARGET_MIPS16)
7783 /* Expose the use of $28 as soon as possible. */
7784 mips_split_p[SYMBOL_GOT_DISP] = true;
7785 }
7786 }
7787
7788 if (TARGET_NEWABI)
7789 {
7790 mips_split_p[SYMBOL_GOTOFF_LOADGP] = true;
7791 mips_hi_relocs[SYMBOL_GOTOFF_LOADGP] = "%hi(%neg(%gp_rel(";
7792 mips_lo_relocs[SYMBOL_GOTOFF_LOADGP] = "%lo(%neg(%gp_rel(";
7793 }
7794
7795 mips_lo_relocs[SYMBOL_TLSGD] = "%tlsgd(";
7796 mips_lo_relocs[SYMBOL_TLSLDM] = "%tlsldm(";
7797
7798 if (TARGET_MIPS16_PCREL_LOADS)
7799 {
7800 mips_use_pcrel_pool_p[SYMBOL_DTPREL] = true;
7801 mips_use_pcrel_pool_p[SYMBOL_TPREL] = true;
7802 }
7803 else
7804 {
7805 mips_split_p[SYMBOL_DTPREL] = true;
7806 mips_hi_relocs[SYMBOL_DTPREL] = "%dtprel_hi(";
7807 mips_lo_relocs[SYMBOL_DTPREL] = "%dtprel_lo(";
7808
7809 mips_split_p[SYMBOL_TPREL] = true;
7810 mips_hi_relocs[SYMBOL_TPREL] = "%tprel_hi(";
7811 mips_lo_relocs[SYMBOL_TPREL] = "%tprel_lo(";
7812 }
7813
7814 mips_lo_relocs[SYMBOL_GOTTPREL] = "%gottprel(";
7815 mips_lo_relocs[SYMBOL_HALF] = "%half(";
7816 }
7817
7818 /* Print symbolic operand OP, which is part of a HIGH or LO_SUM
7819 in context CONTEXT. RELOCS is the array of relocations to use. */
7820
7821 static void
7822 mips_print_operand_reloc (FILE *file, rtx op, enum mips_symbol_context context,
7823 const char **relocs)
7824 {
7825 enum mips_symbol_type symbol_type;
7826 const char *p;
7827
7828 symbol_type = mips_classify_symbolic_expression (op, context);
7829 gcc_assert (relocs[symbol_type]);
7830
7831 fputs (relocs[symbol_type], file);
7832 output_addr_const (file, mips_strip_unspec_address (op));
7833 for (p = relocs[symbol_type]; *p != 0; p++)
7834 if (*p == '(')
7835 fputc (')', file);
7836 }
7837
7838 /* Start a new block with the given asm switch enabled. If we need
7839 to print a directive, emit PREFIX before it and SUFFIX after it. */
7840
7841 static void
7842 mips_push_asm_switch_1 (struct mips_asm_switch *asm_switch,
7843 const char *prefix, const char *suffix)
7844 {
7845 if (asm_switch->nesting_level == 0)
7846 fprintf (asm_out_file, "%s.set\tno%s%s", prefix, asm_switch->name, suffix);
7847 asm_switch->nesting_level++;
7848 }
7849
7850 /* Likewise, but end a block. */
7851
7852 static void
7853 mips_pop_asm_switch_1 (struct mips_asm_switch *asm_switch,
7854 const char *prefix, const char *suffix)
7855 {
7856 gcc_assert (asm_switch->nesting_level);
7857 asm_switch->nesting_level--;
7858 if (asm_switch->nesting_level == 0)
7859 fprintf (asm_out_file, "%s.set\t%s%s", prefix, asm_switch->name, suffix);
7860 }
7861
7862 /* Wrappers around mips_push_asm_switch_1 and mips_pop_asm_switch_1
7863 that either print a complete line or print nothing. */
7864
7865 void
7866 mips_push_asm_switch (struct mips_asm_switch *asm_switch)
7867 {
7868 mips_push_asm_switch_1 (asm_switch, "\t", "\n");
7869 }
7870
7871 void
7872 mips_pop_asm_switch (struct mips_asm_switch *asm_switch)
7873 {
7874 mips_pop_asm_switch_1 (asm_switch, "\t", "\n");
7875 }
7876
7877 /* Print the text for PRINT_OPERAND punctation character CH to FILE.
7878 The punctuation characters are:
7879
7880 '(' Start a nested ".set noreorder" block.
7881 ')' End a nested ".set noreorder" block.
7882 '[' Start a nested ".set noat" block.
7883 ']' End a nested ".set noat" block.
7884 '<' Start a nested ".set nomacro" block.
7885 '>' End a nested ".set nomacro" block.
7886 '*' Behave like %(%< if generating a delayed-branch sequence.
7887 '#' Print a nop if in a ".set noreorder" block.
7888 '/' Like '#', but do nothing within a delayed-branch sequence.
7889 '?' Print "l" if mips_branch_likely is true
7890 '~' Print a nop if mips_branch_likely is true
7891 '.' Print the name of the register with a hard-wired zero (zero or $0).
7892 '@' Print the name of the assembler temporary register (at or $1).
7893 '^' Print the name of the pic call-through register (t9 or $25).
7894 '+' Print the name of the gp register (usually gp or $28).
7895 '$' Print the name of the stack pointer register (sp or $29).
7896 ':' Print "c" to use the compact version if the delay slot is a nop.
7897 '!' Print "s" to use the short version if the delay slot contains a
7898 16-bit instruction.
7899
7900 See also mips_init_print_operand_pucnt. */
7901
7902 static void
7903 mips_print_operand_punctuation (FILE *file, int ch)
7904 {
7905 switch (ch)
7906 {
7907 case '(':
7908 mips_push_asm_switch_1 (&mips_noreorder, "", "\n\t");
7909 break;
7910
7911 case ')':
7912 mips_pop_asm_switch_1 (&mips_noreorder, "\n\t", "");
7913 break;
7914
7915 case '[':
7916 mips_push_asm_switch_1 (&mips_noat, "", "\n\t");
7917 break;
7918
7919 case ']':
7920 mips_pop_asm_switch_1 (&mips_noat, "\n\t", "");
7921 break;
7922
7923 case '<':
7924 mips_push_asm_switch_1 (&mips_nomacro, "", "\n\t");
7925 break;
7926
7927 case '>':
7928 mips_pop_asm_switch_1 (&mips_nomacro, "\n\t", "");
7929 break;
7930
7931 case '*':
7932 if (final_sequence != 0)
7933 {
7934 mips_print_operand_punctuation (file, '(');
7935 mips_print_operand_punctuation (file, '<');
7936 }
7937 break;
7938
7939 case '#':
7940 if (mips_noreorder.nesting_level > 0)
7941 fputs ("\n\tnop", file);
7942 break;
7943
7944 case '/':
7945 /* Print an extra newline so that the delayed insn is separated
7946 from the following ones. This looks neater and is consistent
7947 with non-nop delayed sequences. */
7948 if (mips_noreorder.nesting_level > 0 && final_sequence == 0)
7949 fputs ("\n\tnop\n", file);
7950 break;
7951
7952 case '?':
7953 if (mips_branch_likely)
7954 putc ('l', file);
7955 break;
7956
7957 case '~':
7958 if (mips_branch_likely)
7959 fputs ("\n\tnop", file);
7960 break;
7961
7962 case '.':
7963 fputs (reg_names[GP_REG_FIRST + 0], file);
7964 break;
7965
7966 case '@':
7967 fputs (reg_names[AT_REGNUM], file);
7968 break;
7969
7970 case '^':
7971 fputs (reg_names[PIC_FUNCTION_ADDR_REGNUM], file);
7972 break;
7973
7974 case '+':
7975 fputs (reg_names[PIC_OFFSET_TABLE_REGNUM], file);
7976 break;
7977
7978 case '$':
7979 fputs (reg_names[STACK_POINTER_REGNUM], file);
7980 break;
7981
7982 case ':':
7983 /* When final_sequence is 0, the delay slot will be a nop. We can
7984 use the compact version for microMIPS. */
7985 if (final_sequence == 0)
7986 putc ('c', file);
7987 break;
7988
7989 case '!':
7990 /* If the delay slot instruction is short, then use the
7991 compact version. */
7992 if (final_sequence == 0
7993 || get_attr_length (XVECEXP (final_sequence, 0, 1)) == 2)
7994 putc ('s', file);
7995 break;
7996
7997 default:
7998 gcc_unreachable ();
7999 break;
8000 }
8001 }
8002
8003 /* Initialize mips_print_operand_punct. */
8004
8005 static void
8006 mips_init_print_operand_punct (void)
8007 {
8008 const char *p;
8009
8010 for (p = "()[]<>*#/?~.@^+$:!"; *p; p++)
8011 mips_print_operand_punct[(unsigned char) *p] = true;
8012 }
8013
8014 /* PRINT_OPERAND prefix LETTER refers to the integer branch instruction
8015 associated with condition CODE. Print the condition part of the
8016 opcode to FILE. */
8017
8018 static void
8019 mips_print_int_branch_condition (FILE *file, enum rtx_code code, int letter)
8020 {
8021 switch (code)
8022 {
8023 case EQ:
8024 case NE:
8025 case GT:
8026 case GE:
8027 case LT:
8028 case LE:
8029 case GTU:
8030 case GEU:
8031 case LTU:
8032 case LEU:
8033 /* Conveniently, the MIPS names for these conditions are the same
8034 as their RTL equivalents. */
8035 fputs (GET_RTX_NAME (code), file);
8036 break;
8037
8038 default:
8039 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
8040 break;
8041 }
8042 }
8043
8044 /* Likewise floating-point branches. */
8045
8046 static void
8047 mips_print_float_branch_condition (FILE *file, enum rtx_code code, int letter)
8048 {
8049 switch (code)
8050 {
8051 case EQ:
8052 fputs ("c1f", file);
8053 break;
8054
8055 case NE:
8056 fputs ("c1t", file);
8057 break;
8058
8059 default:
8060 output_operand_lossage ("'%%%c' is not a valid operand prefix", letter);
8061 break;
8062 }
8063 }
8064
8065 /* Implement TARGET_PRINT_OPERAND_PUNCT_VALID_P. */
8066
8067 static bool
8068 mips_print_operand_punct_valid_p (unsigned char code)
8069 {
8070 return mips_print_operand_punct[code];
8071 }
8072
8073 /* Implement TARGET_PRINT_OPERAND. The MIPS-specific operand codes are:
8074
8075 'X' Print CONST_INT OP in hexadecimal format.
8076 'x' Print the low 16 bits of CONST_INT OP in hexadecimal format.
8077 'd' Print CONST_INT OP in decimal.
8078 'm' Print one less than CONST_INT OP in decimal.
8079 'h' Print the high-part relocation associated with OP, after stripping
8080 any outermost HIGH.
8081 'R' Print the low-part relocation associated with OP.
8082 'C' Print the integer branch condition for comparison OP.
8083 'N' Print the inverse of the integer branch condition for comparison OP.
8084 'F' Print the FPU branch condition for comparison OP.
8085 'W' Print the inverse of the FPU branch condition for comparison OP.
8086 'T' Print 'f' for (eq:CC ...), 't' for (ne:CC ...),
8087 'z' for (eq:?I ...), 'n' for (ne:?I ...).
8088 't' Like 'T', but with the EQ/NE cases reversed
8089 'Y' Print mips_fp_conditions[INTVAL (OP)]
8090 'Z' Print OP and a comma for ISA_HAS_8CC, otherwise print nothing.
8091 'q' Print a DSP accumulator register.
8092 'D' Print the second part of a double-word register or memory operand.
8093 'L' Print the low-order register in a double-word register operand.
8094 'M' Print high-order register in a double-word register operand.
8095 'z' Print $0 if OP is zero, otherwise print OP normally.
8096 'b' Print the address of a memory operand, without offset. */
8097
8098 static void
8099 mips_print_operand (FILE *file, rtx op, int letter)
8100 {
8101 enum rtx_code code;
8102
8103 if (mips_print_operand_punct_valid_p (letter))
8104 {
8105 mips_print_operand_punctuation (file, letter);
8106 return;
8107 }
8108
8109 gcc_assert (op);
8110 code = GET_CODE (op);
8111
8112 switch (letter)
8113 {
8114 case 'X':
8115 if (CONST_INT_P (op))
8116 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op));
8117 else
8118 output_operand_lossage ("invalid use of '%%%c'", letter);
8119 break;
8120
8121 case 'x':
8122 if (CONST_INT_P (op))
8123 fprintf (file, HOST_WIDE_INT_PRINT_HEX, INTVAL (op) & 0xffff);
8124 else
8125 output_operand_lossage ("invalid use of '%%%c'", letter);
8126 break;
8127
8128 case 'd':
8129 if (CONST_INT_P (op))
8130 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op));
8131 else
8132 output_operand_lossage ("invalid use of '%%%c'", letter);
8133 break;
8134
8135 case 'm':
8136 if (CONST_INT_P (op))
8137 fprintf (file, HOST_WIDE_INT_PRINT_DEC, INTVAL (op) - 1);
8138 else
8139 output_operand_lossage ("invalid use of '%%%c'", letter);
8140 break;
8141
8142 case 'h':
8143 if (code == HIGH)
8144 op = XEXP (op, 0);
8145 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_hi_relocs);
8146 break;
8147
8148 case 'R':
8149 mips_print_operand_reloc (file, op, SYMBOL_CONTEXT_LEA, mips_lo_relocs);
8150 break;
8151
8152 case 'C':
8153 mips_print_int_branch_condition (file, code, letter);
8154 break;
8155
8156 case 'N':
8157 mips_print_int_branch_condition (file, reverse_condition (code), letter);
8158 break;
8159
8160 case 'F':
8161 mips_print_float_branch_condition (file, code, letter);
8162 break;
8163
8164 case 'W':
8165 mips_print_float_branch_condition (file, reverse_condition (code),
8166 letter);
8167 break;
8168
8169 case 'T':
8170 case 't':
8171 {
8172 int truth = (code == NE) == (letter == 'T');
8173 fputc ("zfnt"[truth * 2 + (GET_MODE (op) == CCmode)], file);
8174 }
8175 break;
8176
8177 case 'Y':
8178 if (code == CONST_INT && UINTVAL (op) < ARRAY_SIZE (mips_fp_conditions))
8179 fputs (mips_fp_conditions[UINTVAL (op)], file);
8180 else
8181 output_operand_lossage ("'%%%c' is not a valid operand prefix",
8182 letter);
8183 break;
8184
8185 case 'Z':
8186 if (ISA_HAS_8CC)
8187 {
8188 mips_print_operand (file, op, 0);
8189 fputc (',', file);
8190 }
8191 break;
8192
8193 case 'q':
8194 if (code == REG && MD_REG_P (REGNO (op)))
8195 fprintf (file, "$ac0");
8196 else if (code == REG && DSP_ACC_REG_P (REGNO (op)))
8197 fprintf (file, "$ac%c", reg_names[REGNO (op)][3]);
8198 else
8199 output_operand_lossage ("invalid use of '%%%c'", letter);
8200 break;
8201
8202 default:
8203 switch (code)
8204 {
8205 case REG:
8206 {
8207 unsigned int regno = REGNO (op);
8208 if ((letter == 'M' && TARGET_LITTLE_ENDIAN)
8209 || (letter == 'L' && TARGET_BIG_ENDIAN)
8210 || letter == 'D')
8211 regno++;
8212 else if (letter && letter != 'z' && letter != 'M' && letter != 'L')
8213 output_operand_lossage ("invalid use of '%%%c'", letter);
8214 /* We need to print $0 .. $31 for COP0 registers. */
8215 if (COP0_REG_P (regno))
8216 fprintf (file, "$%s", &reg_names[regno][4]);
8217 else
8218 fprintf (file, "%s", reg_names[regno]);
8219 }
8220 break;
8221
8222 case MEM:
8223 if (letter == 'D')
8224 output_address (plus_constant (Pmode, XEXP (op, 0), 4));
8225 else if (letter == 'b')
8226 {
8227 gcc_assert (REG_P (XEXP (op, 0)));
8228 mips_print_operand (file, XEXP (op, 0), 0);
8229 }
8230 else if (letter && letter != 'z')
8231 output_operand_lossage ("invalid use of '%%%c'", letter);
8232 else
8233 output_address (XEXP (op, 0));
8234 break;
8235
8236 default:
8237 if (letter == 'z' && op == CONST0_RTX (GET_MODE (op)))
8238 fputs (reg_names[GP_REG_FIRST], file);
8239 else if (letter && letter != 'z')
8240 output_operand_lossage ("invalid use of '%%%c'", letter);
8241 else if (CONST_GP_P (op))
8242 fputs (reg_names[GLOBAL_POINTER_REGNUM], file);
8243 else
8244 output_addr_const (file, mips_strip_unspec_address (op));
8245 break;
8246 }
8247 }
8248 }
8249
8250 /* Implement TARGET_PRINT_OPERAND_ADDRESS. */
8251
8252 static void
8253 mips_print_operand_address (FILE *file, rtx x)
8254 {
8255 struct mips_address_info addr;
8256
8257 if (mips_classify_address (&addr, x, word_mode, true))
8258 switch (addr.type)
8259 {
8260 case ADDRESS_REG:
8261 mips_print_operand (file, addr.offset, 0);
8262 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
8263 return;
8264
8265 case ADDRESS_LO_SUM:
8266 mips_print_operand_reloc (file, addr.offset, SYMBOL_CONTEXT_MEM,
8267 mips_lo_relocs);
8268 fprintf (file, "(%s)", reg_names[REGNO (addr.reg)]);
8269 return;
8270
8271 case ADDRESS_CONST_INT:
8272 output_addr_const (file, x);
8273 fprintf (file, "(%s)", reg_names[GP_REG_FIRST]);
8274 return;
8275
8276 case ADDRESS_SYMBOLIC:
8277 output_addr_const (file, mips_strip_unspec_address (x));
8278 return;
8279 }
8280 gcc_unreachable ();
8281 }
8282 \f
8283 /* Implement TARGET_ENCODE_SECTION_INFO. */
8284
8285 static void
8286 mips_encode_section_info (tree decl, rtx rtl, int first)
8287 {
8288 default_encode_section_info (decl, rtl, first);
8289
8290 if (TREE_CODE (decl) == FUNCTION_DECL)
8291 {
8292 rtx symbol = XEXP (rtl, 0);
8293 tree type = TREE_TYPE (decl);
8294
8295 /* Encode whether the symbol is short or long. */
8296 if ((TARGET_LONG_CALLS && !mips_near_type_p (type))
8297 || mips_far_type_p (type))
8298 SYMBOL_REF_FLAGS (symbol) |= SYMBOL_FLAG_LONG_CALL;
8299 }
8300 }
8301
8302 /* Implement TARGET_SELECT_RTX_SECTION. */
8303
8304 static section *
8305 mips_select_rtx_section (enum machine_mode mode, rtx x,
8306 unsigned HOST_WIDE_INT align)
8307 {
8308 /* ??? Consider using mergeable small data sections. */
8309 if (mips_rtx_constant_in_small_data_p (mode))
8310 return get_named_section (NULL, ".sdata", 0);
8311
8312 return default_elf_select_rtx_section (mode, x, align);
8313 }
8314
8315 /* Implement TARGET_ASM_FUNCTION_RODATA_SECTION.
8316
8317 The complication here is that, with the combination TARGET_ABICALLS
8318 && !TARGET_ABSOLUTE_ABICALLS && !TARGET_GPWORD, jump tables will use
8319 absolute addresses, and should therefore not be included in the
8320 read-only part of a DSO. Handle such cases by selecting a normal
8321 data section instead of a read-only one. The logic apes that in
8322 default_function_rodata_section. */
8323
8324 static section *
8325 mips_function_rodata_section (tree decl)
8326 {
8327 if (!TARGET_ABICALLS || TARGET_ABSOLUTE_ABICALLS || TARGET_GPWORD)
8328 return default_function_rodata_section (decl);
8329
8330 if (decl && DECL_SECTION_NAME (decl))
8331 {
8332 const char *name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl));
8333 if (DECL_ONE_ONLY (decl) && strncmp (name, ".gnu.linkonce.t.", 16) == 0)
8334 {
8335 char *rname = ASTRDUP (name);
8336 rname[14] = 'd';
8337 return get_section (rname, SECTION_LINKONCE | SECTION_WRITE, decl);
8338 }
8339 else if (flag_function_sections
8340 && flag_data_sections
8341 && strncmp (name, ".text.", 6) == 0)
8342 {
8343 char *rname = ASTRDUP (name);
8344 memcpy (rname + 1, "data", 4);
8345 return get_section (rname, SECTION_WRITE, decl);
8346 }
8347 }
8348 return data_section;
8349 }
8350
8351 /* Implement TARGET_IN_SMALL_DATA_P. */
8352
8353 static bool
8354 mips_in_small_data_p (const_tree decl)
8355 {
8356 unsigned HOST_WIDE_INT size;
8357
8358 if (TREE_CODE (decl) == STRING_CST || TREE_CODE (decl) == FUNCTION_DECL)
8359 return false;
8360
8361 /* We don't yet generate small-data references for -mabicalls
8362 or VxWorks RTP code. See the related -G handling in
8363 mips_option_override. */
8364 if (TARGET_ABICALLS || TARGET_VXWORKS_RTP)
8365 return false;
8366
8367 if (TREE_CODE (decl) == VAR_DECL && DECL_SECTION_NAME (decl) != 0)
8368 {
8369 const char *name;
8370
8371 /* Reject anything that isn't in a known small-data section. */
8372 name = TREE_STRING_POINTER (DECL_SECTION_NAME (decl));
8373 if (strcmp (name, ".sdata") != 0 && strcmp (name, ".sbss") != 0)
8374 return false;
8375
8376 /* If a symbol is defined externally, the assembler will use the
8377 usual -G rules when deciding how to implement macros. */
8378 if (mips_lo_relocs[SYMBOL_GP_RELATIVE] || !DECL_EXTERNAL (decl))
8379 return true;
8380 }
8381 else if (TARGET_EMBEDDED_DATA)
8382 {
8383 /* Don't put constants into the small data section: we want them
8384 to be in ROM rather than RAM. */
8385 if (TREE_CODE (decl) != VAR_DECL)
8386 return false;
8387
8388 if (TREE_READONLY (decl)
8389 && !TREE_SIDE_EFFECTS (decl)
8390 && (!DECL_INITIAL (decl) || TREE_CONSTANT (DECL_INITIAL (decl))))
8391 return false;
8392 }
8393
8394 /* Enforce -mlocal-sdata. */
8395 if (!TARGET_LOCAL_SDATA && !TREE_PUBLIC (decl))
8396 return false;
8397
8398 /* Enforce -mextern-sdata. */
8399 if (!TARGET_EXTERN_SDATA && DECL_P (decl))
8400 {
8401 if (DECL_EXTERNAL (decl))
8402 return false;
8403 if (DECL_COMMON (decl) && DECL_INITIAL (decl) == NULL)
8404 return false;
8405 }
8406
8407 /* We have traditionally not treated zero-sized objects as small data,
8408 so this is now effectively part of the ABI. */
8409 size = int_size_in_bytes (TREE_TYPE (decl));
8410 return size > 0 && size <= mips_small_data_threshold;
8411 }
8412
8413 /* Implement TARGET_USE_ANCHORS_FOR_SYMBOL_P. We don't want to use
8414 anchors for small data: the GP register acts as an anchor in that
8415 case. We also don't want to use them for PC-relative accesses,
8416 where the PC acts as an anchor. */
8417
8418 static bool
8419 mips_use_anchors_for_symbol_p (const_rtx symbol)
8420 {
8421 switch (mips_classify_symbol (symbol, SYMBOL_CONTEXT_MEM))
8422 {
8423 case SYMBOL_PC_RELATIVE:
8424 case SYMBOL_GP_RELATIVE:
8425 return false;
8426
8427 default:
8428 return default_use_anchors_for_symbol_p (symbol);
8429 }
8430 }
8431 \f
8432 /* The MIPS debug format wants all automatic variables and arguments
8433 to be in terms of the virtual frame pointer (stack pointer before
8434 any adjustment in the function), while the MIPS 3.0 linker wants
8435 the frame pointer to be the stack pointer after the initial
8436 adjustment. So, we do the adjustment here. The arg pointer (which
8437 is eliminated) points to the virtual frame pointer, while the frame
8438 pointer (which may be eliminated) points to the stack pointer after
8439 the initial adjustments. */
8440
8441 HOST_WIDE_INT
8442 mips_debugger_offset (rtx addr, HOST_WIDE_INT offset)
8443 {
8444 rtx offset2 = const0_rtx;
8445 rtx reg = eliminate_constant_term (addr, &offset2);
8446
8447 if (offset == 0)
8448 offset = INTVAL (offset2);
8449
8450 if (reg == stack_pointer_rtx
8451 || reg == frame_pointer_rtx
8452 || reg == hard_frame_pointer_rtx)
8453 {
8454 offset -= cfun->machine->frame.total_size;
8455 if (reg == hard_frame_pointer_rtx)
8456 offset += cfun->machine->frame.hard_frame_pointer_offset;
8457 }
8458
8459 return offset;
8460 }
8461 \f
8462 /* Implement ASM_OUTPUT_EXTERNAL. */
8463
8464 void
8465 mips_output_external (FILE *file, tree decl, const char *name)
8466 {
8467 default_elf_asm_output_external (file, decl, name);
8468
8469 /* We output the name if and only if TREE_SYMBOL_REFERENCED is
8470 set in order to avoid putting out names that are never really
8471 used. */
8472 if (TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
8473 {
8474 if (!TARGET_EXPLICIT_RELOCS && mips_in_small_data_p (decl))
8475 {
8476 /* When using assembler macros, emit .extern directives for
8477 all small-data externs so that the assembler knows how
8478 big they are.
8479
8480 In most cases it would be safe (though pointless) to emit
8481 .externs for other symbols too. One exception is when an
8482 object is within the -G limit but declared by the user to
8483 be in a section other than .sbss or .sdata. */
8484 fputs ("\t.extern\t", file);
8485 assemble_name (file, name);
8486 fprintf (file, ", " HOST_WIDE_INT_PRINT_DEC "\n",
8487 int_size_in_bytes (TREE_TYPE (decl)));
8488 }
8489 }
8490 }
8491
8492 /* Implement TARGET_ASM_OUTPUT_SOURCE_FILENAME. */
8493
8494 static void
8495 mips_output_filename (FILE *stream, const char *name)
8496 {
8497 /* If we are emitting DWARF-2, let dwarf2out handle the ".file"
8498 directives. */
8499 if (write_symbols == DWARF2_DEBUG)
8500 return;
8501 else if (mips_output_filename_first_time)
8502 {
8503 mips_output_filename_first_time = 0;
8504 num_source_filenames += 1;
8505 current_function_file = name;
8506 fprintf (stream, "\t.file\t%d ", num_source_filenames);
8507 output_quoted_string (stream, name);
8508 putc ('\n', stream);
8509 }
8510 /* If we are emitting stabs, let dbxout.c handle this (except for
8511 the mips_output_filename_first_time case). */
8512 else if (write_symbols == DBX_DEBUG)
8513 return;
8514 else if (name != current_function_file
8515 && strcmp (name, current_function_file) != 0)
8516 {
8517 num_source_filenames += 1;
8518 current_function_file = name;
8519 fprintf (stream, "\t.file\t%d ", num_source_filenames);
8520 output_quoted_string (stream, name);
8521 putc ('\n', stream);
8522 }
8523 }
8524
8525 /* Implement TARGET_ASM_OUTPUT_DWARF_DTPREL. */
8526
8527 static void ATTRIBUTE_UNUSED
8528 mips_output_dwarf_dtprel (FILE *file, int size, rtx x)
8529 {
8530 switch (size)
8531 {
8532 case 4:
8533 fputs ("\t.dtprelword\t", file);
8534 break;
8535
8536 case 8:
8537 fputs ("\t.dtpreldword\t", file);
8538 break;
8539
8540 default:
8541 gcc_unreachable ();
8542 }
8543 output_addr_const (file, x);
8544 fputs ("+0x8000", file);
8545 }
8546
8547 /* Implement TARGET_DWARF_REGISTER_SPAN. */
8548
8549 static rtx
8550 mips_dwarf_register_span (rtx reg)
8551 {
8552 rtx high, low;
8553 enum machine_mode mode;
8554
8555 /* By default, GCC maps increasing register numbers to increasing
8556 memory locations, but paired FPRs are always little-endian,
8557 regardless of the prevailing endianness. */
8558 mode = GET_MODE (reg);
8559 if (FP_REG_P (REGNO (reg))
8560 && TARGET_BIG_ENDIAN
8561 && MAX_FPRS_PER_FMT > 1
8562 && GET_MODE_SIZE (mode) > UNITS_PER_FPREG)
8563 {
8564 gcc_assert (GET_MODE_SIZE (mode) == UNITS_PER_HWFPVALUE);
8565 high = mips_subword (reg, true);
8566 low = mips_subword (reg, false);
8567 return gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, high, low));
8568 }
8569
8570 return NULL_RTX;
8571 }
8572
8573 /* DSP ALU can bypass data with no delays for the following pairs. */
8574 enum insn_code dspalu_bypass_table[][2] =
8575 {
8576 {CODE_FOR_mips_addsc, CODE_FOR_mips_addwc},
8577 {CODE_FOR_mips_cmpu_eq_qb, CODE_FOR_mips_pick_qb},
8578 {CODE_FOR_mips_cmpu_lt_qb, CODE_FOR_mips_pick_qb},
8579 {CODE_FOR_mips_cmpu_le_qb, CODE_FOR_mips_pick_qb},
8580 {CODE_FOR_mips_cmp_eq_ph, CODE_FOR_mips_pick_ph},
8581 {CODE_FOR_mips_cmp_lt_ph, CODE_FOR_mips_pick_ph},
8582 {CODE_FOR_mips_cmp_le_ph, CODE_FOR_mips_pick_ph},
8583 {CODE_FOR_mips_wrdsp, CODE_FOR_mips_insv}
8584 };
8585
8586 int
8587 mips_dspalu_bypass_p (rtx out_insn, rtx in_insn)
8588 {
8589 int i;
8590 int num_bypass = ARRAY_SIZE (dspalu_bypass_table);
8591 enum insn_code out_icode = (enum insn_code) INSN_CODE (out_insn);
8592 enum insn_code in_icode = (enum insn_code) INSN_CODE (in_insn);
8593
8594 for (i = 0; i < num_bypass; i++)
8595 {
8596 if (out_icode == dspalu_bypass_table[i][0]
8597 && in_icode == dspalu_bypass_table[i][1])
8598 return true;
8599 }
8600
8601 return false;
8602 }
8603 /* Implement ASM_OUTPUT_ASCII. */
8604
8605 void
8606 mips_output_ascii (FILE *stream, const char *string, size_t len)
8607 {
8608 size_t i;
8609 int cur_pos;
8610
8611 cur_pos = 17;
8612 fprintf (stream, "\t.ascii\t\"");
8613 for (i = 0; i < len; i++)
8614 {
8615 int c;
8616
8617 c = (unsigned char) string[i];
8618 if (ISPRINT (c))
8619 {
8620 if (c == '\\' || c == '\"')
8621 {
8622 putc ('\\', stream);
8623 cur_pos++;
8624 }
8625 putc (c, stream);
8626 cur_pos++;
8627 }
8628 else
8629 {
8630 fprintf (stream, "\\%03o", c);
8631 cur_pos += 4;
8632 }
8633
8634 if (cur_pos > 72 && i+1 < len)
8635 {
8636 cur_pos = 17;
8637 fprintf (stream, "\"\n\t.ascii\t\"");
8638 }
8639 }
8640 fprintf (stream, "\"\n");
8641 }
8642
8643 /* Return the pseudo-op for full SYMBOL_(D)TPREL address *ADDR.
8644 Update *ADDR with the operand that should be printed. */
8645
8646 const char *
8647 mips_output_tls_reloc_directive (rtx *addr)
8648 {
8649 enum mips_symbol_type type;
8650
8651 type = mips_classify_symbolic_expression (*addr, SYMBOL_CONTEXT_LEA);
8652 *addr = mips_strip_unspec_address (*addr);
8653 switch (type)
8654 {
8655 case SYMBOL_DTPREL:
8656 return Pmode == SImode ? ".dtprelword\t%0" : ".dtpreldword\t%0";
8657
8658 case SYMBOL_TPREL:
8659 return Pmode == SImode ? ".tprelword\t%0" : ".tpreldword\t%0";
8660
8661 default:
8662 gcc_unreachable ();
8663 }
8664 }
8665
8666 /* Emit either a label, .comm, or .lcomm directive. When using assembler
8667 macros, mark the symbol as written so that mips_asm_output_external
8668 won't emit an .extern for it. STREAM is the output file, NAME is the
8669 name of the symbol, INIT_STRING is the string that should be written
8670 before the symbol and FINAL_STRING is the string that should be
8671 written after it. FINAL_STRING is a printf format that consumes the
8672 remaining arguments. */
8673
8674 void
8675 mips_declare_object (FILE *stream, const char *name, const char *init_string,
8676 const char *final_string, ...)
8677 {
8678 va_list ap;
8679
8680 fputs (init_string, stream);
8681 assemble_name (stream, name);
8682 va_start (ap, final_string);
8683 vfprintf (stream, final_string, ap);
8684 va_end (ap);
8685
8686 if (!TARGET_EXPLICIT_RELOCS)
8687 {
8688 tree name_tree = get_identifier (name);
8689 TREE_ASM_WRITTEN (name_tree) = 1;
8690 }
8691 }
8692
8693 /* Declare a common object of SIZE bytes using asm directive INIT_STRING.
8694 NAME is the name of the object and ALIGN is the required alignment
8695 in bytes. TAKES_ALIGNMENT_P is true if the directive takes a third
8696 alignment argument. */
8697
8698 void
8699 mips_declare_common_object (FILE *stream, const char *name,
8700 const char *init_string,
8701 unsigned HOST_WIDE_INT size,
8702 unsigned int align, bool takes_alignment_p)
8703 {
8704 if (!takes_alignment_p)
8705 {
8706 size += (align / BITS_PER_UNIT) - 1;
8707 size -= size % (align / BITS_PER_UNIT);
8708 mips_declare_object (stream, name, init_string,
8709 "," HOST_WIDE_INT_PRINT_UNSIGNED "\n", size);
8710 }
8711 else
8712 mips_declare_object (stream, name, init_string,
8713 "," HOST_WIDE_INT_PRINT_UNSIGNED ",%u\n",
8714 size, align / BITS_PER_UNIT);
8715 }
8716
8717 /* Implement ASM_OUTPUT_ALIGNED_DECL_COMMON. This is usually the same as the
8718 elfos.h version, but we also need to handle -muninit-const-in-rodata. */
8719
8720 void
8721 mips_output_aligned_decl_common (FILE *stream, tree decl, const char *name,
8722 unsigned HOST_WIDE_INT size,
8723 unsigned int align)
8724 {
8725 /* If the target wants uninitialized const declarations in
8726 .rdata then don't put them in .comm. */
8727 if (TARGET_EMBEDDED_DATA
8728 && TARGET_UNINIT_CONST_IN_RODATA
8729 && TREE_CODE (decl) == VAR_DECL
8730 && TREE_READONLY (decl)
8731 && (DECL_INITIAL (decl) == 0 || DECL_INITIAL (decl) == error_mark_node))
8732 {
8733 if (TREE_PUBLIC (decl) && DECL_NAME (decl))
8734 targetm.asm_out.globalize_label (stream, name);
8735
8736 switch_to_section (readonly_data_section);
8737 ASM_OUTPUT_ALIGN (stream, floor_log2 (align / BITS_PER_UNIT));
8738 mips_declare_object (stream, name, "",
8739 ":\n\t.space\t" HOST_WIDE_INT_PRINT_UNSIGNED "\n",
8740 size);
8741 }
8742 else
8743 mips_declare_common_object (stream, name, "\n\t.comm\t",
8744 size, align, true);
8745 }
8746
8747 #ifdef ASM_OUTPUT_SIZE_DIRECTIVE
8748 extern int size_directive_output;
8749
8750 /* Implement ASM_DECLARE_OBJECT_NAME. This is like most of the standard ELF
8751 definitions except that it uses mips_declare_object to emit the label. */
8752
8753 void
8754 mips_declare_object_name (FILE *stream, const char *name,
8755 tree decl ATTRIBUTE_UNUSED)
8756 {
8757 #ifdef ASM_OUTPUT_TYPE_DIRECTIVE
8758 ASM_OUTPUT_TYPE_DIRECTIVE (stream, name, "object");
8759 #endif
8760
8761 size_directive_output = 0;
8762 if (!flag_inhibit_size_directive && DECL_SIZE (decl))
8763 {
8764 HOST_WIDE_INT size;
8765
8766 size_directive_output = 1;
8767 size = int_size_in_bytes (TREE_TYPE (decl));
8768 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
8769 }
8770
8771 mips_declare_object (stream, name, "", ":\n");
8772 }
8773
8774 /* Implement ASM_FINISH_DECLARE_OBJECT. This is generic ELF stuff. */
8775
8776 void
8777 mips_finish_declare_object (FILE *stream, tree decl, int top_level, int at_end)
8778 {
8779 const char *name;
8780
8781 name = XSTR (XEXP (DECL_RTL (decl), 0), 0);
8782 if (!flag_inhibit_size_directive
8783 && DECL_SIZE (decl) != 0
8784 && !at_end
8785 && top_level
8786 && DECL_INITIAL (decl) == error_mark_node
8787 && !size_directive_output)
8788 {
8789 HOST_WIDE_INT size;
8790
8791 size_directive_output = 1;
8792 size = int_size_in_bytes (TREE_TYPE (decl));
8793 ASM_OUTPUT_SIZE_DIRECTIVE (stream, name, size);
8794 }
8795 }
8796 #endif
8797 \f
8798 /* Return the FOO in the name of the ".mdebug.FOO" section associated
8799 with the current ABI. */
8800
8801 static const char *
8802 mips_mdebug_abi_name (void)
8803 {
8804 switch (mips_abi)
8805 {
8806 case ABI_32:
8807 return "abi32";
8808 case ABI_O64:
8809 return "abiO64";
8810 case ABI_N32:
8811 return "abiN32";
8812 case ABI_64:
8813 return "abi64";
8814 case ABI_EABI:
8815 return TARGET_64BIT ? "eabi64" : "eabi32";
8816 default:
8817 gcc_unreachable ();
8818 }
8819 }
8820
8821 /* Implement TARGET_ASM_FILE_START. */
8822
8823 static void
8824 mips_file_start (void)
8825 {
8826 default_file_start ();
8827
8828 /* Generate a special section to describe the ABI switches used to
8829 produce the resultant binary. */
8830
8831 /* Record the ABI itself. Modern versions of binutils encode
8832 this information in the ELF header flags, but GDB needs the
8833 information in order to correctly debug binaries produced by
8834 older binutils. See the function mips_gdbarch_init in
8835 gdb/mips-tdep.c. */
8836 fprintf (asm_out_file, "\t.section .mdebug.%s\n\t.previous\n",
8837 mips_mdebug_abi_name ());
8838
8839 /* There is no ELF header flag to distinguish long32 forms of the
8840 EABI from long64 forms. Emit a special section to help tools
8841 such as GDB. Do the same for o64, which is sometimes used with
8842 -mlong64. */
8843 if (mips_abi == ABI_EABI || mips_abi == ABI_O64)
8844 fprintf (asm_out_file, "\t.section .gcc_compiled_long%d\n"
8845 "\t.previous\n", TARGET_LONG64 ? 64 : 32);
8846
8847 /* Record the NaN encoding. */
8848 if (HAVE_AS_NAN || mips_nan != MIPS_IEEE_754_DEFAULT)
8849 fprintf (asm_out_file, "\t.nan\t%s\n",
8850 mips_nan == MIPS_IEEE_754_2008 ? "2008" : "legacy");
8851
8852 #ifdef HAVE_AS_GNU_ATTRIBUTE
8853 {
8854 int attr;
8855
8856 /* No floating-point operations, -mno-float. */
8857 if (TARGET_NO_FLOAT)
8858 attr = 0;
8859 /* Soft-float code, -msoft-float. */
8860 else if (!TARGET_HARD_FLOAT_ABI)
8861 attr = 3;
8862 /* Single-float code, -msingle-float. */
8863 else if (!TARGET_DOUBLE_FLOAT)
8864 attr = 2;
8865 /* 64-bit FP registers on a 32-bit target, -mips32r2 -mfp64. */
8866 else if (!TARGET_64BIT && TARGET_FLOAT64)
8867 attr = 4;
8868 /* Regular FP code, FP regs same size as GP regs, -mdouble-float. */
8869 else
8870 attr = 1;
8871
8872 fprintf (asm_out_file, "\t.gnu_attribute 4, %d\n", attr);
8873 }
8874 #endif
8875
8876 /* If TARGET_ABICALLS, tell GAS to generate -KPIC code. */
8877 if (TARGET_ABICALLS)
8878 {
8879 fprintf (asm_out_file, "\t.abicalls\n");
8880 if (TARGET_ABICALLS_PIC0)
8881 fprintf (asm_out_file, "\t.option\tpic0\n");
8882 }
8883
8884 if (flag_verbose_asm)
8885 fprintf (asm_out_file, "\n%s -G value = %d, Arch = %s, ISA = %d\n",
8886 ASM_COMMENT_START,
8887 mips_small_data_threshold, mips_arch_info->name, mips_isa);
8888 }
8889
8890 /* Implement TARGET_ASM_CODE_END. */
8891
8892 static void
8893 mips_code_end (void)
8894 {
8895 if (mips_need_mips16_rdhwr_p)
8896 mips_output_mips16_rdhwr ();
8897 }
8898 \f
8899 /* Make the last instruction frame-related and note that it performs
8900 the operation described by FRAME_PATTERN. */
8901
8902 static void
8903 mips_set_frame_expr (rtx frame_pattern)
8904 {
8905 rtx insn;
8906
8907 insn = get_last_insn ();
8908 RTX_FRAME_RELATED_P (insn) = 1;
8909 REG_NOTES (insn) = alloc_EXPR_LIST (REG_FRAME_RELATED_EXPR,
8910 frame_pattern,
8911 REG_NOTES (insn));
8912 }
8913
8914 /* Return a frame-related rtx that stores REG at MEM.
8915 REG must be a single register. */
8916
8917 static rtx
8918 mips_frame_set (rtx mem, rtx reg)
8919 {
8920 rtx set;
8921
8922 set = gen_rtx_SET (VOIDmode, mem, reg);
8923 RTX_FRAME_RELATED_P (set) = 1;
8924
8925 return set;
8926 }
8927
8928 /* Record that the epilogue has restored call-saved register REG. */
8929
8930 static void
8931 mips_add_cfa_restore (rtx reg)
8932 {
8933 mips_epilogue.cfa_restores = alloc_reg_note (REG_CFA_RESTORE, reg,
8934 mips_epilogue.cfa_restores);
8935 }
8936 \f
8937 /* If a MIPS16e SAVE or RESTORE instruction saves or restores register
8938 mips16e_s2_s8_regs[X], it must also save the registers in indexes
8939 X + 1 onwards. Likewise mips16e_a0_a3_regs. */
8940 static const unsigned char mips16e_s2_s8_regs[] = {
8941 30, 23, 22, 21, 20, 19, 18
8942 };
8943 static const unsigned char mips16e_a0_a3_regs[] = {
8944 4, 5, 6, 7
8945 };
8946
8947 /* A list of the registers that can be saved by the MIPS16e SAVE instruction,
8948 ordered from the uppermost in memory to the lowest in memory. */
8949 static const unsigned char mips16e_save_restore_regs[] = {
8950 31, 30, 23, 22, 21, 20, 19, 18, 17, 16, 7, 6, 5, 4
8951 };
8952
8953 /* Return the index of the lowest X in the range [0, SIZE) for which
8954 bit REGS[X] is set in MASK. Return SIZE if there is no such X. */
8955
8956 static unsigned int
8957 mips16e_find_first_register (unsigned int mask, const unsigned char *regs,
8958 unsigned int size)
8959 {
8960 unsigned int i;
8961
8962 for (i = 0; i < size; i++)
8963 if (BITSET_P (mask, regs[i]))
8964 break;
8965
8966 return i;
8967 }
8968
8969 /* *MASK_PTR is a mask of general-purpose registers and *NUM_REGS_PTR
8970 is the number of set bits. If *MASK_PTR contains REGS[X] for some X
8971 in [0, SIZE), adjust *MASK_PTR and *NUM_REGS_PTR so that the same
8972 is true for all indexes (X, SIZE). */
8973
8974 static void
8975 mips16e_mask_registers (unsigned int *mask_ptr, const unsigned char *regs,
8976 unsigned int size, unsigned int *num_regs_ptr)
8977 {
8978 unsigned int i;
8979
8980 i = mips16e_find_first_register (*mask_ptr, regs, size);
8981 for (i++; i < size; i++)
8982 if (!BITSET_P (*mask_ptr, regs[i]))
8983 {
8984 *num_regs_ptr += 1;
8985 *mask_ptr |= 1 << regs[i];
8986 }
8987 }
8988
8989 /* Return a simplified form of X using the register values in REG_VALUES.
8990 REG_VALUES[R] is the last value assigned to hard register R, or null
8991 if R has not been modified.
8992
8993 This function is rather limited, but is good enough for our purposes. */
8994
8995 static rtx
8996 mips16e_collect_propagate_value (rtx x, rtx *reg_values)
8997 {
8998 x = avoid_constant_pool_reference (x);
8999
9000 if (UNARY_P (x))
9001 {
9002 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
9003 return simplify_gen_unary (GET_CODE (x), GET_MODE (x),
9004 x0, GET_MODE (XEXP (x, 0)));
9005 }
9006
9007 if (ARITHMETIC_P (x))
9008 {
9009 rtx x0 = mips16e_collect_propagate_value (XEXP (x, 0), reg_values);
9010 rtx x1 = mips16e_collect_propagate_value (XEXP (x, 1), reg_values);
9011 return simplify_gen_binary (GET_CODE (x), GET_MODE (x), x0, x1);
9012 }
9013
9014 if (REG_P (x)
9015 && reg_values[REGNO (x)]
9016 && !rtx_unstable_p (reg_values[REGNO (x)]))
9017 return reg_values[REGNO (x)];
9018
9019 return x;
9020 }
9021
9022 /* Return true if (set DEST SRC) stores an argument register into its
9023 caller-allocated save slot, storing the number of that argument
9024 register in *REGNO_PTR if so. REG_VALUES is as for
9025 mips16e_collect_propagate_value. */
9026
9027 static bool
9028 mips16e_collect_argument_save_p (rtx dest, rtx src, rtx *reg_values,
9029 unsigned int *regno_ptr)
9030 {
9031 unsigned int argno, regno;
9032 HOST_WIDE_INT offset, required_offset;
9033 rtx addr, base;
9034
9035 /* Check that this is a word-mode store. */
9036 if (!MEM_P (dest) || !REG_P (src) || GET_MODE (dest) != word_mode)
9037 return false;
9038
9039 /* Check that the register being saved is an unmodified argument
9040 register. */
9041 regno = REGNO (src);
9042 if (!IN_RANGE (regno, GP_ARG_FIRST, GP_ARG_LAST) || reg_values[regno])
9043 return false;
9044 argno = regno - GP_ARG_FIRST;
9045
9046 /* Check whether the address is an appropriate stack-pointer or
9047 frame-pointer access. */
9048 addr = mips16e_collect_propagate_value (XEXP (dest, 0), reg_values);
9049 mips_split_plus (addr, &base, &offset);
9050 required_offset = cfun->machine->frame.total_size + argno * UNITS_PER_WORD;
9051 if (base == hard_frame_pointer_rtx)
9052 required_offset -= cfun->machine->frame.hard_frame_pointer_offset;
9053 else if (base != stack_pointer_rtx)
9054 return false;
9055 if (offset != required_offset)
9056 return false;
9057
9058 *regno_ptr = regno;
9059 return true;
9060 }
9061
9062 /* A subroutine of mips_expand_prologue, called only when generating
9063 MIPS16e SAVE instructions. Search the start of the function for any
9064 instructions that save argument registers into their caller-allocated
9065 save slots. Delete such instructions and return a value N such that
9066 saving [GP_ARG_FIRST, GP_ARG_FIRST + N) would make all the deleted
9067 instructions redundant. */
9068
9069 static unsigned int
9070 mips16e_collect_argument_saves (void)
9071 {
9072 rtx reg_values[FIRST_PSEUDO_REGISTER];
9073 rtx insn, next, set, dest, src;
9074 unsigned int nargs, regno;
9075
9076 push_topmost_sequence ();
9077 nargs = 0;
9078 memset (reg_values, 0, sizeof (reg_values));
9079 for (insn = get_insns (); insn; insn = next)
9080 {
9081 next = NEXT_INSN (insn);
9082 if (NOTE_P (insn) || DEBUG_INSN_P (insn))
9083 continue;
9084
9085 if (!INSN_P (insn))
9086 break;
9087
9088 set = PATTERN (insn);
9089 if (GET_CODE (set) != SET)
9090 break;
9091
9092 dest = SET_DEST (set);
9093 src = SET_SRC (set);
9094 if (mips16e_collect_argument_save_p (dest, src, reg_values, &regno))
9095 {
9096 if (!BITSET_P (cfun->machine->frame.mask, regno))
9097 {
9098 delete_insn (insn);
9099 nargs = MAX (nargs, (regno - GP_ARG_FIRST) + 1);
9100 }
9101 }
9102 else if (REG_P (dest) && GET_MODE (dest) == word_mode)
9103 reg_values[REGNO (dest)]
9104 = mips16e_collect_propagate_value (src, reg_values);
9105 else
9106 break;
9107 }
9108 pop_topmost_sequence ();
9109
9110 return nargs;
9111 }
9112
9113 /* Return a move between register REGNO and memory location SP + OFFSET.
9114 REG_PARM_P is true if SP + OFFSET belongs to REG_PARM_STACK_SPACE.
9115 Make the move a load if RESTORE_P, otherwise make it a store. */
9116
9117 static rtx
9118 mips16e_save_restore_reg (bool restore_p, bool reg_parm_p,
9119 HOST_WIDE_INT offset, unsigned int regno)
9120 {
9121 rtx reg, mem;
9122
9123 mem = gen_frame_mem (SImode, plus_constant (Pmode, stack_pointer_rtx,
9124 offset));
9125 reg = gen_rtx_REG (SImode, regno);
9126 if (restore_p)
9127 {
9128 mips_add_cfa_restore (reg);
9129 return gen_rtx_SET (VOIDmode, reg, mem);
9130 }
9131 if (reg_parm_p)
9132 return gen_rtx_SET (VOIDmode, mem, reg);
9133 return mips_frame_set (mem, reg);
9134 }
9135
9136 /* Return RTL for a MIPS16e SAVE or RESTORE instruction; RESTORE_P says which.
9137 The instruction must:
9138
9139 - Allocate or deallocate SIZE bytes in total; SIZE is known
9140 to be nonzero.
9141
9142 - Save or restore as many registers in *MASK_PTR as possible.
9143 The instruction saves the first registers at the top of the
9144 allocated area, with the other registers below it.
9145
9146 - Save NARGS argument registers above the allocated area.
9147
9148 (NARGS is always zero if RESTORE_P.)
9149
9150 The SAVE and RESTORE instructions cannot save and restore all general
9151 registers, so there may be some registers left over for the caller to
9152 handle. Destructively modify *MASK_PTR so that it contains the registers
9153 that still need to be saved or restored. The caller can save these
9154 registers in the memory immediately below *OFFSET_PTR, which is a
9155 byte offset from the bottom of the allocated stack area. */
9156
9157 static rtx
9158 mips16e_build_save_restore (bool restore_p, unsigned int *mask_ptr,
9159 HOST_WIDE_INT *offset_ptr, unsigned int nargs,
9160 HOST_WIDE_INT size)
9161 {
9162 rtx pattern, set;
9163 HOST_WIDE_INT offset, top_offset;
9164 unsigned int i, regno;
9165 int n;
9166
9167 gcc_assert (cfun->machine->frame.num_fp == 0);
9168
9169 /* Calculate the number of elements in the PARALLEL. We need one element
9170 for the stack adjustment, one for each argument register save, and one
9171 for each additional register move. */
9172 n = 1 + nargs;
9173 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
9174 if (BITSET_P (*mask_ptr, mips16e_save_restore_regs[i]))
9175 n++;
9176
9177 /* Create the final PARALLEL. */
9178 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (n));
9179 n = 0;
9180
9181 /* Add the stack pointer adjustment. */
9182 set = gen_rtx_SET (VOIDmode, stack_pointer_rtx,
9183 plus_constant (Pmode, stack_pointer_rtx,
9184 restore_p ? size : -size));
9185 RTX_FRAME_RELATED_P (set) = 1;
9186 XVECEXP (pattern, 0, n++) = set;
9187
9188 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
9189 top_offset = restore_p ? size : 0;
9190
9191 /* Save the arguments. */
9192 for (i = 0; i < nargs; i++)
9193 {
9194 offset = top_offset + i * UNITS_PER_WORD;
9195 set = mips16e_save_restore_reg (restore_p, true, offset,
9196 GP_ARG_FIRST + i);
9197 XVECEXP (pattern, 0, n++) = set;
9198 }
9199
9200 /* Then fill in the other register moves. */
9201 offset = top_offset;
9202 for (i = 0; i < ARRAY_SIZE (mips16e_save_restore_regs); i++)
9203 {
9204 regno = mips16e_save_restore_regs[i];
9205 if (BITSET_P (*mask_ptr, regno))
9206 {
9207 offset -= UNITS_PER_WORD;
9208 set = mips16e_save_restore_reg (restore_p, false, offset, regno);
9209 XVECEXP (pattern, 0, n++) = set;
9210 *mask_ptr &= ~(1 << regno);
9211 }
9212 }
9213
9214 /* Tell the caller what offset it should use for the remaining registers. */
9215 *offset_ptr = size + (offset - top_offset);
9216
9217 gcc_assert (n == XVECLEN (pattern, 0));
9218
9219 return pattern;
9220 }
9221
9222 /* PATTERN is a PARALLEL whose first element adds ADJUST to the stack
9223 pointer. Return true if PATTERN matches the kind of instruction
9224 generated by mips16e_build_save_restore. If INFO is nonnull,
9225 initialize it when returning true. */
9226
9227 bool
9228 mips16e_save_restore_pattern_p (rtx pattern, HOST_WIDE_INT adjust,
9229 struct mips16e_save_restore_info *info)
9230 {
9231 unsigned int i, nargs, mask, extra;
9232 HOST_WIDE_INT top_offset, save_offset, offset;
9233 rtx set, reg, mem, base;
9234 int n;
9235
9236 if (!GENERATE_MIPS16E_SAVE_RESTORE)
9237 return false;
9238
9239 /* Stack offsets in the PARALLEL are relative to the old stack pointer. */
9240 top_offset = adjust > 0 ? adjust : 0;
9241
9242 /* Interpret all other members of the PARALLEL. */
9243 save_offset = top_offset - UNITS_PER_WORD;
9244 mask = 0;
9245 nargs = 0;
9246 i = 0;
9247 for (n = 1; n < XVECLEN (pattern, 0); n++)
9248 {
9249 /* Check that we have a SET. */
9250 set = XVECEXP (pattern, 0, n);
9251 if (GET_CODE (set) != SET)
9252 return false;
9253
9254 /* Check that the SET is a load (if restoring) or a store
9255 (if saving). */
9256 mem = adjust > 0 ? SET_SRC (set) : SET_DEST (set);
9257 if (!MEM_P (mem))
9258 return false;
9259
9260 /* Check that the address is the sum of the stack pointer and a
9261 possibly-zero constant offset. */
9262 mips_split_plus (XEXP (mem, 0), &base, &offset);
9263 if (base != stack_pointer_rtx)
9264 return false;
9265
9266 /* Check that SET's other operand is a register. */
9267 reg = adjust > 0 ? SET_DEST (set) : SET_SRC (set);
9268 if (!REG_P (reg))
9269 return false;
9270
9271 /* Check for argument saves. */
9272 if (offset == top_offset + nargs * UNITS_PER_WORD
9273 && REGNO (reg) == GP_ARG_FIRST + nargs)
9274 nargs++;
9275 else if (offset == save_offset)
9276 {
9277 while (mips16e_save_restore_regs[i++] != REGNO (reg))
9278 if (i == ARRAY_SIZE (mips16e_save_restore_regs))
9279 return false;
9280
9281 mask |= 1 << REGNO (reg);
9282 save_offset -= UNITS_PER_WORD;
9283 }
9284 else
9285 return false;
9286 }
9287
9288 /* Check that the restrictions on register ranges are met. */
9289 extra = 0;
9290 mips16e_mask_registers (&mask, mips16e_s2_s8_regs,
9291 ARRAY_SIZE (mips16e_s2_s8_regs), &extra);
9292 mips16e_mask_registers (&mask, mips16e_a0_a3_regs,
9293 ARRAY_SIZE (mips16e_a0_a3_regs), &extra);
9294 if (extra != 0)
9295 return false;
9296
9297 /* Make sure that the topmost argument register is not saved twice.
9298 The checks above ensure that the same is then true for the other
9299 argument registers. */
9300 if (nargs > 0 && BITSET_P (mask, GP_ARG_FIRST + nargs - 1))
9301 return false;
9302
9303 /* Pass back information, if requested. */
9304 if (info)
9305 {
9306 info->nargs = nargs;
9307 info->mask = mask;
9308 info->size = (adjust > 0 ? adjust : -adjust);
9309 }
9310
9311 return true;
9312 }
9313
9314 /* Add a MIPS16e SAVE or RESTORE register-range argument to string S
9315 for the register range [MIN_REG, MAX_REG]. Return a pointer to
9316 the null terminator. */
9317
9318 static char *
9319 mips16e_add_register_range (char *s, unsigned int min_reg,
9320 unsigned int max_reg)
9321 {
9322 if (min_reg != max_reg)
9323 s += sprintf (s, ",%s-%s", reg_names[min_reg], reg_names[max_reg]);
9324 else
9325 s += sprintf (s, ",%s", reg_names[min_reg]);
9326 return s;
9327 }
9328
9329 /* Return the assembly instruction for a MIPS16e SAVE or RESTORE instruction.
9330 PATTERN and ADJUST are as for mips16e_save_restore_pattern_p. */
9331
9332 const char *
9333 mips16e_output_save_restore (rtx pattern, HOST_WIDE_INT adjust)
9334 {
9335 static char buffer[300];
9336
9337 struct mips16e_save_restore_info info;
9338 unsigned int i, end;
9339 char *s;
9340
9341 /* Parse the pattern. */
9342 if (!mips16e_save_restore_pattern_p (pattern, adjust, &info))
9343 gcc_unreachable ();
9344
9345 /* Add the mnemonic. */
9346 s = strcpy (buffer, adjust > 0 ? "restore\t" : "save\t");
9347 s += strlen (s);
9348
9349 /* Save the arguments. */
9350 if (info.nargs > 1)
9351 s += sprintf (s, "%s-%s,", reg_names[GP_ARG_FIRST],
9352 reg_names[GP_ARG_FIRST + info.nargs - 1]);
9353 else if (info.nargs == 1)
9354 s += sprintf (s, "%s,", reg_names[GP_ARG_FIRST]);
9355
9356 /* Emit the amount of stack space to allocate or deallocate. */
9357 s += sprintf (s, "%d", (int) info.size);
9358
9359 /* Save or restore $16. */
9360 if (BITSET_P (info.mask, 16))
9361 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 16]);
9362
9363 /* Save or restore $17. */
9364 if (BITSET_P (info.mask, 17))
9365 s += sprintf (s, ",%s", reg_names[GP_REG_FIRST + 17]);
9366
9367 /* Save or restore registers in the range $s2...$s8, which
9368 mips16e_s2_s8_regs lists in decreasing order. Note that this
9369 is a software register range; the hardware registers are not
9370 numbered consecutively. */
9371 end = ARRAY_SIZE (mips16e_s2_s8_regs);
9372 i = mips16e_find_first_register (info.mask, mips16e_s2_s8_regs, end);
9373 if (i < end)
9374 s = mips16e_add_register_range (s, mips16e_s2_s8_regs[end - 1],
9375 mips16e_s2_s8_regs[i]);
9376
9377 /* Save or restore registers in the range $a0...$a3. */
9378 end = ARRAY_SIZE (mips16e_a0_a3_regs);
9379 i = mips16e_find_first_register (info.mask, mips16e_a0_a3_regs, end);
9380 if (i < end)
9381 s = mips16e_add_register_range (s, mips16e_a0_a3_regs[i],
9382 mips16e_a0_a3_regs[end - 1]);
9383
9384 /* Save or restore $31. */
9385 if (BITSET_P (info.mask, RETURN_ADDR_REGNUM))
9386 s += sprintf (s, ",%s", reg_names[RETURN_ADDR_REGNUM]);
9387
9388 return buffer;
9389 }
9390 \f
9391 /* Return true if the current function returns its value in a floating-point
9392 register in MIPS16 mode. */
9393
9394 static bool
9395 mips16_cfun_returns_in_fpr_p (void)
9396 {
9397 tree return_type = DECL_RESULT (current_function_decl);
9398 return (TARGET_MIPS16
9399 && TARGET_HARD_FLOAT_ABI
9400 && !aggregate_value_p (return_type, current_function_decl)
9401 && mips_return_mode_in_fpr_p (DECL_MODE (return_type)));
9402 }
9403
9404 /* Return true if predicate PRED is true for at least one instruction.
9405 Cache the result in *CACHE, and assume that the result is true
9406 if *CACHE is already true. */
9407
9408 static bool
9409 mips_find_gp_ref (bool *cache, bool (*pred) (rtx))
9410 {
9411 rtx insn;
9412
9413 if (!*cache)
9414 {
9415 push_topmost_sequence ();
9416 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
9417 if (USEFUL_INSN_P (insn) && pred (insn))
9418 {
9419 *cache = true;
9420 break;
9421 }
9422 pop_topmost_sequence ();
9423 }
9424 return *cache;
9425 }
9426
9427 /* Return true if INSN refers to the global pointer in an "inflexible" way.
9428 See mips_cfun_has_inflexible_gp_ref_p for details. */
9429
9430 static bool
9431 mips_insn_has_inflexible_gp_ref_p (rtx insn)
9432 {
9433 /* Uses of pic_offset_table_rtx in CALL_INSN_FUNCTION_USAGE
9434 indicate that the target could be a traditional MIPS
9435 lazily-binding stub. */
9436 return find_reg_fusage (insn, USE, pic_offset_table_rtx);
9437 }
9438
9439 /* Return true if the current function refers to the global pointer
9440 in a way that forces $28 to be valid. This means that we can't
9441 change the choice of global pointer, even for NewABI code.
9442
9443 One example of this (and one which needs several checks) is that
9444 $28 must be valid when calling traditional MIPS lazy-binding stubs.
9445 (This restriction does not apply to PLTs.) */
9446
9447 static bool
9448 mips_cfun_has_inflexible_gp_ref_p (void)
9449 {
9450 /* If the function has a nonlocal goto, $28 must hold the correct
9451 global pointer for the target function. That is, the target
9452 of the goto implicitly uses $28. */
9453 if (crtl->has_nonlocal_goto)
9454 return true;
9455
9456 if (TARGET_ABICALLS_PIC2)
9457 {
9458 /* Symbolic accesses implicitly use the global pointer unless
9459 -mexplicit-relocs is in effect. JAL macros to symbolic addresses
9460 might go to traditional MIPS lazy-binding stubs. */
9461 if (!TARGET_EXPLICIT_RELOCS)
9462 return true;
9463
9464 /* FUNCTION_PROFILER includes a JAL to _mcount, which again
9465 can be lazily-bound. */
9466 if (crtl->profile)
9467 return true;
9468
9469 /* MIPS16 functions that return in FPRs need to call an
9470 external libgcc routine. This call is only made explict
9471 during mips_expand_epilogue, and it too might be lazily bound. */
9472 if (mips16_cfun_returns_in_fpr_p ())
9473 return true;
9474 }
9475
9476 return mips_find_gp_ref (&cfun->machine->has_inflexible_gp_insn_p,
9477 mips_insn_has_inflexible_gp_ref_p);
9478 }
9479
9480 /* Return true if INSN refers to the global pointer in a "flexible" way.
9481 See mips_cfun_has_flexible_gp_ref_p for details. */
9482
9483 static bool
9484 mips_insn_has_flexible_gp_ref_p (rtx insn)
9485 {
9486 return (get_attr_got (insn) != GOT_UNSET
9487 || mips_small_data_pattern_p (PATTERN (insn))
9488 || reg_overlap_mentioned_p (pic_offset_table_rtx, PATTERN (insn)));
9489 }
9490
9491 /* Return true if the current function references the global pointer,
9492 but if those references do not inherently require the global pointer
9493 to be $28. Assume !mips_cfun_has_inflexible_gp_ref_p (). */
9494
9495 static bool
9496 mips_cfun_has_flexible_gp_ref_p (void)
9497 {
9498 /* Reload can sometimes introduce constant pool references
9499 into a function that otherwise didn't need them. For example,
9500 suppose we have an instruction like:
9501
9502 (set (reg:DF R1) (float:DF (reg:SI R2)))
9503
9504 If R2 turns out to be a constant such as 1, the instruction may
9505 have a REG_EQUAL note saying that R1 == 1.0. Reload then has
9506 the option of using this constant if R2 doesn't get allocated
9507 to a register.
9508
9509 In cases like these, reload will have added the constant to the
9510 pool but no instruction will yet refer to it. */
9511 if (TARGET_ABICALLS_PIC2 && !reload_completed && crtl->uses_const_pool)
9512 return true;
9513
9514 return mips_find_gp_ref (&cfun->machine->has_flexible_gp_insn_p,
9515 mips_insn_has_flexible_gp_ref_p);
9516 }
9517
9518 /* Return the register that should be used as the global pointer
9519 within this function. Return INVALID_REGNUM if the function
9520 doesn't need a global pointer. */
9521
9522 static unsigned int
9523 mips_global_pointer (void)
9524 {
9525 unsigned int regno;
9526
9527 /* $gp is always available unless we're using a GOT. */
9528 if (!TARGET_USE_GOT)
9529 return GLOBAL_POINTER_REGNUM;
9530
9531 /* If there are inflexible references to $gp, we must use the
9532 standard register. */
9533 if (mips_cfun_has_inflexible_gp_ref_p ())
9534 return GLOBAL_POINTER_REGNUM;
9535
9536 /* If there are no current references to $gp, then the only uses
9537 we can introduce later are those involved in long branches. */
9538 if (TARGET_ABSOLUTE_JUMPS && !mips_cfun_has_flexible_gp_ref_p ())
9539 return INVALID_REGNUM;
9540
9541 /* If the global pointer is call-saved, try to use a call-clobbered
9542 alternative. */
9543 if (TARGET_CALL_SAVED_GP && crtl->is_leaf)
9544 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
9545 if (!df_regs_ever_live_p (regno)
9546 && call_really_used_regs[regno]
9547 && !fixed_regs[regno]
9548 && regno != PIC_FUNCTION_ADDR_REGNUM)
9549 return regno;
9550
9551 return GLOBAL_POINTER_REGNUM;
9552 }
9553
9554 /* Return true if the current function's prologue must load the global
9555 pointer value into pic_offset_table_rtx and store the same value in
9556 the function's cprestore slot (if any).
9557
9558 One problem we have to deal with is that, when emitting GOT-based
9559 position independent code, long-branch sequences will need to load
9560 the address of the branch target from the GOT. We don't know until
9561 the very end of compilation whether (and where) the function needs
9562 long branches, so we must ensure that _any_ branch can access the
9563 global pointer in some form. However, we do not want to pessimize
9564 the usual case in which all branches are short.
9565
9566 We handle this as follows:
9567
9568 (1) During reload, we set cfun->machine->global_pointer to
9569 INVALID_REGNUM if we _know_ that the current function
9570 doesn't need a global pointer. This is only valid if
9571 long branches don't need the GOT.
9572
9573 Otherwise, we assume that we might need a global pointer
9574 and pick an appropriate register.
9575
9576 (2) If cfun->machine->global_pointer != INVALID_REGNUM,
9577 we ensure that the global pointer is available at every
9578 block boundary bar entry and exit. We do this in one of two ways:
9579
9580 - If the function has a cprestore slot, we ensure that this
9581 slot is valid at every branch. However, as explained in
9582 point (6) below, there is no guarantee that pic_offset_table_rtx
9583 itself is valid if new uses of the global pointer are introduced
9584 after the first post-epilogue split.
9585
9586 We guarantee that the cprestore slot is valid by loading it
9587 into a fake register, CPRESTORE_SLOT_REGNUM. We then make
9588 this register live at every block boundary bar function entry
9589 and exit. It is then invalid to move the load (and thus the
9590 preceding store) across a block boundary.
9591
9592 - If the function has no cprestore slot, we guarantee that
9593 pic_offset_table_rtx itself is valid at every branch.
9594
9595 See mips_eh_uses for the handling of the register liveness.
9596
9597 (3) During prologue and epilogue generation, we emit "ghost"
9598 placeholder instructions to manipulate the global pointer.
9599
9600 (4) During prologue generation, we set cfun->machine->must_initialize_gp_p
9601 and cfun->machine->must_restore_gp_when_clobbered_p if we already know
9602 that the function needs a global pointer. (There is no need to set
9603 them earlier than this, and doing it as late as possible leads to
9604 fewer false positives.)
9605
9606 (5) If cfun->machine->must_initialize_gp_p is true during a
9607 split_insns pass, we split the ghost instructions into real
9608 instructions. These split instructions can then be optimized in
9609 the usual way. Otherwise, we keep the ghost instructions intact,
9610 and optimize for the case where they aren't needed. We still
9611 have the option of splitting them later, if we need to introduce
9612 new uses of the global pointer.
9613
9614 For example, the scheduler ignores a ghost instruction that
9615 stores $28 to the stack, but it handles the split form of
9616 the ghost instruction as an ordinary store.
9617
9618 (6) [OldABI only.] If cfun->machine->must_restore_gp_when_clobbered_p
9619 is true during the first post-epilogue split_insns pass, we split
9620 calls and restore_gp patterns into instructions that explicitly
9621 load pic_offset_table_rtx from the cprestore slot. Otherwise,
9622 we split these patterns into instructions that _don't_ load from
9623 the cprestore slot.
9624
9625 If cfun->machine->must_restore_gp_when_clobbered_p is true at the
9626 time of the split, then any instructions that exist at that time
9627 can make free use of pic_offset_table_rtx. However, if we want
9628 to introduce new uses of the global pointer after the split,
9629 we must explicitly load the value from the cprestore slot, since
9630 pic_offset_table_rtx itself might not be valid at a given point
9631 in the function.
9632
9633 The idea is that we want to be able to delete redundant
9634 loads from the cprestore slot in the usual case where no
9635 long branches are needed.
9636
9637 (7) If cfun->machine->must_initialize_gp_p is still false at the end
9638 of md_reorg, we decide whether the global pointer is needed for
9639 long branches. If so, we set cfun->machine->must_initialize_gp_p
9640 to true and split the ghost instructions into real instructions
9641 at that stage.
9642
9643 Note that the ghost instructions must have a zero length for three reasons:
9644
9645 - Giving the length of the underlying $gp sequence might cause
9646 us to use long branches in cases where they aren't really needed.
9647
9648 - They would perturb things like alignment calculations.
9649
9650 - More importantly, the hazard detection in md_reorg relies on
9651 empty instructions having a zero length.
9652
9653 If we find a long branch and split the ghost instructions at the
9654 end of md_reorg, the split could introduce more long branches.
9655 That isn't a problem though, because we still do the split before
9656 the final shorten_branches pass.
9657
9658 This is extremely ugly, but it seems like the best compromise between
9659 correctness and efficiency. */
9660
9661 bool
9662 mips_must_initialize_gp_p (void)
9663 {
9664 return cfun->machine->must_initialize_gp_p;
9665 }
9666
9667 /* Return true if REGNO is a register that is ordinarily call-clobbered
9668 but must nevertheless be preserved by an interrupt handler. */
9669
9670 static bool
9671 mips_interrupt_extra_call_saved_reg_p (unsigned int regno)
9672 {
9673 if (MD_REG_P (regno))
9674 return true;
9675
9676 if (TARGET_DSP && DSP_ACC_REG_P (regno))
9677 return true;
9678
9679 if (GP_REG_P (regno) && !cfun->machine->use_shadow_register_set_p)
9680 {
9681 /* $0 is hard-wired. */
9682 if (regno == GP_REG_FIRST)
9683 return false;
9684
9685 /* The interrupt handler can treat kernel registers as
9686 scratch registers. */
9687 if (KERNEL_REG_P (regno))
9688 return false;
9689
9690 /* The function will return the stack pointer to its original value
9691 anyway. */
9692 if (regno == STACK_POINTER_REGNUM)
9693 return false;
9694
9695 /* Otherwise, return true for registers that aren't ordinarily
9696 call-clobbered. */
9697 return call_really_used_regs[regno];
9698 }
9699
9700 return false;
9701 }
9702
9703 /* Return true if the current function should treat register REGNO
9704 as call-saved. */
9705
9706 static bool
9707 mips_cfun_call_saved_reg_p (unsigned int regno)
9708 {
9709 /* If the user makes an ordinarily-call-saved register global,
9710 that register is no longer call-saved. */
9711 if (global_regs[regno])
9712 return false;
9713
9714 /* Interrupt handlers need to save extra registers. */
9715 if (cfun->machine->interrupt_handler_p
9716 && mips_interrupt_extra_call_saved_reg_p (regno))
9717 return true;
9718
9719 /* call_insns preserve $28 unless they explicitly say otherwise,
9720 so call_really_used_regs[] treats $28 as call-saved. However,
9721 we want the ABI property rather than the default call_insn
9722 property here. */
9723 return (regno == GLOBAL_POINTER_REGNUM
9724 ? TARGET_CALL_SAVED_GP
9725 : !call_really_used_regs[regno]);
9726 }
9727
9728 /* Return true if the function body might clobber register REGNO.
9729 We know that REGNO is call-saved. */
9730
9731 static bool
9732 mips_cfun_might_clobber_call_saved_reg_p (unsigned int regno)
9733 {
9734 /* Some functions should be treated as clobbering all call-saved
9735 registers. */
9736 if (crtl->saves_all_registers)
9737 return true;
9738
9739 /* DF handles cases where a register is explicitly referenced in
9740 the rtl. Incoming values are passed in call-clobbered registers,
9741 so we can assume that any live call-saved register is set within
9742 the function. */
9743 if (df_regs_ever_live_p (regno))
9744 return true;
9745
9746 /* Check for registers that are clobbered by FUNCTION_PROFILER.
9747 These clobbers are not explicit in the rtl. */
9748 if (crtl->profile && MIPS_SAVE_REG_FOR_PROFILING_P (regno))
9749 return true;
9750
9751 /* If we're using a call-saved global pointer, the function's
9752 prologue will need to set it up. */
9753 if (cfun->machine->global_pointer == regno)
9754 return true;
9755
9756 /* The function's prologue will need to set the frame pointer if
9757 frame_pointer_needed. */
9758 if (regno == HARD_FRAME_POINTER_REGNUM && frame_pointer_needed)
9759 return true;
9760
9761 /* If a MIPS16 function returns a value in FPRs, its epilogue
9762 will need to call an external libgcc routine. This yet-to-be
9763 generated call_insn will clobber $31. */
9764 if (regno == RETURN_ADDR_REGNUM && mips16_cfun_returns_in_fpr_p ())
9765 return true;
9766
9767 /* If REGNO is ordinarily call-clobbered, we must assume that any
9768 called function could modify it. */
9769 if (cfun->machine->interrupt_handler_p
9770 && !crtl->is_leaf
9771 && mips_interrupt_extra_call_saved_reg_p (regno))
9772 return true;
9773
9774 return false;
9775 }
9776
9777 /* Return true if the current function must save register REGNO. */
9778
9779 static bool
9780 mips_save_reg_p (unsigned int regno)
9781 {
9782 if (mips_cfun_call_saved_reg_p (regno))
9783 {
9784 if (mips_cfun_might_clobber_call_saved_reg_p (regno))
9785 return true;
9786
9787 /* Save both registers in an FPR pair if either one is used. This is
9788 needed for the case when MIN_FPRS_PER_FMT == 1, which allows the odd
9789 register to be used without the even register. */
9790 if (FP_REG_P (regno)
9791 && MAX_FPRS_PER_FMT == 2
9792 && mips_cfun_might_clobber_call_saved_reg_p (regno + 1))
9793 return true;
9794 }
9795
9796 /* We need to save the incoming return address if __builtin_eh_return
9797 is being used to set a different return address. */
9798 if (regno == RETURN_ADDR_REGNUM && crtl->calls_eh_return)
9799 return true;
9800
9801 return false;
9802 }
9803
9804 /* Populate the current function's mips_frame_info structure.
9805
9806 MIPS stack frames look like:
9807
9808 +-------------------------------+
9809 | |
9810 | incoming stack arguments |
9811 | |
9812 +-------------------------------+
9813 | |
9814 | caller-allocated save area |
9815 A | for register arguments |
9816 | |
9817 +-------------------------------+ <-- incoming stack pointer
9818 | |
9819 | callee-allocated save area |
9820 B | for arguments that are |
9821 | split between registers and |
9822 | the stack |
9823 | |
9824 +-------------------------------+ <-- arg_pointer_rtx
9825 | |
9826 C | callee-allocated save area |
9827 | for register varargs |
9828 | |
9829 +-------------------------------+ <-- frame_pointer_rtx
9830 | | + cop0_sp_offset
9831 | COP0 reg save area | + UNITS_PER_WORD
9832 | |
9833 +-------------------------------+ <-- frame_pointer_rtx + acc_sp_offset
9834 | | + UNITS_PER_WORD
9835 | accumulator save area |
9836 | |
9837 +-------------------------------+ <-- stack_pointer_rtx + fp_sp_offset
9838 | | + UNITS_PER_HWFPVALUE
9839 | FPR save area |
9840 | |
9841 +-------------------------------+ <-- stack_pointer_rtx + gp_sp_offset
9842 | | + UNITS_PER_WORD
9843 | GPR save area |
9844 | |
9845 +-------------------------------+ <-- frame_pointer_rtx with
9846 | | \ -fstack-protector
9847 | local variables | | var_size
9848 | | /
9849 +-------------------------------+
9850 | | \
9851 | $gp save area | | cprestore_size
9852 | | /
9853 P +-------------------------------+ <-- hard_frame_pointer_rtx for
9854 | | \ MIPS16 code
9855 | outgoing stack arguments | |
9856 | | |
9857 +-------------------------------+ | args_size
9858 | | |
9859 | caller-allocated save area | |
9860 | for register arguments | |
9861 | | /
9862 +-------------------------------+ <-- stack_pointer_rtx
9863 frame_pointer_rtx without
9864 -fstack-protector
9865 hard_frame_pointer_rtx for
9866 non-MIPS16 code.
9867
9868 At least two of A, B and C will be empty.
9869
9870 Dynamic stack allocations such as alloca insert data at point P.
9871 They decrease stack_pointer_rtx but leave frame_pointer_rtx and
9872 hard_frame_pointer_rtx unchanged. */
9873
9874 static void
9875 mips_compute_frame_info (void)
9876 {
9877 struct mips_frame_info *frame;
9878 HOST_WIDE_INT offset, size;
9879 unsigned int regno, i;
9880
9881 /* Set this function's interrupt properties. */
9882 if (mips_interrupt_type_p (TREE_TYPE (current_function_decl)))
9883 {
9884 if (!ISA_MIPS32R2)
9885 error ("the %<interrupt%> attribute requires a MIPS32r2 processor");
9886 else if (TARGET_HARD_FLOAT)
9887 error ("the %<interrupt%> attribute requires %<-msoft-float%>");
9888 else if (TARGET_MIPS16)
9889 error ("interrupt handlers cannot be MIPS16 functions");
9890 else
9891 {
9892 cfun->machine->interrupt_handler_p = true;
9893 cfun->machine->use_shadow_register_set_p =
9894 mips_use_shadow_register_set_p (TREE_TYPE (current_function_decl));
9895 cfun->machine->keep_interrupts_masked_p =
9896 mips_keep_interrupts_masked_p (TREE_TYPE (current_function_decl));
9897 cfun->machine->use_debug_exception_return_p =
9898 mips_use_debug_exception_return_p (TREE_TYPE
9899 (current_function_decl));
9900 }
9901 }
9902
9903 frame = &cfun->machine->frame;
9904 memset (frame, 0, sizeof (*frame));
9905 size = get_frame_size ();
9906
9907 cfun->machine->global_pointer = mips_global_pointer ();
9908
9909 /* The first two blocks contain the outgoing argument area and the $gp save
9910 slot. This area isn't needed in leaf functions, but if the
9911 target-independent frame size is nonzero, we have already committed to
9912 allocating these in STARTING_FRAME_OFFSET for !FRAME_GROWS_DOWNWARD. */
9913 if ((size == 0 || FRAME_GROWS_DOWNWARD) && crtl->is_leaf)
9914 {
9915 /* The MIPS 3.0 linker does not like functions that dynamically
9916 allocate the stack and have 0 for STACK_DYNAMIC_OFFSET, since it
9917 looks like we are trying to create a second frame pointer to the
9918 function, so allocate some stack space to make it happy. */
9919 if (cfun->calls_alloca)
9920 frame->args_size = REG_PARM_STACK_SPACE (cfun->decl);
9921 else
9922 frame->args_size = 0;
9923 frame->cprestore_size = 0;
9924 }
9925 else
9926 {
9927 frame->args_size = crtl->outgoing_args_size;
9928 frame->cprestore_size = MIPS_GP_SAVE_AREA_SIZE;
9929 }
9930 offset = frame->args_size + frame->cprestore_size;
9931
9932 /* Move above the local variables. */
9933 frame->var_size = MIPS_STACK_ALIGN (size);
9934 offset += frame->var_size;
9935
9936 /* Find out which GPRs we need to save. */
9937 for (regno = GP_REG_FIRST; regno <= GP_REG_LAST; regno++)
9938 if (mips_save_reg_p (regno))
9939 {
9940 frame->num_gp++;
9941 frame->mask |= 1 << (regno - GP_REG_FIRST);
9942 }
9943
9944 /* If this function calls eh_return, we must also save and restore the
9945 EH data registers. */
9946 if (crtl->calls_eh_return)
9947 for (i = 0; EH_RETURN_DATA_REGNO (i) != INVALID_REGNUM; i++)
9948 {
9949 frame->num_gp++;
9950 frame->mask |= 1 << (EH_RETURN_DATA_REGNO (i) - GP_REG_FIRST);
9951 }
9952
9953 /* The MIPS16e SAVE and RESTORE instructions have two ranges of registers:
9954 $a3-$a0 and $s2-$s8. If we save one register in the range, we must
9955 save all later registers too. */
9956 if (GENERATE_MIPS16E_SAVE_RESTORE)
9957 {
9958 mips16e_mask_registers (&frame->mask, mips16e_s2_s8_regs,
9959 ARRAY_SIZE (mips16e_s2_s8_regs), &frame->num_gp);
9960 mips16e_mask_registers (&frame->mask, mips16e_a0_a3_regs,
9961 ARRAY_SIZE (mips16e_a0_a3_regs), &frame->num_gp);
9962 }
9963
9964 /* Move above the GPR save area. */
9965 if (frame->num_gp > 0)
9966 {
9967 offset += MIPS_STACK_ALIGN (frame->num_gp * UNITS_PER_WORD);
9968 frame->gp_sp_offset = offset - UNITS_PER_WORD;
9969 }
9970
9971 /* Find out which FPRs we need to save. This loop must iterate over
9972 the same space as its companion in mips_for_each_saved_gpr_and_fpr. */
9973 if (TARGET_HARD_FLOAT)
9974 for (regno = FP_REG_FIRST; regno <= FP_REG_LAST; regno += MAX_FPRS_PER_FMT)
9975 if (mips_save_reg_p (regno))
9976 {
9977 frame->num_fp += MAX_FPRS_PER_FMT;
9978 frame->fmask |= ~(~0 << MAX_FPRS_PER_FMT) << (regno - FP_REG_FIRST);
9979 }
9980
9981 /* Move above the FPR save area. */
9982 if (frame->num_fp > 0)
9983 {
9984 offset += MIPS_STACK_ALIGN (frame->num_fp * UNITS_PER_FPREG);
9985 frame->fp_sp_offset = offset - UNITS_PER_HWFPVALUE;
9986 }
9987
9988 /* Add in space for the interrupt context information. */
9989 if (cfun->machine->interrupt_handler_p)
9990 {
9991 /* Check HI/LO. */
9992 if (mips_save_reg_p (LO_REGNUM) || mips_save_reg_p (HI_REGNUM))
9993 {
9994 frame->num_acc++;
9995 frame->acc_mask |= (1 << 0);
9996 }
9997
9998 /* Check accumulators 1, 2, 3. */
9999 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
10000 if (mips_save_reg_p (i) || mips_save_reg_p (i + 1))
10001 {
10002 frame->num_acc++;
10003 frame->acc_mask |= 1 << (((i - DSP_ACC_REG_FIRST) / 2) + 1);
10004 }
10005
10006 /* All interrupt context functions need space to preserve STATUS. */
10007 frame->num_cop0_regs++;
10008
10009 /* If we don't keep interrupts masked, we need to save EPC. */
10010 if (!cfun->machine->keep_interrupts_masked_p)
10011 frame->num_cop0_regs++;
10012 }
10013
10014 /* Move above the accumulator save area. */
10015 if (frame->num_acc > 0)
10016 {
10017 /* Each accumulator needs 2 words. */
10018 offset += frame->num_acc * 2 * UNITS_PER_WORD;
10019 frame->acc_sp_offset = offset - UNITS_PER_WORD;
10020 }
10021
10022 /* Move above the COP0 register save area. */
10023 if (frame->num_cop0_regs > 0)
10024 {
10025 offset += frame->num_cop0_regs * UNITS_PER_WORD;
10026 frame->cop0_sp_offset = offset - UNITS_PER_WORD;
10027 }
10028
10029 /* Move above the callee-allocated varargs save area. */
10030 offset += MIPS_STACK_ALIGN (cfun->machine->varargs_size);
10031 frame->arg_pointer_offset = offset;
10032
10033 /* Move above the callee-allocated area for pretend stack arguments. */
10034 offset += crtl->args.pretend_args_size;
10035 frame->total_size = offset;
10036
10037 /* Work out the offsets of the save areas from the top of the frame. */
10038 if (frame->gp_sp_offset > 0)
10039 frame->gp_save_offset = frame->gp_sp_offset - offset;
10040 if (frame->fp_sp_offset > 0)
10041 frame->fp_save_offset = frame->fp_sp_offset - offset;
10042 if (frame->acc_sp_offset > 0)
10043 frame->acc_save_offset = frame->acc_sp_offset - offset;
10044 if (frame->num_cop0_regs > 0)
10045 frame->cop0_save_offset = frame->cop0_sp_offset - offset;
10046
10047 /* MIPS16 code offsets the frame pointer by the size of the outgoing
10048 arguments. This tends to increase the chances of using unextended
10049 instructions for local variables and incoming arguments. */
10050 if (TARGET_MIPS16)
10051 frame->hard_frame_pointer_offset = frame->args_size;
10052 }
10053
10054 /* Return the style of GP load sequence that is being used for the
10055 current function. */
10056
10057 enum mips_loadgp_style
10058 mips_current_loadgp_style (void)
10059 {
10060 if (!TARGET_USE_GOT || cfun->machine->global_pointer == INVALID_REGNUM)
10061 return LOADGP_NONE;
10062
10063 if (TARGET_RTP_PIC)
10064 return LOADGP_RTP;
10065
10066 if (TARGET_ABSOLUTE_ABICALLS)
10067 return LOADGP_ABSOLUTE;
10068
10069 return TARGET_NEWABI ? LOADGP_NEWABI : LOADGP_OLDABI;
10070 }
10071
10072 /* Implement TARGET_FRAME_POINTER_REQUIRED. */
10073
10074 static bool
10075 mips_frame_pointer_required (void)
10076 {
10077 /* If the function contains dynamic stack allocations, we need to
10078 use the frame pointer to access the static parts of the frame. */
10079 if (cfun->calls_alloca)
10080 return true;
10081
10082 /* In MIPS16 mode, we need a frame pointer for a large frame; otherwise,
10083 reload may be unable to compute the address of a local variable,
10084 since there is no way to add a large constant to the stack pointer
10085 without using a second temporary register. */
10086 if (TARGET_MIPS16)
10087 {
10088 mips_compute_frame_info ();
10089 if (!SMALL_OPERAND (cfun->machine->frame.total_size))
10090 return true;
10091 }
10092
10093 return false;
10094 }
10095
10096 /* Make sure that we're not trying to eliminate to the wrong hard frame
10097 pointer. */
10098
10099 static bool
10100 mips_can_eliminate (const int from ATTRIBUTE_UNUSED, const int to)
10101 {
10102 return (to == HARD_FRAME_POINTER_REGNUM || to == STACK_POINTER_REGNUM);
10103 }
10104
10105 /* Implement INITIAL_ELIMINATION_OFFSET. FROM is either the frame pointer
10106 or argument pointer. TO is either the stack pointer or hard frame
10107 pointer. */
10108
10109 HOST_WIDE_INT
10110 mips_initial_elimination_offset (int from, int to)
10111 {
10112 HOST_WIDE_INT offset;
10113
10114 mips_compute_frame_info ();
10115
10116 /* Set OFFSET to the offset from the end-of-prologue stack pointer. */
10117 switch (from)
10118 {
10119 case FRAME_POINTER_REGNUM:
10120 if (FRAME_GROWS_DOWNWARD)
10121 offset = (cfun->machine->frame.args_size
10122 + cfun->machine->frame.cprestore_size
10123 + cfun->machine->frame.var_size);
10124 else
10125 offset = 0;
10126 break;
10127
10128 case ARG_POINTER_REGNUM:
10129 offset = cfun->machine->frame.arg_pointer_offset;
10130 break;
10131
10132 default:
10133 gcc_unreachable ();
10134 }
10135
10136 if (to == HARD_FRAME_POINTER_REGNUM)
10137 offset -= cfun->machine->frame.hard_frame_pointer_offset;
10138
10139 return offset;
10140 }
10141 \f
10142 /* Implement TARGET_EXTRA_LIVE_ON_ENTRY. */
10143
10144 static void
10145 mips_extra_live_on_entry (bitmap regs)
10146 {
10147 if (TARGET_USE_GOT)
10148 {
10149 /* PIC_FUNCTION_ADDR_REGNUM is live if we need it to set up
10150 the global pointer. */
10151 if (!TARGET_ABSOLUTE_ABICALLS)
10152 bitmap_set_bit (regs, PIC_FUNCTION_ADDR_REGNUM);
10153
10154 /* The prologue may set MIPS16_PIC_TEMP_REGNUM to the value of
10155 the global pointer. */
10156 if (TARGET_MIPS16)
10157 bitmap_set_bit (regs, MIPS16_PIC_TEMP_REGNUM);
10158
10159 /* See the comment above load_call<mode> for details. */
10160 bitmap_set_bit (regs, GOT_VERSION_REGNUM);
10161 }
10162 }
10163
10164 /* Implement RETURN_ADDR_RTX. We do not support moving back to a
10165 previous frame. */
10166
10167 rtx
10168 mips_return_addr (int count, rtx frame ATTRIBUTE_UNUSED)
10169 {
10170 if (count != 0)
10171 return const0_rtx;
10172
10173 return get_hard_reg_initial_val (Pmode, RETURN_ADDR_REGNUM);
10174 }
10175
10176 /* Emit code to change the current function's return address to
10177 ADDRESS. SCRATCH is available as a scratch register, if needed.
10178 ADDRESS and SCRATCH are both word-mode GPRs. */
10179
10180 void
10181 mips_set_return_address (rtx address, rtx scratch)
10182 {
10183 rtx slot_address;
10184
10185 gcc_assert (BITSET_P (cfun->machine->frame.mask, RETURN_ADDR_REGNUM));
10186 slot_address = mips_add_offset (scratch, stack_pointer_rtx,
10187 cfun->machine->frame.gp_sp_offset);
10188 mips_emit_move (gen_frame_mem (GET_MODE (address), slot_address), address);
10189 }
10190
10191 /* Return true if the current function has a cprestore slot. */
10192
10193 bool
10194 mips_cfun_has_cprestore_slot_p (void)
10195 {
10196 return (cfun->machine->global_pointer != INVALID_REGNUM
10197 && cfun->machine->frame.cprestore_size > 0);
10198 }
10199
10200 /* Fill *BASE and *OFFSET such that *BASE + *OFFSET refers to the
10201 cprestore slot. LOAD_P is true if the caller wants to load from
10202 the cprestore slot; it is false if the caller wants to store to
10203 the slot. */
10204
10205 static void
10206 mips_get_cprestore_base_and_offset (rtx *base, HOST_WIDE_INT *offset,
10207 bool load_p)
10208 {
10209 const struct mips_frame_info *frame;
10210
10211 frame = &cfun->machine->frame;
10212 /* .cprestore always uses the stack pointer instead of the frame pointer.
10213 We have a free choice for direct stores for non-MIPS16 functions,
10214 and for MIPS16 functions whose cprestore slot is in range of the
10215 stack pointer. Using the stack pointer would sometimes give more
10216 (early) scheduling freedom, but using the frame pointer would
10217 sometimes give more (late) scheduling freedom. It's hard to
10218 predict which applies to a given function, so let's keep things
10219 simple.
10220
10221 Loads must always use the frame pointer in functions that call
10222 alloca, and there's little benefit to using the stack pointer
10223 otherwise. */
10224 if (frame_pointer_needed && !(TARGET_CPRESTORE_DIRECTIVE && !load_p))
10225 {
10226 *base = hard_frame_pointer_rtx;
10227 *offset = frame->args_size - frame->hard_frame_pointer_offset;
10228 }
10229 else
10230 {
10231 *base = stack_pointer_rtx;
10232 *offset = frame->args_size;
10233 }
10234 }
10235
10236 /* Return true if X is the load or store address of the cprestore slot;
10237 LOAD_P says which. */
10238
10239 bool
10240 mips_cprestore_address_p (rtx x, bool load_p)
10241 {
10242 rtx given_base, required_base;
10243 HOST_WIDE_INT given_offset, required_offset;
10244
10245 mips_split_plus (x, &given_base, &given_offset);
10246 mips_get_cprestore_base_and_offset (&required_base, &required_offset, load_p);
10247 return given_base == required_base && given_offset == required_offset;
10248 }
10249
10250 /* Return a MEM rtx for the cprestore slot. LOAD_P is true if we are
10251 going to load from it, false if we are going to store to it.
10252 Use TEMP as a temporary register if need be. */
10253
10254 static rtx
10255 mips_cprestore_slot (rtx temp, bool load_p)
10256 {
10257 rtx base;
10258 HOST_WIDE_INT offset;
10259
10260 mips_get_cprestore_base_and_offset (&base, &offset, load_p);
10261 return gen_frame_mem (Pmode, mips_add_offset (temp, base, offset));
10262 }
10263
10264 /* Emit instructions to save global pointer value GP into cprestore
10265 slot MEM. OFFSET is the offset that MEM applies to the base register.
10266
10267 MEM may not be a legitimate address. If it isn't, TEMP is a
10268 temporary register that can be used, otherwise it is a SCRATCH. */
10269
10270 void
10271 mips_save_gp_to_cprestore_slot (rtx mem, rtx offset, rtx gp, rtx temp)
10272 {
10273 if (TARGET_CPRESTORE_DIRECTIVE)
10274 {
10275 gcc_assert (gp == pic_offset_table_rtx);
10276 emit_insn (PMODE_INSN (gen_cprestore, (mem, offset)));
10277 }
10278 else
10279 mips_emit_move (mips_cprestore_slot (temp, false), gp);
10280 }
10281
10282 /* Restore $gp from its save slot, using TEMP as a temporary base register
10283 if need be. This function is for o32 and o64 abicalls only.
10284
10285 See mips_must_initialize_gp_p for details about how we manage the
10286 global pointer. */
10287
10288 void
10289 mips_restore_gp_from_cprestore_slot (rtx temp)
10290 {
10291 gcc_assert (TARGET_ABICALLS && TARGET_OLDABI && epilogue_completed);
10292
10293 if (!cfun->machine->must_restore_gp_when_clobbered_p)
10294 {
10295 emit_note (NOTE_INSN_DELETED);
10296 return;
10297 }
10298
10299 if (TARGET_MIPS16)
10300 {
10301 mips_emit_move (temp, mips_cprestore_slot (temp, true));
10302 mips_emit_move (pic_offset_table_rtx, temp);
10303 }
10304 else
10305 mips_emit_move (pic_offset_table_rtx, mips_cprestore_slot (temp, true));
10306 if (!TARGET_EXPLICIT_RELOCS)
10307 emit_insn (gen_blockage ());
10308 }
10309 \f
10310 /* A function to save or store a register. The first argument is the
10311 register and the second is the stack slot. */
10312 typedef void (*mips_save_restore_fn) (rtx, rtx);
10313
10314 /* Use FN to save or restore register REGNO. MODE is the register's
10315 mode and OFFSET is the offset of its save slot from the current
10316 stack pointer. */
10317
10318 static void
10319 mips_save_restore_reg (enum machine_mode mode, int regno,
10320 HOST_WIDE_INT offset, mips_save_restore_fn fn)
10321 {
10322 rtx mem;
10323
10324 mem = gen_frame_mem (mode, plus_constant (Pmode, stack_pointer_rtx,
10325 offset));
10326 fn (gen_rtx_REG (mode, regno), mem);
10327 }
10328
10329 /* Call FN for each accumlator that is saved by the current function.
10330 SP_OFFSET is the offset of the current stack pointer from the start
10331 of the frame. */
10332
10333 static void
10334 mips_for_each_saved_acc (HOST_WIDE_INT sp_offset, mips_save_restore_fn fn)
10335 {
10336 HOST_WIDE_INT offset;
10337 int regno;
10338
10339 offset = cfun->machine->frame.acc_sp_offset - sp_offset;
10340 if (BITSET_P (cfun->machine->frame.acc_mask, 0))
10341 {
10342 mips_save_restore_reg (word_mode, LO_REGNUM, offset, fn);
10343 offset -= UNITS_PER_WORD;
10344 mips_save_restore_reg (word_mode, HI_REGNUM, offset, fn);
10345 offset -= UNITS_PER_WORD;
10346 }
10347
10348 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno++)
10349 if (BITSET_P (cfun->machine->frame.acc_mask,
10350 ((regno - DSP_ACC_REG_FIRST) / 2) + 1))
10351 {
10352 mips_save_restore_reg (word_mode, regno, offset, fn);
10353 offset -= UNITS_PER_WORD;
10354 }
10355 }
10356
10357 /* Save register REG to MEM. Make the instruction frame-related. */
10358
10359 static void
10360 mips_save_reg (rtx reg, rtx mem)
10361 {
10362 if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64)
10363 {
10364 rtx x1, x2;
10365
10366 mips_emit_move_or_split (mem, reg, SPLIT_IF_NECESSARY);
10367
10368 x1 = mips_frame_set (mips_subword (mem, false),
10369 mips_subword (reg, false));
10370 x2 = mips_frame_set (mips_subword (mem, true),
10371 mips_subword (reg, true));
10372 mips_set_frame_expr (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, x1, x2)));
10373 }
10374 else
10375 mips_emit_save_slot_move (mem, reg, MIPS_PROLOGUE_TEMP (GET_MODE (reg)));
10376 }
10377
10378 /* Capture the register combinations that are allowed in a SWM or LWM
10379 instruction. The entries are ordered by number of registers set in
10380 the mask. We also ignore the single register encodings because a
10381 normal SW/LW is preferred. */
10382
10383 static const unsigned int umips_swm_mask[17] = {
10384 0xc0ff0000, 0x80ff0000, 0x40ff0000, 0x807f0000,
10385 0x00ff0000, 0x803f0000, 0x007f0000, 0x801f0000,
10386 0x003f0000, 0x800f0000, 0x001f0000, 0x80070000,
10387 0x000f0000, 0x80030000, 0x00070000, 0x80010000,
10388 0x00030000
10389 };
10390
10391 static const unsigned int umips_swm_encoding[17] = {
10392 25, 24, 9, 23, 8, 22, 7, 21, 6, 20, 5, 19, 4, 18, 3, 17, 2
10393 };
10394
10395 /* Try to use a microMIPS LWM or SWM instruction to save or restore
10396 as many GPRs in *MASK as possible. *OFFSET is the offset from the
10397 stack pointer of the topmost save slot.
10398
10399 Remove from *MASK all registers that were handled using LWM and SWM.
10400 Update *OFFSET so that it points to the first unused save slot. */
10401
10402 static bool
10403 umips_build_save_restore (mips_save_restore_fn fn,
10404 unsigned *mask, HOST_WIDE_INT *offset)
10405 {
10406 int nregs;
10407 unsigned int i, j;
10408 rtx pattern, set, reg, mem;
10409 HOST_WIDE_INT this_offset;
10410 rtx this_base;
10411
10412 /* Try matching $16 to $31 (s0 to ra). */
10413 for (i = 0; i < ARRAY_SIZE (umips_swm_mask); i++)
10414 if ((*mask & 0xffff0000) == umips_swm_mask[i])
10415 break;
10416
10417 if (i == ARRAY_SIZE (umips_swm_mask))
10418 return false;
10419
10420 /* Get the offset of the lowest save slot. */
10421 nregs = (umips_swm_encoding[i] & 0xf) + (umips_swm_encoding[i] >> 4);
10422 this_offset = *offset - UNITS_PER_WORD * (nregs - 1);
10423
10424 /* LWM/SWM can only support offsets from -2048 to 2047. */
10425 if (!UMIPS_12BIT_OFFSET_P (this_offset))
10426 return false;
10427
10428 /* Create the final PARALLEL. */
10429 pattern = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (nregs));
10430 this_base = stack_pointer_rtx;
10431
10432 /* For registers $16-$23 and $30. */
10433 for (j = 0; j < (umips_swm_encoding[i] & 0xf); j++)
10434 {
10435 HOST_WIDE_INT offset = this_offset + j * UNITS_PER_WORD;
10436 mem = gen_frame_mem (SImode, plus_constant (Pmode, this_base, offset));
10437 unsigned int regno = (j != 8) ? 16 + j : 30;
10438 *mask &= ~(1 << regno);
10439 reg = gen_rtx_REG (SImode, regno);
10440 if (fn == mips_save_reg)
10441 set = mips_frame_set (mem, reg);
10442 else
10443 {
10444 set = gen_rtx_SET (VOIDmode, reg, mem);
10445 mips_add_cfa_restore (reg);
10446 }
10447 XVECEXP (pattern, 0, j) = set;
10448 }
10449
10450 /* For register $31. */
10451 if (umips_swm_encoding[i] >> 4)
10452 {
10453 HOST_WIDE_INT offset = this_offset + j * UNITS_PER_WORD;
10454 *mask &= ~(1 << 31);
10455 mem = gen_frame_mem (SImode, plus_constant (Pmode, this_base, offset));
10456 reg = gen_rtx_REG (SImode, 31);
10457 if (fn == mips_save_reg)
10458 set = mips_frame_set (mem, reg);
10459 else
10460 {
10461 set = gen_rtx_SET (VOIDmode, reg, mem);
10462 mips_add_cfa_restore (reg);
10463 }
10464 XVECEXP (pattern, 0, j) = set;
10465 }
10466
10467 pattern = emit_insn (pattern);
10468 if (fn == mips_save_reg)
10469 RTX_FRAME_RELATED_P (pattern) = 1;
10470
10471 /* Adjust the last offset. */
10472 *offset -= UNITS_PER_WORD * nregs;
10473
10474 return true;
10475 }
10476
10477 /* Call FN for each register that is saved by the current function.
10478 SP_OFFSET is the offset of the current stack pointer from the start
10479 of the frame. */
10480
10481 static void
10482 mips_for_each_saved_gpr_and_fpr (HOST_WIDE_INT sp_offset,
10483 mips_save_restore_fn fn)
10484 {
10485 enum machine_mode fpr_mode;
10486 int regno;
10487 const struct mips_frame_info *frame = &cfun->machine->frame;
10488 HOST_WIDE_INT offset;
10489 unsigned int mask;
10490
10491 /* Save registers starting from high to low. The debuggers prefer at least
10492 the return register be stored at func+4, and also it allows us not to
10493 need a nop in the epilogue if at least one register is reloaded in
10494 addition to return address. */
10495 offset = frame->gp_sp_offset - sp_offset;
10496 mask = frame->mask;
10497
10498 if (TARGET_MICROMIPS)
10499 umips_build_save_restore (fn, &mask, &offset);
10500
10501 for (regno = GP_REG_LAST; regno >= GP_REG_FIRST; regno--)
10502 if (BITSET_P (mask, regno - GP_REG_FIRST))
10503 {
10504 /* Record the ra offset for use by mips_function_profiler. */
10505 if (regno == RETURN_ADDR_REGNUM)
10506 cfun->machine->frame.ra_fp_offset = offset + sp_offset;
10507 mips_save_restore_reg (word_mode, regno, offset, fn);
10508 offset -= UNITS_PER_WORD;
10509 }
10510
10511 /* This loop must iterate over the same space as its companion in
10512 mips_compute_frame_info. */
10513 offset = cfun->machine->frame.fp_sp_offset - sp_offset;
10514 fpr_mode = (TARGET_SINGLE_FLOAT ? SFmode : DFmode);
10515 for (regno = FP_REG_LAST - MAX_FPRS_PER_FMT + 1;
10516 regno >= FP_REG_FIRST;
10517 regno -= MAX_FPRS_PER_FMT)
10518 if (BITSET_P (cfun->machine->frame.fmask, regno - FP_REG_FIRST))
10519 {
10520 mips_save_restore_reg (fpr_mode, regno, offset, fn);
10521 offset -= GET_MODE_SIZE (fpr_mode);
10522 }
10523 }
10524
10525 /* Return true if a move between register REGNO and its save slot (MEM)
10526 can be done in a single move. LOAD_P is true if we are loading
10527 from the slot, false if we are storing to it. */
10528
10529 static bool
10530 mips_direct_save_slot_move_p (unsigned int regno, rtx mem, bool load_p)
10531 {
10532 /* There is a specific MIPS16 instruction for saving $31 to the stack. */
10533 if (TARGET_MIPS16 && !load_p && regno == RETURN_ADDR_REGNUM)
10534 return false;
10535
10536 return mips_secondary_reload_class (REGNO_REG_CLASS (regno),
10537 GET_MODE (mem), mem, load_p) == NO_REGS;
10538 }
10539
10540 /* Emit a move from SRC to DEST, given that one of them is a register
10541 save slot and that the other is a register. TEMP is a temporary
10542 GPR of the same mode that is available if need be. */
10543
10544 void
10545 mips_emit_save_slot_move (rtx dest, rtx src, rtx temp)
10546 {
10547 unsigned int regno;
10548 rtx mem;
10549
10550 if (REG_P (src))
10551 {
10552 regno = REGNO (src);
10553 mem = dest;
10554 }
10555 else
10556 {
10557 regno = REGNO (dest);
10558 mem = src;
10559 }
10560
10561 if (regno == cfun->machine->global_pointer && !mips_must_initialize_gp_p ())
10562 {
10563 /* We don't yet know whether we'll need this instruction or not.
10564 Postpone the decision by emitting a ghost move. This move
10565 is specifically not frame-related; only the split version is. */
10566 if (TARGET_64BIT)
10567 emit_insn (gen_move_gpdi (dest, src));
10568 else
10569 emit_insn (gen_move_gpsi (dest, src));
10570 return;
10571 }
10572
10573 if (regno == HI_REGNUM)
10574 {
10575 if (REG_P (dest))
10576 {
10577 mips_emit_move (temp, src);
10578 if (TARGET_64BIT)
10579 emit_insn (gen_mthisi_di (gen_rtx_REG (TImode, MD_REG_FIRST),
10580 temp, gen_rtx_REG (DImode, LO_REGNUM)));
10581 else
10582 emit_insn (gen_mthisi_di (gen_rtx_REG (DImode, MD_REG_FIRST),
10583 temp, gen_rtx_REG (SImode, LO_REGNUM)));
10584 }
10585 else
10586 {
10587 if (TARGET_64BIT)
10588 emit_insn (gen_mfhidi_ti (temp,
10589 gen_rtx_REG (TImode, MD_REG_FIRST)));
10590 else
10591 emit_insn (gen_mfhisi_di (temp,
10592 gen_rtx_REG (DImode, MD_REG_FIRST)));
10593 mips_emit_move (dest, temp);
10594 }
10595 }
10596 else if (mips_direct_save_slot_move_p (regno, mem, mem == src))
10597 mips_emit_move (dest, src);
10598 else
10599 {
10600 gcc_assert (!reg_overlap_mentioned_p (dest, temp));
10601 mips_emit_move (temp, src);
10602 mips_emit_move (dest, temp);
10603 }
10604 if (MEM_P (dest))
10605 mips_set_frame_expr (mips_frame_set (dest, src));
10606 }
10607 \f
10608 /* If we're generating n32 or n64 abicalls, and the current function
10609 does not use $28 as its global pointer, emit a cplocal directive.
10610 Use pic_offset_table_rtx as the argument to the directive. */
10611
10612 static void
10613 mips_output_cplocal (void)
10614 {
10615 if (!TARGET_EXPLICIT_RELOCS
10616 && mips_must_initialize_gp_p ()
10617 && cfun->machine->global_pointer != GLOBAL_POINTER_REGNUM)
10618 output_asm_insn (".cplocal %+", 0);
10619 }
10620
10621 /* Implement TARGET_OUTPUT_FUNCTION_PROLOGUE. */
10622
10623 static void
10624 mips_output_function_prologue (FILE *file, HOST_WIDE_INT size ATTRIBUTE_UNUSED)
10625 {
10626 const char *fnname;
10627
10628 /* In MIPS16 mode, we may need to generate a non-MIPS16 stub to handle
10629 floating-point arguments. */
10630 if (TARGET_MIPS16
10631 && TARGET_HARD_FLOAT_ABI
10632 && crtl->args.info.fp_code != 0)
10633 mips16_build_function_stub ();
10634
10635 /* Get the function name the same way that toplev.c does before calling
10636 assemble_start_function. This is needed so that the name used here
10637 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
10638 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
10639 mips_start_function_definition (fnname, TARGET_MIPS16);
10640
10641 /* Output MIPS-specific frame information. */
10642 if (!flag_inhibit_size_directive)
10643 {
10644 const struct mips_frame_info *frame;
10645
10646 frame = &cfun->machine->frame;
10647
10648 /* .frame FRAMEREG, FRAMESIZE, RETREG. */
10649 fprintf (file,
10650 "\t.frame\t%s," HOST_WIDE_INT_PRINT_DEC ",%s\t\t"
10651 "# vars= " HOST_WIDE_INT_PRINT_DEC
10652 ", regs= %d/%d"
10653 ", args= " HOST_WIDE_INT_PRINT_DEC
10654 ", gp= " HOST_WIDE_INT_PRINT_DEC "\n",
10655 reg_names[frame_pointer_needed
10656 ? HARD_FRAME_POINTER_REGNUM
10657 : STACK_POINTER_REGNUM],
10658 (frame_pointer_needed
10659 ? frame->total_size - frame->hard_frame_pointer_offset
10660 : frame->total_size),
10661 reg_names[RETURN_ADDR_REGNUM],
10662 frame->var_size,
10663 frame->num_gp, frame->num_fp,
10664 frame->args_size,
10665 frame->cprestore_size);
10666
10667 /* .mask MASK, OFFSET. */
10668 fprintf (file, "\t.mask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
10669 frame->mask, frame->gp_save_offset);
10670
10671 /* .fmask MASK, OFFSET. */
10672 fprintf (file, "\t.fmask\t0x%08x," HOST_WIDE_INT_PRINT_DEC "\n",
10673 frame->fmask, frame->fp_save_offset);
10674 }
10675
10676 /* Handle the initialization of $gp for SVR4 PIC, if applicable.
10677 Also emit the ".set noreorder; .set nomacro" sequence for functions
10678 that need it. */
10679 if (mips_must_initialize_gp_p ()
10680 && mips_current_loadgp_style () == LOADGP_OLDABI)
10681 {
10682 if (TARGET_MIPS16)
10683 {
10684 /* This is a fixed-form sequence. The position of the
10685 first two instructions is important because of the
10686 way _gp_disp is defined. */
10687 output_asm_insn ("li\t$2,%%hi(_gp_disp)", 0);
10688 output_asm_insn ("addiu\t$3,$pc,%%lo(_gp_disp)", 0);
10689 output_asm_insn ("sll\t$2,16", 0);
10690 output_asm_insn ("addu\t$2,$3", 0);
10691 }
10692 else
10693 {
10694 /* .cpload must be in a .set noreorder but not a
10695 .set nomacro block. */
10696 mips_push_asm_switch (&mips_noreorder);
10697 output_asm_insn (".cpload\t%^", 0);
10698 if (!cfun->machine->all_noreorder_p)
10699 mips_pop_asm_switch (&mips_noreorder);
10700 else
10701 mips_push_asm_switch (&mips_nomacro);
10702 }
10703 }
10704 else if (cfun->machine->all_noreorder_p)
10705 {
10706 mips_push_asm_switch (&mips_noreorder);
10707 mips_push_asm_switch (&mips_nomacro);
10708 }
10709
10710 /* Tell the assembler which register we're using as the global
10711 pointer. This is needed for thunks, since they can use either
10712 explicit relocs or assembler macros. */
10713 mips_output_cplocal ();
10714 }
10715
10716 /* Implement TARGET_OUTPUT_FUNCTION_EPILOGUE. */
10717
10718 static void
10719 mips_output_function_epilogue (FILE *file ATTRIBUTE_UNUSED,
10720 HOST_WIDE_INT size ATTRIBUTE_UNUSED)
10721 {
10722 const char *fnname;
10723
10724 /* Reinstate the normal $gp. */
10725 SET_REGNO (pic_offset_table_rtx, GLOBAL_POINTER_REGNUM);
10726 mips_output_cplocal ();
10727
10728 if (cfun->machine->all_noreorder_p)
10729 {
10730 mips_pop_asm_switch (&mips_nomacro);
10731 mips_pop_asm_switch (&mips_noreorder);
10732 }
10733
10734 /* Get the function name the same way that toplev.c does before calling
10735 assemble_start_function. This is needed so that the name used here
10736 exactly matches the name used in ASM_DECLARE_FUNCTION_NAME. */
10737 fnname = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0);
10738 mips_end_function_definition (fnname);
10739 }
10740 \f
10741 /* Emit an optimisation barrier for accesses to the current frame. */
10742
10743 static void
10744 mips_frame_barrier (void)
10745 {
10746 emit_clobber (gen_frame_mem (BLKmode, stack_pointer_rtx));
10747 }
10748
10749
10750 /* The __gnu_local_gp symbol. */
10751
10752 static GTY(()) rtx mips_gnu_local_gp;
10753
10754 /* If we're generating n32 or n64 abicalls, emit instructions
10755 to set up the global pointer. */
10756
10757 static void
10758 mips_emit_loadgp (void)
10759 {
10760 rtx addr, offset, incoming_address, base, index, pic_reg;
10761
10762 pic_reg = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx;
10763 switch (mips_current_loadgp_style ())
10764 {
10765 case LOADGP_ABSOLUTE:
10766 if (mips_gnu_local_gp == NULL)
10767 {
10768 mips_gnu_local_gp = gen_rtx_SYMBOL_REF (Pmode, "__gnu_local_gp");
10769 SYMBOL_REF_FLAGS (mips_gnu_local_gp) |= SYMBOL_FLAG_LOCAL;
10770 }
10771 emit_insn (PMODE_INSN (gen_loadgp_absolute,
10772 (pic_reg, mips_gnu_local_gp)));
10773 break;
10774
10775 case LOADGP_OLDABI:
10776 /* Added by mips_output_function_prologue. */
10777 break;
10778
10779 case LOADGP_NEWABI:
10780 addr = XEXP (DECL_RTL (current_function_decl), 0);
10781 offset = mips_unspec_address (addr, SYMBOL_GOTOFF_LOADGP);
10782 incoming_address = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
10783 emit_insn (PMODE_INSN (gen_loadgp_newabi,
10784 (pic_reg, offset, incoming_address)));
10785 break;
10786
10787 case LOADGP_RTP:
10788 base = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_BASE));
10789 index = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (VXWORKS_GOTT_INDEX));
10790 emit_insn (PMODE_INSN (gen_loadgp_rtp, (pic_reg, base, index)));
10791 break;
10792
10793 default:
10794 return;
10795 }
10796
10797 if (TARGET_MIPS16)
10798 emit_insn (PMODE_INSN (gen_copygp_mips16,
10799 (pic_offset_table_rtx, pic_reg)));
10800
10801 /* Emit a blockage if there are implicit uses of the GP register.
10802 This includes profiled functions, because FUNCTION_PROFILE uses
10803 a jal macro. */
10804 if (!TARGET_EXPLICIT_RELOCS || crtl->profile)
10805 emit_insn (gen_loadgp_blockage ());
10806 }
10807
10808 #define PROBE_INTERVAL (1 << STACK_CHECK_PROBE_INTERVAL_EXP)
10809
10810 #if PROBE_INTERVAL > 32768
10811 #error Cannot use indexed addressing mode for stack probing
10812 #endif
10813
10814 /* Emit code to probe a range of stack addresses from FIRST to FIRST+SIZE,
10815 inclusive. These are offsets from the current stack pointer. */
10816
10817 static void
10818 mips_emit_probe_stack_range (HOST_WIDE_INT first, HOST_WIDE_INT size)
10819 {
10820 if (TARGET_MIPS16)
10821 sorry ("-fstack-check=specific not implemented for MIPS16");
10822
10823 /* See if we have a constant small number of probes to generate. If so,
10824 that's the easy case. */
10825 if (first + size <= 32768)
10826 {
10827 HOST_WIDE_INT i;
10828
10829 /* Probe at FIRST + N * PROBE_INTERVAL for values of N from 1 until
10830 it exceeds SIZE. If only one probe is needed, this will not
10831 generate any code. Then probe at FIRST + SIZE. */
10832 for (i = PROBE_INTERVAL; i < size; i += PROBE_INTERVAL)
10833 emit_stack_probe (plus_constant (Pmode, stack_pointer_rtx,
10834 -(first + i)));
10835
10836 emit_stack_probe (plus_constant (Pmode, stack_pointer_rtx,
10837 -(first + size)));
10838 }
10839
10840 /* Otherwise, do the same as above, but in a loop. Note that we must be
10841 extra careful with variables wrapping around because we might be at
10842 the very top (or the very bottom) of the address space and we have
10843 to be able to handle this case properly; in particular, we use an
10844 equality test for the loop condition. */
10845 else
10846 {
10847 HOST_WIDE_INT rounded_size;
10848 rtx r3 = MIPS_PROLOGUE_TEMP (Pmode);
10849 rtx r12 = MIPS_PROLOGUE_TEMP2 (Pmode);
10850
10851 /* Sanity check for the addressing mode we're going to use. */
10852 gcc_assert (first <= 32768);
10853
10854
10855 /* Step 1: round SIZE to the previous multiple of the interval. */
10856
10857 rounded_size = size & -PROBE_INTERVAL;
10858
10859
10860 /* Step 2: compute initial and final value of the loop counter. */
10861
10862 /* TEST_ADDR = SP + FIRST. */
10863 emit_insn (gen_rtx_SET (VOIDmode, r3,
10864 plus_constant (Pmode, stack_pointer_rtx,
10865 -first)));
10866
10867 /* LAST_ADDR = SP + FIRST + ROUNDED_SIZE. */
10868 if (rounded_size > 32768)
10869 {
10870 emit_move_insn (r12, GEN_INT (rounded_size));
10871 emit_insn (gen_rtx_SET (VOIDmode, r12,
10872 gen_rtx_MINUS (Pmode, r3, r12)));
10873 }
10874 else
10875 emit_insn (gen_rtx_SET (VOIDmode, r12,
10876 plus_constant (Pmode, r3, -rounded_size)));
10877
10878
10879 /* Step 3: the loop
10880
10881 while (TEST_ADDR != LAST_ADDR)
10882 {
10883 TEST_ADDR = TEST_ADDR + PROBE_INTERVAL
10884 probe at TEST_ADDR
10885 }
10886
10887 probes at FIRST + N * PROBE_INTERVAL for values of N from 1
10888 until it is equal to ROUNDED_SIZE. */
10889
10890 emit_insn (PMODE_INSN (gen_probe_stack_range, (r3, r3, r12)));
10891
10892
10893 /* Step 4: probe at FIRST + SIZE if we cannot assert at compile-time
10894 that SIZE is equal to ROUNDED_SIZE. */
10895
10896 if (size != rounded_size)
10897 emit_stack_probe (plus_constant (Pmode, r12, rounded_size - size));
10898 }
10899
10900 /* Make sure nothing is scheduled before we are done. */
10901 emit_insn (gen_blockage ());
10902 }
10903
10904 /* Probe a range of stack addresses from REG1 to REG2 inclusive. These are
10905 absolute addresses. */
10906
10907 const char *
10908 mips_output_probe_stack_range (rtx reg1, rtx reg2)
10909 {
10910 static int labelno = 0;
10911 char loop_lab[32], end_lab[32], tmp[64];
10912 rtx xops[2];
10913
10914 ASM_GENERATE_INTERNAL_LABEL (loop_lab, "LPSRL", labelno);
10915 ASM_GENERATE_INTERNAL_LABEL (end_lab, "LPSRE", labelno++);
10916
10917 ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, loop_lab);
10918
10919 /* Jump to END_LAB if TEST_ADDR == LAST_ADDR. */
10920 xops[0] = reg1;
10921 xops[1] = reg2;
10922 strcpy (tmp, "%(%<beq\t%0,%1,");
10923 output_asm_insn (strcat (tmp, &end_lab[1]), xops);
10924
10925 /* TEST_ADDR = TEST_ADDR + PROBE_INTERVAL. */
10926 xops[1] = GEN_INT (-PROBE_INTERVAL);
10927 if (TARGET_64BIT && TARGET_LONG64)
10928 output_asm_insn ("daddiu\t%0,%0,%1", xops);
10929 else
10930 output_asm_insn ("addiu\t%0,%0,%1", xops);
10931
10932 /* Probe at TEST_ADDR and branch. */
10933 fprintf (asm_out_file, "\tb\t");
10934 assemble_name_raw (asm_out_file, loop_lab);
10935 fputc ('\n', asm_out_file);
10936 if (TARGET_64BIT)
10937 output_asm_insn ("sd\t$0,0(%0)%)", xops);
10938 else
10939 output_asm_insn ("sw\t$0,0(%0)%)", xops);
10940
10941 ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, end_lab);
10942
10943 return "";
10944 }
10945
10946 /* A for_each_rtx callback. Stop the search if *X is a kernel register. */
10947
10948 static int
10949 mips_kernel_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
10950 {
10951 return REG_P (*x) && KERNEL_REG_P (REGNO (*x));
10952 }
10953
10954 /* Expand the "prologue" pattern. */
10955
10956 void
10957 mips_expand_prologue (void)
10958 {
10959 const struct mips_frame_info *frame;
10960 HOST_WIDE_INT size;
10961 unsigned int nargs;
10962 rtx insn;
10963
10964 if (cfun->machine->global_pointer != INVALID_REGNUM)
10965 {
10966 /* Check whether an insn uses pic_offset_table_rtx, either explicitly
10967 or implicitly. If so, we can commit to using a global pointer
10968 straight away, otherwise we need to defer the decision. */
10969 if (mips_cfun_has_inflexible_gp_ref_p ()
10970 || mips_cfun_has_flexible_gp_ref_p ())
10971 {
10972 cfun->machine->must_initialize_gp_p = true;
10973 cfun->machine->must_restore_gp_when_clobbered_p = true;
10974 }
10975
10976 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
10977 }
10978
10979 frame = &cfun->machine->frame;
10980 size = frame->total_size;
10981
10982 if (flag_stack_usage_info)
10983 current_function_static_stack_size = size;
10984
10985 if (flag_stack_check == STATIC_BUILTIN_STACK_CHECK && size)
10986 mips_emit_probe_stack_range (STACK_CHECK_PROTECT, size);
10987
10988 /* Save the registers. Allocate up to MIPS_MAX_FIRST_STACK_STEP
10989 bytes beforehand; this is enough to cover the register save area
10990 without going out of range. */
10991 if (((frame->mask | frame->fmask | frame->acc_mask) != 0)
10992 || frame->num_cop0_regs > 0)
10993 {
10994 HOST_WIDE_INT step1;
10995
10996 step1 = MIN (size, MIPS_MAX_FIRST_STACK_STEP);
10997 if (GENERATE_MIPS16E_SAVE_RESTORE)
10998 {
10999 HOST_WIDE_INT offset;
11000 unsigned int mask, regno;
11001
11002 /* Try to merge argument stores into the save instruction. */
11003 nargs = mips16e_collect_argument_saves ();
11004
11005 /* Build the save instruction. */
11006 mask = frame->mask;
11007 insn = mips16e_build_save_restore (false, &mask, &offset,
11008 nargs, step1);
11009 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11010 mips_frame_barrier ();
11011 size -= step1;
11012
11013 /* Check if we need to save other registers. */
11014 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
11015 if (BITSET_P (mask, regno - GP_REG_FIRST))
11016 {
11017 offset -= UNITS_PER_WORD;
11018 mips_save_restore_reg (word_mode, regno,
11019 offset, mips_save_reg);
11020 }
11021 }
11022 else
11023 {
11024 if (cfun->machine->interrupt_handler_p)
11025 {
11026 HOST_WIDE_INT offset;
11027 rtx mem;
11028
11029 /* If this interrupt is using a shadow register set, we need to
11030 get the stack pointer from the previous register set. */
11031 if (cfun->machine->use_shadow_register_set_p)
11032 emit_insn (gen_mips_rdpgpr (stack_pointer_rtx,
11033 stack_pointer_rtx));
11034
11035 if (!cfun->machine->keep_interrupts_masked_p)
11036 {
11037 /* Move from COP0 Cause to K0. */
11038 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K0_REG_NUM),
11039 gen_rtx_REG (SImode,
11040 COP0_CAUSE_REG_NUM)));
11041 /* Move from COP0 EPC to K1. */
11042 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
11043 gen_rtx_REG (SImode,
11044 COP0_EPC_REG_NUM)));
11045 }
11046
11047 /* Allocate the first part of the frame. */
11048 insn = gen_add3_insn (stack_pointer_rtx, stack_pointer_rtx,
11049 GEN_INT (-step1));
11050 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11051 mips_frame_barrier ();
11052 size -= step1;
11053
11054 /* Start at the uppermost location for saving. */
11055 offset = frame->cop0_sp_offset - size;
11056 if (!cfun->machine->keep_interrupts_masked_p)
11057 {
11058 /* Push EPC into its stack slot. */
11059 mem = gen_frame_mem (word_mode,
11060 plus_constant (Pmode, stack_pointer_rtx,
11061 offset));
11062 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
11063 offset -= UNITS_PER_WORD;
11064 }
11065
11066 /* Move from COP0 Status to K1. */
11067 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, K1_REG_NUM),
11068 gen_rtx_REG (SImode,
11069 COP0_STATUS_REG_NUM)));
11070
11071 /* Right justify the RIPL in k0. */
11072 if (!cfun->machine->keep_interrupts_masked_p)
11073 emit_insn (gen_lshrsi3 (gen_rtx_REG (SImode, K0_REG_NUM),
11074 gen_rtx_REG (SImode, K0_REG_NUM),
11075 GEN_INT (CAUSE_IPL)));
11076
11077 /* Push Status into its stack slot. */
11078 mem = gen_frame_mem (word_mode,
11079 plus_constant (Pmode, stack_pointer_rtx,
11080 offset));
11081 mips_emit_move (mem, gen_rtx_REG (word_mode, K1_REG_NUM));
11082 offset -= UNITS_PER_WORD;
11083
11084 /* Insert the RIPL into our copy of SR (k1) as the new IPL. */
11085 if (!cfun->machine->keep_interrupts_masked_p)
11086 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11087 GEN_INT (6),
11088 GEN_INT (SR_IPL),
11089 gen_rtx_REG (SImode, K0_REG_NUM)));
11090
11091 if (!cfun->machine->keep_interrupts_masked_p)
11092 /* Enable interrupts by clearing the KSU ERL and EXL bits.
11093 IE is already the correct value, so we don't have to do
11094 anything explicit. */
11095 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11096 GEN_INT (4),
11097 GEN_INT (SR_EXL),
11098 gen_rtx_REG (SImode, GP_REG_FIRST)));
11099 else
11100 /* Disable interrupts by clearing the KSU, ERL, EXL,
11101 and IE bits. */
11102 emit_insn (gen_insvsi (gen_rtx_REG (SImode, K1_REG_NUM),
11103 GEN_INT (5),
11104 GEN_INT (SR_IE),
11105 gen_rtx_REG (SImode, GP_REG_FIRST)));
11106 }
11107 else
11108 {
11109 insn = gen_add3_insn (stack_pointer_rtx,
11110 stack_pointer_rtx,
11111 GEN_INT (-step1));
11112 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11113 mips_frame_barrier ();
11114 size -= step1;
11115 }
11116 mips_for_each_saved_acc (size, mips_save_reg);
11117 mips_for_each_saved_gpr_and_fpr (size, mips_save_reg);
11118 }
11119 }
11120
11121 /* Allocate the rest of the frame. */
11122 if (size > 0)
11123 {
11124 if (SMALL_OPERAND (-size))
11125 RTX_FRAME_RELATED_P (emit_insn (gen_add3_insn (stack_pointer_rtx,
11126 stack_pointer_rtx,
11127 GEN_INT (-size)))) = 1;
11128 else
11129 {
11130 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (size));
11131 if (TARGET_MIPS16)
11132 {
11133 /* There are no instructions to add or subtract registers
11134 from the stack pointer, so use the frame pointer as a
11135 temporary. We should always be using a frame pointer
11136 in this case anyway. */
11137 gcc_assert (frame_pointer_needed);
11138 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11139 emit_insn (gen_sub3_insn (hard_frame_pointer_rtx,
11140 hard_frame_pointer_rtx,
11141 MIPS_PROLOGUE_TEMP (Pmode)));
11142 mips_emit_move (stack_pointer_rtx, hard_frame_pointer_rtx);
11143 }
11144 else
11145 emit_insn (gen_sub3_insn (stack_pointer_rtx,
11146 stack_pointer_rtx,
11147 MIPS_PROLOGUE_TEMP (Pmode)));
11148
11149 /* Describe the combined effect of the previous instructions. */
11150 mips_set_frame_expr
11151 (gen_rtx_SET (VOIDmode, stack_pointer_rtx,
11152 plus_constant (Pmode, stack_pointer_rtx, -size)));
11153 }
11154 mips_frame_barrier ();
11155 }
11156
11157 /* Set up the frame pointer, if we're using one. */
11158 if (frame_pointer_needed)
11159 {
11160 HOST_WIDE_INT offset;
11161
11162 offset = frame->hard_frame_pointer_offset;
11163 if (offset == 0)
11164 {
11165 insn = mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11166 RTX_FRAME_RELATED_P (insn) = 1;
11167 }
11168 else if (SMALL_OPERAND (offset))
11169 {
11170 insn = gen_add3_insn (hard_frame_pointer_rtx,
11171 stack_pointer_rtx, GEN_INT (offset));
11172 RTX_FRAME_RELATED_P (emit_insn (insn)) = 1;
11173 }
11174 else
11175 {
11176 mips_emit_move (MIPS_PROLOGUE_TEMP (Pmode), GEN_INT (offset));
11177 mips_emit_move (hard_frame_pointer_rtx, stack_pointer_rtx);
11178 emit_insn (gen_add3_insn (hard_frame_pointer_rtx,
11179 hard_frame_pointer_rtx,
11180 MIPS_PROLOGUE_TEMP (Pmode)));
11181 mips_set_frame_expr
11182 (gen_rtx_SET (VOIDmode, hard_frame_pointer_rtx,
11183 plus_constant (Pmode, stack_pointer_rtx, offset)));
11184 }
11185 }
11186
11187 mips_emit_loadgp ();
11188
11189 /* Initialize the $gp save slot. */
11190 if (mips_cfun_has_cprestore_slot_p ())
11191 {
11192 rtx base, mem, gp, temp;
11193 HOST_WIDE_INT offset;
11194
11195 mips_get_cprestore_base_and_offset (&base, &offset, false);
11196 mem = gen_frame_mem (Pmode, plus_constant (Pmode, base, offset));
11197 gp = TARGET_MIPS16 ? MIPS16_PIC_TEMP : pic_offset_table_rtx;
11198 temp = (SMALL_OPERAND (offset)
11199 ? gen_rtx_SCRATCH (Pmode)
11200 : MIPS_PROLOGUE_TEMP (Pmode));
11201 emit_insn (PMODE_INSN (gen_potential_cprestore,
11202 (mem, GEN_INT (offset), gp, temp)));
11203
11204 mips_get_cprestore_base_and_offset (&base, &offset, true);
11205 mem = gen_frame_mem (Pmode, plus_constant (Pmode, base, offset));
11206 emit_insn (PMODE_INSN (gen_use_cprestore, (mem)));
11207 }
11208
11209 /* We need to search back to the last use of K0 or K1. */
11210 if (cfun->machine->interrupt_handler_p)
11211 {
11212 for (insn = get_last_insn (); insn != NULL_RTX; insn = PREV_INSN (insn))
11213 if (INSN_P (insn)
11214 && for_each_rtx (&PATTERN (insn), mips_kernel_reg_p, NULL))
11215 break;
11216 /* Emit a move from K1 to COP0 Status after insn. */
11217 gcc_assert (insn != NULL_RTX);
11218 emit_insn_after (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
11219 gen_rtx_REG (SImode, K1_REG_NUM)),
11220 insn);
11221 }
11222
11223 /* If we are profiling, make sure no instructions are scheduled before
11224 the call to mcount. */
11225 if (crtl->profile)
11226 emit_insn (gen_blockage ());
11227 }
11228 \f
11229 /* Attach all pending register saves to the previous instruction.
11230 Return that instruction. */
11231
11232 static rtx
11233 mips_epilogue_emit_cfa_restores (void)
11234 {
11235 rtx insn;
11236
11237 insn = get_last_insn ();
11238 gcc_assert (insn && !REG_NOTES (insn));
11239 if (mips_epilogue.cfa_restores)
11240 {
11241 RTX_FRAME_RELATED_P (insn) = 1;
11242 REG_NOTES (insn) = mips_epilogue.cfa_restores;
11243 mips_epilogue.cfa_restores = 0;
11244 }
11245 return insn;
11246 }
11247
11248 /* Like mips_epilogue_emit_cfa_restores, but also record that the CFA is
11249 now at REG + OFFSET. */
11250
11251 static void
11252 mips_epilogue_set_cfa (rtx reg, HOST_WIDE_INT offset)
11253 {
11254 rtx insn;
11255
11256 insn = mips_epilogue_emit_cfa_restores ();
11257 if (reg != mips_epilogue.cfa_reg || offset != mips_epilogue.cfa_offset)
11258 {
11259 RTX_FRAME_RELATED_P (insn) = 1;
11260 REG_NOTES (insn) = alloc_reg_note (REG_CFA_DEF_CFA,
11261 plus_constant (Pmode, reg, offset),
11262 REG_NOTES (insn));
11263 mips_epilogue.cfa_reg = reg;
11264 mips_epilogue.cfa_offset = offset;
11265 }
11266 }
11267
11268 /* Emit instructions to restore register REG from slot MEM. Also update
11269 the cfa_restores list. */
11270
11271 static void
11272 mips_restore_reg (rtx reg, rtx mem)
11273 {
11274 /* There's no MIPS16 instruction to load $31 directly. Load into
11275 $7 instead and adjust the return insn appropriately. */
11276 if (TARGET_MIPS16 && REGNO (reg) == RETURN_ADDR_REGNUM)
11277 reg = gen_rtx_REG (GET_MODE (reg), GP_REG_FIRST + 7);
11278 else if (GET_MODE (reg) == DFmode && !TARGET_FLOAT64)
11279 {
11280 mips_add_cfa_restore (mips_subword (reg, true));
11281 mips_add_cfa_restore (mips_subword (reg, false));
11282 }
11283 else
11284 mips_add_cfa_restore (reg);
11285
11286 mips_emit_save_slot_move (reg, mem, MIPS_EPILOGUE_TEMP (GET_MODE (reg)));
11287 if (REGNO (reg) == REGNO (mips_epilogue.cfa_reg))
11288 /* The CFA is currently defined in terms of the register whose
11289 value we have just restored. Redefine the CFA in terms of
11290 the stack pointer. */
11291 mips_epilogue_set_cfa (stack_pointer_rtx,
11292 mips_epilogue.cfa_restore_sp_offset);
11293 }
11294
11295 /* Emit code to set the stack pointer to BASE + OFFSET, given that
11296 BASE + OFFSET is NEW_FRAME_SIZE bytes below the top of the frame.
11297 BASE, if not the stack pointer, is available as a temporary. */
11298
11299 static void
11300 mips_deallocate_stack (rtx base, rtx offset, HOST_WIDE_INT new_frame_size)
11301 {
11302 if (base == stack_pointer_rtx && offset == const0_rtx)
11303 return;
11304
11305 mips_frame_barrier ();
11306 if (offset == const0_rtx)
11307 {
11308 emit_move_insn (stack_pointer_rtx, base);
11309 mips_epilogue_set_cfa (stack_pointer_rtx, new_frame_size);
11310 }
11311 else if (TARGET_MIPS16 && base != stack_pointer_rtx)
11312 {
11313 emit_insn (gen_add3_insn (base, base, offset));
11314 mips_epilogue_set_cfa (base, new_frame_size);
11315 emit_move_insn (stack_pointer_rtx, base);
11316 }
11317 else
11318 {
11319 emit_insn (gen_add3_insn (stack_pointer_rtx, base, offset));
11320 mips_epilogue_set_cfa (stack_pointer_rtx, new_frame_size);
11321 }
11322 }
11323
11324 /* Emit any instructions needed before a return. */
11325
11326 void
11327 mips_expand_before_return (void)
11328 {
11329 /* When using a call-clobbered gp, we start out with unified call
11330 insns that include instructions to restore the gp. We then split
11331 these unified calls after reload. These split calls explicitly
11332 clobber gp, so there is no need to define
11333 PIC_OFFSET_TABLE_REG_CALL_CLOBBERED.
11334
11335 For consistency, we should also insert an explicit clobber of $28
11336 before return insns, so that the post-reload optimizers know that
11337 the register is not live on exit. */
11338 if (TARGET_CALL_CLOBBERED_GP)
11339 emit_clobber (pic_offset_table_rtx);
11340 }
11341
11342 /* Expand an "epilogue" or "sibcall_epilogue" pattern; SIBCALL_P
11343 says which. */
11344
11345 void
11346 mips_expand_epilogue (bool sibcall_p)
11347 {
11348 const struct mips_frame_info *frame;
11349 HOST_WIDE_INT step1, step2;
11350 rtx base, adjust, insn;
11351 bool use_jraddiusp_p = false;
11352
11353 if (!sibcall_p && mips_can_use_return_insn ())
11354 {
11355 emit_jump_insn (gen_return ());
11356 return;
11357 }
11358
11359 /* In MIPS16 mode, if the return value should go into a floating-point
11360 register, we need to call a helper routine to copy it over. */
11361 if (mips16_cfun_returns_in_fpr_p ())
11362 mips16_copy_fpr_return_value ();
11363
11364 /* Split the frame into two. STEP1 is the amount of stack we should
11365 deallocate before restoring the registers. STEP2 is the amount we
11366 should deallocate afterwards.
11367
11368 Start off by assuming that no registers need to be restored. */
11369 frame = &cfun->machine->frame;
11370 step1 = frame->total_size;
11371 step2 = 0;
11372
11373 /* Work out which register holds the frame address. */
11374 if (!frame_pointer_needed)
11375 base = stack_pointer_rtx;
11376 else
11377 {
11378 base = hard_frame_pointer_rtx;
11379 step1 -= frame->hard_frame_pointer_offset;
11380 }
11381 mips_epilogue.cfa_reg = base;
11382 mips_epilogue.cfa_offset = step1;
11383 mips_epilogue.cfa_restores = NULL_RTX;
11384
11385 /* If we need to restore registers, deallocate as much stack as
11386 possible in the second step without going out of range. */
11387 if ((frame->mask | frame->fmask | frame->acc_mask) != 0
11388 || frame->num_cop0_regs > 0)
11389 {
11390 step2 = MIN (step1, MIPS_MAX_FIRST_STACK_STEP);
11391 step1 -= step2;
11392 }
11393
11394 /* Get an rtx for STEP1 that we can add to BASE. */
11395 adjust = GEN_INT (step1);
11396 if (!SMALL_OPERAND (step1))
11397 {
11398 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), adjust);
11399 adjust = MIPS_EPILOGUE_TEMP (Pmode);
11400 }
11401 mips_deallocate_stack (base, adjust, step2);
11402
11403 /* If we're using addressing macros, $gp is implicitly used by all
11404 SYMBOL_REFs. We must emit a blockage insn before restoring $gp
11405 from the stack. */
11406 if (TARGET_CALL_SAVED_GP && !TARGET_EXPLICIT_RELOCS)
11407 emit_insn (gen_blockage ());
11408
11409 mips_epilogue.cfa_restore_sp_offset = step2;
11410 if (GENERATE_MIPS16E_SAVE_RESTORE && frame->mask != 0)
11411 {
11412 unsigned int regno, mask;
11413 HOST_WIDE_INT offset;
11414 rtx restore;
11415
11416 /* Generate the restore instruction. */
11417 mask = frame->mask;
11418 restore = mips16e_build_save_restore (true, &mask, &offset, 0, step2);
11419
11420 /* Restore any other registers manually. */
11421 for (regno = GP_REG_FIRST; regno < GP_REG_LAST; regno++)
11422 if (BITSET_P (mask, regno - GP_REG_FIRST))
11423 {
11424 offset -= UNITS_PER_WORD;
11425 mips_save_restore_reg (word_mode, regno, offset, mips_restore_reg);
11426 }
11427
11428 /* Restore the remaining registers and deallocate the final bit
11429 of the frame. */
11430 mips_frame_barrier ();
11431 emit_insn (restore);
11432 mips_epilogue_set_cfa (stack_pointer_rtx, 0);
11433 }
11434 else
11435 {
11436 /* Restore the registers. */
11437 mips_for_each_saved_acc (frame->total_size - step2, mips_restore_reg);
11438 mips_for_each_saved_gpr_and_fpr (frame->total_size - step2,
11439 mips_restore_reg);
11440
11441 if (cfun->machine->interrupt_handler_p)
11442 {
11443 HOST_WIDE_INT offset;
11444 rtx mem;
11445
11446 offset = frame->cop0_sp_offset - (frame->total_size - step2);
11447 if (!cfun->machine->keep_interrupts_masked_p)
11448 {
11449 /* Restore the original EPC. */
11450 mem = gen_frame_mem (word_mode,
11451 plus_constant (Pmode, stack_pointer_rtx,
11452 offset));
11453 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
11454 offset -= UNITS_PER_WORD;
11455
11456 /* Move to COP0 EPC. */
11457 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_EPC_REG_NUM),
11458 gen_rtx_REG (SImode, K0_REG_NUM)));
11459 }
11460
11461 /* Restore the original Status. */
11462 mem = gen_frame_mem (word_mode,
11463 plus_constant (Pmode, stack_pointer_rtx,
11464 offset));
11465 mips_emit_move (gen_rtx_REG (word_mode, K0_REG_NUM), mem);
11466 offset -= UNITS_PER_WORD;
11467
11468 /* If we don't use shadow register set, we need to update SP. */
11469 if (!cfun->machine->use_shadow_register_set_p)
11470 mips_deallocate_stack (stack_pointer_rtx, GEN_INT (step2), 0);
11471 else
11472 /* The choice of position is somewhat arbitrary in this case. */
11473 mips_epilogue_emit_cfa_restores ();
11474
11475 /* Move to COP0 Status. */
11476 emit_insn (gen_cop0_move (gen_rtx_REG (SImode, COP0_STATUS_REG_NUM),
11477 gen_rtx_REG (SImode, K0_REG_NUM)));
11478 }
11479 else if (TARGET_MICROMIPS
11480 && !crtl->calls_eh_return
11481 && !sibcall_p
11482 && step2 > 0
11483 && mips_unsigned_immediate_p (step2, 5, 2))
11484 use_jraddiusp_p = true;
11485 else
11486 /* Deallocate the final bit of the frame. */
11487 mips_deallocate_stack (stack_pointer_rtx, GEN_INT (step2), 0);
11488 }
11489
11490 if (!use_jraddiusp_p)
11491 gcc_assert (!mips_epilogue.cfa_restores);
11492
11493 /* Add in the __builtin_eh_return stack adjustment. We need to
11494 use a temporary in MIPS16 code. */
11495 if (crtl->calls_eh_return)
11496 {
11497 if (TARGET_MIPS16)
11498 {
11499 mips_emit_move (MIPS_EPILOGUE_TEMP (Pmode), stack_pointer_rtx);
11500 emit_insn (gen_add3_insn (MIPS_EPILOGUE_TEMP (Pmode),
11501 MIPS_EPILOGUE_TEMP (Pmode),
11502 EH_RETURN_STACKADJ_RTX));
11503 mips_emit_move (stack_pointer_rtx, MIPS_EPILOGUE_TEMP (Pmode));
11504 }
11505 else
11506 emit_insn (gen_add3_insn (stack_pointer_rtx,
11507 stack_pointer_rtx,
11508 EH_RETURN_STACKADJ_RTX));
11509 }
11510
11511 if (!sibcall_p)
11512 {
11513 mips_expand_before_return ();
11514 if (cfun->machine->interrupt_handler_p)
11515 {
11516 /* Interrupt handlers generate eret or deret. */
11517 if (cfun->machine->use_debug_exception_return_p)
11518 emit_jump_insn (gen_mips_deret ());
11519 else
11520 emit_jump_insn (gen_mips_eret ());
11521 }
11522 else
11523 {
11524 rtx pat;
11525
11526 /* When generating MIPS16 code, the normal
11527 mips_for_each_saved_gpr_and_fpr path will restore the return
11528 address into $7 rather than $31. */
11529 if (TARGET_MIPS16
11530 && !GENERATE_MIPS16E_SAVE_RESTORE
11531 && BITSET_P (frame->mask, RETURN_ADDR_REGNUM))
11532 {
11533 /* simple_returns cannot rely on values that are only available
11534 on paths through the epilogue (because return paths that do
11535 not pass through the epilogue may nevertheless reuse a
11536 simple_return that occurs at the end of the epilogue).
11537 Use a normal return here instead. */
11538 rtx reg = gen_rtx_REG (Pmode, GP_REG_FIRST + 7);
11539 pat = gen_return_internal (reg);
11540 }
11541 else if (use_jraddiusp_p)
11542 pat = gen_jraddiusp (GEN_INT (step2));
11543 else
11544 {
11545 rtx reg = gen_rtx_REG (Pmode, RETURN_ADDR_REGNUM);
11546 pat = gen_simple_return_internal (reg);
11547 }
11548 emit_jump_insn (pat);
11549 if (use_jraddiusp_p)
11550 mips_epilogue_set_cfa (stack_pointer_rtx, step2);
11551 }
11552 }
11553
11554 /* Search from the beginning to the first use of K0 or K1. */
11555 if (cfun->machine->interrupt_handler_p
11556 && !cfun->machine->keep_interrupts_masked_p)
11557 {
11558 for (insn = get_insns (); insn != NULL_RTX; insn = NEXT_INSN (insn))
11559 if (INSN_P (insn)
11560 && for_each_rtx (&PATTERN(insn), mips_kernel_reg_p, NULL))
11561 break;
11562 gcc_assert (insn != NULL_RTX);
11563 /* Insert disable interrupts before the first use of K0 or K1. */
11564 emit_insn_before (gen_mips_di (), insn);
11565 emit_insn_before (gen_mips_ehb (), insn);
11566 }
11567 }
11568 \f
11569 /* Return nonzero if this function is known to have a null epilogue.
11570 This allows the optimizer to omit jumps to jumps if no stack
11571 was created. */
11572
11573 bool
11574 mips_can_use_return_insn (void)
11575 {
11576 /* Interrupt handlers need to go through the epilogue. */
11577 if (cfun->machine->interrupt_handler_p)
11578 return false;
11579
11580 if (!reload_completed)
11581 return false;
11582
11583 if (crtl->profile)
11584 return false;
11585
11586 /* In MIPS16 mode, a function that returns a floating-point value
11587 needs to arrange to copy the return value into the floating-point
11588 registers. */
11589 if (mips16_cfun_returns_in_fpr_p ())
11590 return false;
11591
11592 return cfun->machine->frame.total_size == 0;
11593 }
11594 \f
11595 /* Return true if register REGNO can store a value of mode MODE.
11596 The result of this function is cached in mips_hard_regno_mode_ok. */
11597
11598 static bool
11599 mips_hard_regno_mode_ok_p (unsigned int regno, enum machine_mode mode)
11600 {
11601 unsigned int size;
11602 enum mode_class mclass;
11603
11604 if (mode == CCV2mode)
11605 return (ISA_HAS_8CC
11606 && ST_REG_P (regno)
11607 && (regno - ST_REG_FIRST) % 2 == 0);
11608
11609 if (mode == CCV4mode)
11610 return (ISA_HAS_8CC
11611 && ST_REG_P (regno)
11612 && (regno - ST_REG_FIRST) % 4 == 0);
11613
11614 if (mode == CCmode)
11615 return ISA_HAS_8CC ? ST_REG_P (regno) : regno == FPSW_REGNUM;
11616
11617 size = GET_MODE_SIZE (mode);
11618 mclass = GET_MODE_CLASS (mode);
11619
11620 if (GP_REG_P (regno))
11621 return ((regno - GP_REG_FIRST) & 1) == 0 || size <= UNITS_PER_WORD;
11622
11623 if (FP_REG_P (regno)
11624 && (((regno - FP_REG_FIRST) % MAX_FPRS_PER_FMT) == 0
11625 || (MIN_FPRS_PER_FMT == 1 && size <= UNITS_PER_FPREG)))
11626 {
11627 /* Allow 64-bit vector modes for Loongson-2E/2F. */
11628 if (TARGET_LOONGSON_VECTORS
11629 && (mode == V2SImode
11630 || mode == V4HImode
11631 || mode == V8QImode
11632 || mode == DImode))
11633 return true;
11634
11635 if (mclass == MODE_FLOAT
11636 || mclass == MODE_COMPLEX_FLOAT
11637 || mclass == MODE_VECTOR_FLOAT)
11638 return size <= UNITS_PER_FPVALUE;
11639
11640 /* Allow integer modes that fit into a single register. We need
11641 to put integers into FPRs when using instructions like CVT
11642 and TRUNC. There's no point allowing sizes smaller than a word,
11643 because the FPU has no appropriate load/store instructions. */
11644 if (mclass == MODE_INT)
11645 return size >= MIN_UNITS_PER_WORD && size <= UNITS_PER_FPREG;
11646 }
11647
11648 if (ACC_REG_P (regno)
11649 && (INTEGRAL_MODE_P (mode) || ALL_FIXED_POINT_MODE_P (mode)))
11650 {
11651 if (MD_REG_P (regno))
11652 {
11653 /* After a multiplication or division, clobbering HI makes
11654 the value of LO unpredictable, and vice versa. This means
11655 that, for all interesting cases, HI and LO are effectively
11656 a single register.
11657
11658 We model this by requiring that any value that uses HI
11659 also uses LO. */
11660 if (size <= UNITS_PER_WORD * 2)
11661 return regno == (size <= UNITS_PER_WORD ? LO_REGNUM : MD_REG_FIRST);
11662 }
11663 else
11664 {
11665 /* DSP accumulators do not have the same restrictions as
11666 HI and LO, so we can treat them as normal doubleword
11667 registers. */
11668 if (size <= UNITS_PER_WORD)
11669 return true;
11670
11671 if (size <= UNITS_PER_WORD * 2
11672 && ((regno - DSP_ACC_REG_FIRST) & 1) == 0)
11673 return true;
11674 }
11675 }
11676
11677 if (ALL_COP_REG_P (regno))
11678 return mclass == MODE_INT && size <= UNITS_PER_WORD;
11679
11680 if (regno == GOT_VERSION_REGNUM)
11681 return mode == SImode;
11682
11683 return false;
11684 }
11685
11686 /* Implement HARD_REGNO_NREGS. */
11687
11688 unsigned int
11689 mips_hard_regno_nregs (int regno, enum machine_mode mode)
11690 {
11691 if (ST_REG_P (regno))
11692 /* The size of FP status registers is always 4, because they only hold
11693 CCmode values, and CCmode is always considered to be 4 bytes wide. */
11694 return (GET_MODE_SIZE (mode) + 3) / 4;
11695
11696 if (FP_REG_P (regno))
11697 return (GET_MODE_SIZE (mode) + UNITS_PER_FPREG - 1) / UNITS_PER_FPREG;
11698
11699 /* All other registers are word-sized. */
11700 return (GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
11701 }
11702
11703 /* Implement CLASS_MAX_NREGS, taking the maximum of the cases
11704 in mips_hard_regno_nregs. */
11705
11706 int
11707 mips_class_max_nregs (enum reg_class rclass, enum machine_mode mode)
11708 {
11709 int size;
11710 HARD_REG_SET left;
11711
11712 size = 0x8000;
11713 COPY_HARD_REG_SET (left, reg_class_contents[(int) rclass]);
11714 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) ST_REGS]))
11715 {
11716 if (HARD_REGNO_MODE_OK (ST_REG_FIRST, mode))
11717 size = MIN (size, 4);
11718 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) ST_REGS]);
11719 }
11720 if (hard_reg_set_intersect_p (left, reg_class_contents[(int) FP_REGS]))
11721 {
11722 if (HARD_REGNO_MODE_OK (FP_REG_FIRST, mode))
11723 size = MIN (size, UNITS_PER_FPREG);
11724 AND_COMPL_HARD_REG_SET (left, reg_class_contents[(int) FP_REGS]);
11725 }
11726 if (!hard_reg_set_empty_p (left))
11727 size = MIN (size, UNITS_PER_WORD);
11728 return (GET_MODE_SIZE (mode) + size - 1) / size;
11729 }
11730
11731 /* Implement CANNOT_CHANGE_MODE_CLASS. */
11732
11733 bool
11734 mips_cannot_change_mode_class (enum machine_mode from,
11735 enum machine_mode to,
11736 enum reg_class rclass)
11737 {
11738 /* Allow conversions between different Loongson integer vectors,
11739 and between those vectors and DImode. */
11740 if (GET_MODE_SIZE (from) == 8 && GET_MODE_SIZE (to) == 8
11741 && INTEGRAL_MODE_P (from) && INTEGRAL_MODE_P (to))
11742 return false;
11743
11744 /* Otherwise, there are several problems with changing the modes of
11745 values in floating-point registers:
11746
11747 - When a multi-word value is stored in paired floating-point
11748 registers, the first register always holds the low word. We
11749 therefore can't allow FPRs to change between single-word and
11750 multi-word modes on big-endian targets.
11751
11752 - GCC assumes that each word of a multiword register can be
11753 accessed individually using SUBREGs. This is not true for
11754 floating-point registers if they are bigger than a word.
11755
11756 - Loading a 32-bit value into a 64-bit floating-point register
11757 will not sign-extend the value, despite what LOAD_EXTEND_OP
11758 says. We can't allow FPRs to change from SImode to a wider
11759 mode on 64-bit targets.
11760
11761 - If the FPU has already interpreted a value in one format, we
11762 must not ask it to treat the value as having a different
11763 format.
11764
11765 We therefore disallow all mode changes involving FPRs. */
11766
11767 return reg_classes_intersect_p (FP_REGS, rclass);
11768 }
11769
11770 /* Implement target hook small_register_classes_for_mode_p. */
11771
11772 static bool
11773 mips_small_register_classes_for_mode_p (enum machine_mode mode
11774 ATTRIBUTE_UNUSED)
11775 {
11776 return TARGET_MIPS16;
11777 }
11778
11779 /* Return true if moves in mode MODE can use the FPU's mov.fmt instruction. */
11780
11781 static bool
11782 mips_mode_ok_for_mov_fmt_p (enum machine_mode mode)
11783 {
11784 switch (mode)
11785 {
11786 case SFmode:
11787 return TARGET_HARD_FLOAT;
11788
11789 case DFmode:
11790 return TARGET_HARD_FLOAT && TARGET_DOUBLE_FLOAT;
11791
11792 case V2SFmode:
11793 return TARGET_HARD_FLOAT && TARGET_PAIRED_SINGLE_FLOAT;
11794
11795 default:
11796 return false;
11797 }
11798 }
11799
11800 /* Implement MODES_TIEABLE_P. */
11801
11802 bool
11803 mips_modes_tieable_p (enum machine_mode mode1, enum machine_mode mode2)
11804 {
11805 /* FPRs allow no mode punning, so it's not worth tying modes if we'd
11806 prefer to put one of them in FPRs. */
11807 return (mode1 == mode2
11808 || (!mips_mode_ok_for_mov_fmt_p (mode1)
11809 && !mips_mode_ok_for_mov_fmt_p (mode2)));
11810 }
11811
11812 /* Implement TARGET_PREFERRED_RELOAD_CLASS. */
11813
11814 static reg_class_t
11815 mips_preferred_reload_class (rtx x, reg_class_t rclass)
11816 {
11817 if (mips_dangerous_for_la25_p (x) && reg_class_subset_p (LEA_REGS, rclass))
11818 return LEA_REGS;
11819
11820 if (reg_class_subset_p (FP_REGS, rclass)
11821 && mips_mode_ok_for_mov_fmt_p (GET_MODE (x)))
11822 return FP_REGS;
11823
11824 if (reg_class_subset_p (GR_REGS, rclass))
11825 rclass = GR_REGS;
11826
11827 if (TARGET_MIPS16 && reg_class_subset_p (M16_REGS, rclass))
11828 rclass = M16_REGS;
11829
11830 return rclass;
11831 }
11832
11833 /* RCLASS is a class involved in a REGISTER_MOVE_COST calculation.
11834 Return a "canonical" class to represent it in later calculations. */
11835
11836 static reg_class_t
11837 mips_canonicalize_move_class (reg_class_t rclass)
11838 {
11839 /* All moves involving accumulator registers have the same cost. */
11840 if (reg_class_subset_p (rclass, ACC_REGS))
11841 rclass = ACC_REGS;
11842
11843 /* Likewise promote subclasses of general registers to the most
11844 interesting containing class. */
11845 if (TARGET_MIPS16 && reg_class_subset_p (rclass, M16_REGS))
11846 rclass = M16_REGS;
11847 else if (reg_class_subset_p (rclass, GENERAL_REGS))
11848 rclass = GENERAL_REGS;
11849
11850 return rclass;
11851 }
11852
11853 /* Return the cost of moving a value of mode MODE from a register of
11854 class FROM to a GPR. Return 0 for classes that are unions of other
11855 classes handled by this function. */
11856
11857 static int
11858 mips_move_to_gpr_cost (enum machine_mode mode ATTRIBUTE_UNUSED,
11859 reg_class_t from)
11860 {
11861 switch (from)
11862 {
11863 case GENERAL_REGS:
11864 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
11865 return 2;
11866
11867 case ACC_REGS:
11868 /* MFLO and MFHI. */
11869 return 6;
11870
11871 case FP_REGS:
11872 /* MFC1, etc. */
11873 return 4;
11874
11875 case ST_REGS:
11876 /* LUI followed by MOVF. */
11877 return 4;
11878
11879 case COP0_REGS:
11880 case COP2_REGS:
11881 case COP3_REGS:
11882 /* This choice of value is historical. */
11883 return 5;
11884
11885 default:
11886 return 0;
11887 }
11888 }
11889
11890 /* Return the cost of moving a value of mode MODE from a GPR to a
11891 register of class TO. Return 0 for classes that are unions of
11892 other classes handled by this function. */
11893
11894 static int
11895 mips_move_from_gpr_cost (enum machine_mode mode, reg_class_t to)
11896 {
11897 switch (to)
11898 {
11899 case GENERAL_REGS:
11900 /* A MIPS16 MOVE instruction, or a non-MIPS16 MOVE macro. */
11901 return 2;
11902
11903 case ACC_REGS:
11904 /* MTLO and MTHI. */
11905 return 6;
11906
11907 case FP_REGS:
11908 /* MTC1, etc. */
11909 return 4;
11910
11911 case ST_REGS:
11912 /* A secondary reload through an FPR scratch. */
11913 return (mips_register_move_cost (mode, GENERAL_REGS, FP_REGS)
11914 + mips_register_move_cost (mode, FP_REGS, ST_REGS));
11915
11916 case COP0_REGS:
11917 case COP2_REGS:
11918 case COP3_REGS:
11919 /* This choice of value is historical. */
11920 return 5;
11921
11922 default:
11923 return 0;
11924 }
11925 }
11926
11927 /* Implement TARGET_REGISTER_MOVE_COST. Return 0 for classes that are the
11928 maximum of the move costs for subclasses; regclass will work out
11929 the maximum for us. */
11930
11931 static int
11932 mips_register_move_cost (enum machine_mode mode,
11933 reg_class_t from, reg_class_t to)
11934 {
11935 reg_class_t dregs;
11936 int cost1, cost2;
11937
11938 from = mips_canonicalize_move_class (from);
11939 to = mips_canonicalize_move_class (to);
11940
11941 /* Handle moves that can be done without using general-purpose registers. */
11942 if (from == FP_REGS)
11943 {
11944 if (to == FP_REGS && mips_mode_ok_for_mov_fmt_p (mode))
11945 /* MOV.FMT. */
11946 return 4;
11947 if (to == ST_REGS)
11948 /* The sequence generated by mips_expand_fcc_reload. */
11949 return 8;
11950 }
11951
11952 /* Handle cases in which only one class deviates from the ideal. */
11953 dregs = TARGET_MIPS16 ? M16_REGS : GENERAL_REGS;
11954 if (from == dregs)
11955 return mips_move_from_gpr_cost (mode, to);
11956 if (to == dregs)
11957 return mips_move_to_gpr_cost (mode, from);
11958
11959 /* Handles cases that require a GPR temporary. */
11960 cost1 = mips_move_to_gpr_cost (mode, from);
11961 if (cost1 != 0)
11962 {
11963 cost2 = mips_move_from_gpr_cost (mode, to);
11964 if (cost2 != 0)
11965 return cost1 + cost2;
11966 }
11967
11968 return 0;
11969 }
11970
11971 /* Implement TARGET_MEMORY_MOVE_COST. */
11972
11973 static int
11974 mips_memory_move_cost (enum machine_mode mode, reg_class_t rclass, bool in)
11975 {
11976 return (mips_cost->memory_latency
11977 + memory_move_secondary_cost (mode, rclass, in));
11978 }
11979
11980 /* Return the register class required for a secondary register when
11981 copying between one of the registers in RCLASS and value X, which
11982 has mode MODE. X is the source of the move if IN_P, otherwise it
11983 is the destination. Return NO_REGS if no secondary register is
11984 needed. */
11985
11986 enum reg_class
11987 mips_secondary_reload_class (enum reg_class rclass,
11988 enum machine_mode mode, rtx x, bool in_p)
11989 {
11990 int regno;
11991
11992 /* If X is a constant that cannot be loaded into $25, it must be loaded
11993 into some other GPR. No other register class allows a direct move. */
11994 if (mips_dangerous_for_la25_p (x))
11995 return reg_class_subset_p (rclass, LEA_REGS) ? NO_REGS : LEA_REGS;
11996
11997 regno = true_regnum (x);
11998 if (TARGET_MIPS16)
11999 {
12000 /* In MIPS16 mode, every move must involve a member of M16_REGS. */
12001 if (!reg_class_subset_p (rclass, M16_REGS) && !M16_REG_P (regno))
12002 return M16_REGS;
12003
12004 return NO_REGS;
12005 }
12006
12007 /* Copying from accumulator registers to anywhere other than a general
12008 register requires a temporary general register. */
12009 if (reg_class_subset_p (rclass, ACC_REGS))
12010 return GP_REG_P (regno) ? NO_REGS : GR_REGS;
12011 if (ACC_REG_P (regno))
12012 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
12013
12014 /* We can only copy a value to a condition code register from a
12015 floating-point register, and even then we require a scratch
12016 floating-point register. We can only copy a value out of a
12017 condition-code register into a general register. */
12018 if (reg_class_subset_p (rclass, ST_REGS))
12019 {
12020 if (in_p)
12021 return FP_REGS;
12022 return GP_REG_P (regno) ? NO_REGS : GR_REGS;
12023 }
12024 if (ST_REG_P (regno))
12025 {
12026 if (!in_p)
12027 return FP_REGS;
12028 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
12029 }
12030
12031 if (reg_class_subset_p (rclass, FP_REGS))
12032 {
12033 if (MEM_P (x)
12034 && (GET_MODE_SIZE (mode) == 4 || GET_MODE_SIZE (mode) == 8))
12035 /* In this case we can use lwc1, swc1, ldc1 or sdc1. We'll use
12036 pairs of lwc1s and swc1s if ldc1 and sdc1 are not supported. */
12037 return NO_REGS;
12038
12039 if (GP_REG_P (regno) || x == CONST0_RTX (mode))
12040 /* In this case we can use mtc1, mfc1, dmtc1 or dmfc1. */
12041 return NO_REGS;
12042
12043 if (CONSTANT_P (x) && !targetm.cannot_force_const_mem (mode, x))
12044 /* We can force the constant to memory and use lwc1
12045 and ldc1. As above, we will use pairs of lwc1s if
12046 ldc1 is not supported. */
12047 return NO_REGS;
12048
12049 if (FP_REG_P (regno) && mips_mode_ok_for_mov_fmt_p (mode))
12050 /* In this case we can use mov.fmt. */
12051 return NO_REGS;
12052
12053 /* Otherwise, we need to reload through an integer register. */
12054 return GR_REGS;
12055 }
12056 if (FP_REG_P (regno))
12057 return reg_class_subset_p (rclass, GR_REGS) ? NO_REGS : GR_REGS;
12058
12059 return NO_REGS;
12060 }
12061
12062 /* Implement TARGET_MODE_REP_EXTENDED. */
12063
12064 static int
12065 mips_mode_rep_extended (enum machine_mode mode, enum machine_mode mode_rep)
12066 {
12067 /* On 64-bit targets, SImode register values are sign-extended to DImode. */
12068 if (TARGET_64BIT && mode == SImode && mode_rep == DImode)
12069 return SIGN_EXTEND;
12070
12071 return UNKNOWN;
12072 }
12073 \f
12074 /* Implement TARGET_VALID_POINTER_MODE. */
12075
12076 static bool
12077 mips_valid_pointer_mode (enum machine_mode mode)
12078 {
12079 return mode == SImode || (TARGET_64BIT && mode == DImode);
12080 }
12081
12082 /* Implement TARGET_VECTOR_MODE_SUPPORTED_P. */
12083
12084 static bool
12085 mips_vector_mode_supported_p (enum machine_mode mode)
12086 {
12087 switch (mode)
12088 {
12089 case V2SFmode:
12090 return TARGET_PAIRED_SINGLE_FLOAT;
12091
12092 case V2HImode:
12093 case V4QImode:
12094 case V2HQmode:
12095 case V2UHQmode:
12096 case V2HAmode:
12097 case V2UHAmode:
12098 case V4QQmode:
12099 case V4UQQmode:
12100 return TARGET_DSP;
12101
12102 case V2SImode:
12103 case V4HImode:
12104 case V8QImode:
12105 return TARGET_LOONGSON_VECTORS;
12106
12107 default:
12108 return false;
12109 }
12110 }
12111
12112 /* Implement TARGET_SCALAR_MODE_SUPPORTED_P. */
12113
12114 static bool
12115 mips_scalar_mode_supported_p (enum machine_mode mode)
12116 {
12117 if (ALL_FIXED_POINT_MODE_P (mode)
12118 && GET_MODE_PRECISION (mode) <= 2 * BITS_PER_WORD)
12119 return true;
12120
12121 return default_scalar_mode_supported_p (mode);
12122 }
12123 \f
12124 /* Implement TARGET_VECTORIZE_PREFERRED_SIMD_MODE. */
12125
12126 static enum machine_mode
12127 mips_preferred_simd_mode (enum machine_mode mode ATTRIBUTE_UNUSED)
12128 {
12129 if (TARGET_PAIRED_SINGLE_FLOAT
12130 && mode == SFmode)
12131 return V2SFmode;
12132 return word_mode;
12133 }
12134
12135 /* Implement TARGET_INIT_LIBFUNCS. */
12136
12137 static void
12138 mips_init_libfuncs (void)
12139 {
12140 if (TARGET_FIX_VR4120)
12141 {
12142 /* Register the special divsi3 and modsi3 functions needed to work
12143 around VR4120 division errata. */
12144 set_optab_libfunc (sdiv_optab, SImode, "__vr4120_divsi3");
12145 set_optab_libfunc (smod_optab, SImode, "__vr4120_modsi3");
12146 }
12147
12148 if (TARGET_MIPS16 && TARGET_HARD_FLOAT_ABI)
12149 {
12150 /* Register the MIPS16 -mhard-float stubs. */
12151 set_optab_libfunc (add_optab, SFmode, "__mips16_addsf3");
12152 set_optab_libfunc (sub_optab, SFmode, "__mips16_subsf3");
12153 set_optab_libfunc (smul_optab, SFmode, "__mips16_mulsf3");
12154 set_optab_libfunc (sdiv_optab, SFmode, "__mips16_divsf3");
12155
12156 set_optab_libfunc (eq_optab, SFmode, "__mips16_eqsf2");
12157 set_optab_libfunc (ne_optab, SFmode, "__mips16_nesf2");
12158 set_optab_libfunc (gt_optab, SFmode, "__mips16_gtsf2");
12159 set_optab_libfunc (ge_optab, SFmode, "__mips16_gesf2");
12160 set_optab_libfunc (lt_optab, SFmode, "__mips16_ltsf2");
12161 set_optab_libfunc (le_optab, SFmode, "__mips16_lesf2");
12162 set_optab_libfunc (unord_optab, SFmode, "__mips16_unordsf2");
12163
12164 set_conv_libfunc (sfix_optab, SImode, SFmode, "__mips16_fix_truncsfsi");
12165 set_conv_libfunc (sfloat_optab, SFmode, SImode, "__mips16_floatsisf");
12166 set_conv_libfunc (ufloat_optab, SFmode, SImode, "__mips16_floatunsisf");
12167
12168 if (TARGET_DOUBLE_FLOAT)
12169 {
12170 set_optab_libfunc (add_optab, DFmode, "__mips16_adddf3");
12171 set_optab_libfunc (sub_optab, DFmode, "__mips16_subdf3");
12172 set_optab_libfunc (smul_optab, DFmode, "__mips16_muldf3");
12173 set_optab_libfunc (sdiv_optab, DFmode, "__mips16_divdf3");
12174
12175 set_optab_libfunc (eq_optab, DFmode, "__mips16_eqdf2");
12176 set_optab_libfunc (ne_optab, DFmode, "__mips16_nedf2");
12177 set_optab_libfunc (gt_optab, DFmode, "__mips16_gtdf2");
12178 set_optab_libfunc (ge_optab, DFmode, "__mips16_gedf2");
12179 set_optab_libfunc (lt_optab, DFmode, "__mips16_ltdf2");
12180 set_optab_libfunc (le_optab, DFmode, "__mips16_ledf2");
12181 set_optab_libfunc (unord_optab, DFmode, "__mips16_unorddf2");
12182
12183 set_conv_libfunc (sext_optab, DFmode, SFmode,
12184 "__mips16_extendsfdf2");
12185 set_conv_libfunc (trunc_optab, SFmode, DFmode,
12186 "__mips16_truncdfsf2");
12187 set_conv_libfunc (sfix_optab, SImode, DFmode,
12188 "__mips16_fix_truncdfsi");
12189 set_conv_libfunc (sfloat_optab, DFmode, SImode,
12190 "__mips16_floatsidf");
12191 set_conv_libfunc (ufloat_optab, DFmode, SImode,
12192 "__mips16_floatunsidf");
12193 }
12194 }
12195
12196 /* The MIPS16 ISA does not have an encoding for "sync", so we rely
12197 on an external non-MIPS16 routine to implement __sync_synchronize.
12198 Similarly for the rest of the ll/sc libfuncs. */
12199 if (TARGET_MIPS16)
12200 {
12201 synchronize_libfunc = init_one_libfunc ("__sync_synchronize");
12202 init_sync_libfuncs (UNITS_PER_WORD);
12203 }
12204 }
12205
12206 /* Build up a multi-insn sequence that loads label TARGET into $AT. */
12207
12208 static void
12209 mips_process_load_label (rtx target)
12210 {
12211 rtx base, gp, intop;
12212 HOST_WIDE_INT offset;
12213
12214 mips_multi_start ();
12215 switch (mips_abi)
12216 {
12217 case ABI_N32:
12218 mips_multi_add_insn ("lw\t%@,%%got_page(%0)(%+)", target, 0);
12219 mips_multi_add_insn ("addiu\t%@,%@,%%got_ofst(%0)", target, 0);
12220 break;
12221
12222 case ABI_64:
12223 mips_multi_add_insn ("ld\t%@,%%got_page(%0)(%+)", target, 0);
12224 mips_multi_add_insn ("daddiu\t%@,%@,%%got_ofst(%0)", target, 0);
12225 break;
12226
12227 default:
12228 gp = pic_offset_table_rtx;
12229 if (mips_cfun_has_cprestore_slot_p ())
12230 {
12231 gp = gen_rtx_REG (Pmode, AT_REGNUM);
12232 mips_get_cprestore_base_and_offset (&base, &offset, true);
12233 if (!SMALL_OPERAND (offset))
12234 {
12235 intop = GEN_INT (CONST_HIGH_PART (offset));
12236 mips_multi_add_insn ("lui\t%0,%1", gp, intop, 0);
12237 mips_multi_add_insn ("addu\t%0,%0,%1", gp, base, 0);
12238
12239 base = gp;
12240 offset = CONST_LOW_PART (offset);
12241 }
12242 intop = GEN_INT (offset);
12243 if (ISA_HAS_LOAD_DELAY)
12244 mips_multi_add_insn ("lw\t%0,%1(%2)%#", gp, intop, base, 0);
12245 else
12246 mips_multi_add_insn ("lw\t%0,%1(%2)", gp, intop, base, 0);
12247 }
12248 if (ISA_HAS_LOAD_DELAY)
12249 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)%#", target, gp, 0);
12250 else
12251 mips_multi_add_insn ("lw\t%@,%%got(%0)(%1)", target, gp, 0);
12252 mips_multi_add_insn ("addiu\t%@,%@,%%lo(%0)", target, 0);
12253 break;
12254 }
12255 }
12256
12257 /* Return the number of instructions needed to load a label into $AT. */
12258
12259 static unsigned int
12260 mips_load_label_num_insns (void)
12261 {
12262 if (cfun->machine->load_label_num_insns == 0)
12263 {
12264 mips_process_load_label (pc_rtx);
12265 cfun->machine->load_label_num_insns = mips_multi_num_insns;
12266 }
12267 return cfun->machine->load_label_num_insns;
12268 }
12269
12270 /* Emit an asm sequence to start a noat block and load the address
12271 of a label into $1. */
12272
12273 void
12274 mips_output_load_label (rtx target)
12275 {
12276 mips_push_asm_switch (&mips_noat);
12277 if (TARGET_EXPLICIT_RELOCS)
12278 {
12279 mips_process_load_label (target);
12280 mips_multi_write ();
12281 }
12282 else
12283 {
12284 if (Pmode == DImode)
12285 output_asm_insn ("dla\t%@,%0", &target);
12286 else
12287 output_asm_insn ("la\t%@,%0", &target);
12288 }
12289 }
12290
12291 /* Return the length of INSN. LENGTH is the initial length computed by
12292 attributes in the machine-description file. */
12293
12294 int
12295 mips_adjust_insn_length (rtx insn, int length)
12296 {
12297 /* mips.md uses MAX_PIC_BRANCH_LENGTH as a placeholder for the length
12298 of a PIC long-branch sequence. Substitute the correct value. */
12299 if (length == MAX_PIC_BRANCH_LENGTH
12300 && INSN_CODE (insn) >= 0
12301 && get_attr_type (insn) == TYPE_BRANCH)
12302 {
12303 /* Add the branch-over instruction and its delay slot, if this
12304 is a conditional branch. */
12305 length = simplejump_p (insn) ? 0 : 8;
12306
12307 /* Add the size of a load into $AT. */
12308 length += BASE_INSN_LENGTH * mips_load_label_num_insns ();
12309
12310 /* Add the length of an indirect jump, ignoring the delay slot. */
12311 length += TARGET_COMPRESSION ? 2 : 4;
12312 }
12313
12314 /* A unconditional jump has an unfilled delay slot if it is not part
12315 of a sequence. A conditional jump normally has a delay slot, but
12316 does not on MIPS16. */
12317 if (CALL_P (insn) || (TARGET_MIPS16 ? simplejump_p (insn) : JUMP_P (insn)))
12318 length += TARGET_MIPS16 ? 2 : 4;
12319
12320 /* See how many nops might be needed to avoid hardware hazards. */
12321 if (!cfun->machine->ignore_hazard_length_p && INSN_CODE (insn) >= 0)
12322 switch (get_attr_hazard (insn))
12323 {
12324 case HAZARD_NONE:
12325 break;
12326
12327 case HAZARD_DELAY:
12328 length += NOP_INSN_LENGTH;
12329 break;
12330
12331 case HAZARD_HILO:
12332 length += NOP_INSN_LENGTH * 2;
12333 break;
12334 }
12335
12336 return length;
12337 }
12338
12339 /* Return the assembly code for INSN, which has the operands given by
12340 OPERANDS, and which branches to OPERANDS[0] if some condition is true.
12341 BRANCH_IF_TRUE is the asm template that should be used if OPERANDS[0]
12342 is in range of a direct branch. BRANCH_IF_FALSE is an inverted
12343 version of BRANCH_IF_TRUE. */
12344
12345 const char *
12346 mips_output_conditional_branch (rtx insn, rtx *operands,
12347 const char *branch_if_true,
12348 const char *branch_if_false)
12349 {
12350 unsigned int length;
12351 rtx taken, not_taken;
12352
12353 gcc_assert (LABEL_P (operands[0]));
12354
12355 length = get_attr_length (insn);
12356 if (length <= 8)
12357 {
12358 /* Just a simple conditional branch. */
12359 mips_branch_likely = (final_sequence && INSN_ANNULLED_BRANCH_P (insn));
12360 return branch_if_true;
12361 }
12362
12363 /* Generate a reversed branch around a direct jump. This fallback does
12364 not use branch-likely instructions. */
12365 mips_branch_likely = false;
12366 not_taken = gen_label_rtx ();
12367 taken = operands[0];
12368
12369 /* Generate the reversed branch to NOT_TAKEN. */
12370 operands[0] = not_taken;
12371 output_asm_insn (branch_if_false, operands);
12372
12373 /* If INSN has a delay slot, we must provide delay slots for both the
12374 branch to NOT_TAKEN and the conditional jump. We must also ensure
12375 that INSN's delay slot is executed in the appropriate cases. */
12376 if (final_sequence)
12377 {
12378 /* This first delay slot will always be executed, so use INSN's
12379 delay slot if is not annulled. */
12380 if (!INSN_ANNULLED_BRANCH_P (insn))
12381 {
12382 final_scan_insn (XVECEXP (final_sequence, 0, 1),
12383 asm_out_file, optimize, 1, NULL);
12384 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
12385 }
12386 else
12387 output_asm_insn ("nop", 0);
12388 fprintf (asm_out_file, "\n");
12389 }
12390
12391 /* Output the unconditional branch to TAKEN. */
12392 if (TARGET_ABSOLUTE_JUMPS)
12393 output_asm_insn (MIPS_ABSOLUTE_JUMP ("j\t%0%/"), &taken);
12394 else
12395 {
12396 mips_output_load_label (taken);
12397 output_asm_insn ("jr\t%@%]%/", 0);
12398 }
12399
12400 /* Now deal with its delay slot; see above. */
12401 if (final_sequence)
12402 {
12403 /* This delay slot will only be executed if the branch is taken.
12404 Use INSN's delay slot if is annulled. */
12405 if (INSN_ANNULLED_BRANCH_P (insn))
12406 {
12407 final_scan_insn (XVECEXP (final_sequence, 0, 1),
12408 asm_out_file, optimize, 1, NULL);
12409 INSN_DELETED_P (XVECEXP (final_sequence, 0, 1)) = 1;
12410 }
12411 else
12412 output_asm_insn ("nop", 0);
12413 fprintf (asm_out_file, "\n");
12414 }
12415
12416 /* Output NOT_TAKEN. */
12417 targetm.asm_out.internal_label (asm_out_file, "L",
12418 CODE_LABEL_NUMBER (not_taken));
12419 return "";
12420 }
12421
12422 /* Return the assembly code for INSN, which branches to OPERANDS[0]
12423 if some ordering condition is true. The condition is given by
12424 OPERANDS[1] if !INVERTED_P, otherwise it is the inverse of
12425 OPERANDS[1]. OPERANDS[2] is the comparison's first operand;
12426 its second is always zero. */
12427
12428 const char *
12429 mips_output_order_conditional_branch (rtx insn, rtx *operands, bool inverted_p)
12430 {
12431 const char *branch[2];
12432
12433 /* Make BRANCH[1] branch to OPERANDS[0] when the condition is true.
12434 Make BRANCH[0] branch on the inverse condition. */
12435 switch (GET_CODE (operands[1]))
12436 {
12437 /* These cases are equivalent to comparisons against zero. */
12438 case LEU:
12439 inverted_p = !inverted_p;
12440 /* Fall through. */
12441 case GTU:
12442 branch[!inverted_p] = MIPS_BRANCH ("bne", "%2,%.,%0");
12443 branch[inverted_p] = MIPS_BRANCH ("beq", "%2,%.,%0");
12444 break;
12445
12446 /* These cases are always true or always false. */
12447 case LTU:
12448 inverted_p = !inverted_p;
12449 /* Fall through. */
12450 case GEU:
12451 branch[!inverted_p] = MIPS_BRANCH ("beq", "%.,%.,%0");
12452 branch[inverted_p] = MIPS_BRANCH ("bne", "%.,%.,%0");
12453 break;
12454
12455 default:
12456 branch[!inverted_p] = MIPS_BRANCH ("b%C1z", "%2,%0");
12457 branch[inverted_p] = MIPS_BRANCH ("b%N1z", "%2,%0");
12458 break;
12459 }
12460 return mips_output_conditional_branch (insn, operands, branch[1], branch[0]);
12461 }
12462 \f
12463 /* Start a block of code that needs access to the LL, SC and SYNC
12464 instructions. */
12465
12466 static void
12467 mips_start_ll_sc_sync_block (void)
12468 {
12469 if (!ISA_HAS_LL_SC)
12470 {
12471 output_asm_insn (".set\tpush", 0);
12472 if (TARGET_64BIT)
12473 output_asm_insn (".set\tmips3", 0);
12474 else
12475 output_asm_insn (".set\tmips2", 0);
12476 }
12477 }
12478
12479 /* End a block started by mips_start_ll_sc_sync_block. */
12480
12481 static void
12482 mips_end_ll_sc_sync_block (void)
12483 {
12484 if (!ISA_HAS_LL_SC)
12485 output_asm_insn (".set\tpop", 0);
12486 }
12487
12488 /* Output and/or return the asm template for a sync instruction. */
12489
12490 const char *
12491 mips_output_sync (void)
12492 {
12493 mips_start_ll_sc_sync_block ();
12494 output_asm_insn ("sync", 0);
12495 mips_end_ll_sc_sync_block ();
12496 return "";
12497 }
12498
12499 /* Return the asm template associated with sync_insn1 value TYPE.
12500 IS_64BIT_P is true if we want a 64-bit rather than 32-bit operation. */
12501
12502 static const char *
12503 mips_sync_insn1_template (enum attr_sync_insn1 type, bool is_64bit_p)
12504 {
12505 switch (type)
12506 {
12507 case SYNC_INSN1_MOVE:
12508 return "move\t%0,%z2";
12509 case SYNC_INSN1_LI:
12510 return "li\t%0,%2";
12511 case SYNC_INSN1_ADDU:
12512 return is_64bit_p ? "daddu\t%0,%1,%z2" : "addu\t%0,%1,%z2";
12513 case SYNC_INSN1_ADDIU:
12514 return is_64bit_p ? "daddiu\t%0,%1,%2" : "addiu\t%0,%1,%2";
12515 case SYNC_INSN1_SUBU:
12516 return is_64bit_p ? "dsubu\t%0,%1,%z2" : "subu\t%0,%1,%z2";
12517 case SYNC_INSN1_AND:
12518 return "and\t%0,%1,%z2";
12519 case SYNC_INSN1_ANDI:
12520 return "andi\t%0,%1,%2";
12521 case SYNC_INSN1_OR:
12522 return "or\t%0,%1,%z2";
12523 case SYNC_INSN1_ORI:
12524 return "ori\t%0,%1,%2";
12525 case SYNC_INSN1_XOR:
12526 return "xor\t%0,%1,%z2";
12527 case SYNC_INSN1_XORI:
12528 return "xori\t%0,%1,%2";
12529 }
12530 gcc_unreachable ();
12531 }
12532
12533 /* Return the asm template associated with sync_insn2 value TYPE. */
12534
12535 static const char *
12536 mips_sync_insn2_template (enum attr_sync_insn2 type)
12537 {
12538 switch (type)
12539 {
12540 case SYNC_INSN2_NOP:
12541 gcc_unreachable ();
12542 case SYNC_INSN2_AND:
12543 return "and\t%0,%1,%z2";
12544 case SYNC_INSN2_XOR:
12545 return "xor\t%0,%1,%z2";
12546 case SYNC_INSN2_NOT:
12547 return "nor\t%0,%1,%.";
12548 }
12549 gcc_unreachable ();
12550 }
12551
12552 /* OPERANDS are the operands to a sync loop instruction and INDEX is
12553 the value of the one of the sync_* attributes. Return the operand
12554 referred to by the attribute, or DEFAULT_VALUE if the insn doesn't
12555 have the associated attribute. */
12556
12557 static rtx
12558 mips_get_sync_operand (rtx *operands, int index, rtx default_value)
12559 {
12560 if (index > 0)
12561 default_value = operands[index - 1];
12562 return default_value;
12563 }
12564
12565 /* INSN is a sync loop with operands OPERANDS. Build up a multi-insn
12566 sequence for it. */
12567
12568 static void
12569 mips_process_sync_loop (rtx insn, rtx *operands)
12570 {
12571 rtx at, mem, oldval, newval, inclusive_mask, exclusive_mask;
12572 rtx required_oldval, insn1_op2, tmp1, tmp2, tmp3, cmp;
12573 unsigned int tmp3_insn;
12574 enum attr_sync_insn1 insn1;
12575 enum attr_sync_insn2 insn2;
12576 bool is_64bit_p;
12577 int memmodel_attr;
12578 enum memmodel model;
12579
12580 /* Read an operand from the sync_WHAT attribute and store it in
12581 variable WHAT. DEFAULT is the default value if no attribute
12582 is specified. */
12583 #define READ_OPERAND(WHAT, DEFAULT) \
12584 WHAT = mips_get_sync_operand (operands, (int) get_attr_sync_##WHAT (insn), \
12585 DEFAULT)
12586
12587 /* Read the memory. */
12588 READ_OPERAND (mem, 0);
12589 gcc_assert (mem);
12590 is_64bit_p = (GET_MODE_BITSIZE (GET_MODE (mem)) == 64);
12591
12592 /* Read the other attributes. */
12593 at = gen_rtx_REG (GET_MODE (mem), AT_REGNUM);
12594 READ_OPERAND (oldval, at);
12595 READ_OPERAND (cmp, 0);
12596 READ_OPERAND (newval, at);
12597 READ_OPERAND (inclusive_mask, 0);
12598 READ_OPERAND (exclusive_mask, 0);
12599 READ_OPERAND (required_oldval, 0);
12600 READ_OPERAND (insn1_op2, 0);
12601 insn1 = get_attr_sync_insn1 (insn);
12602 insn2 = get_attr_sync_insn2 (insn);
12603
12604 /* Don't bother setting CMP result that is never used. */
12605 if (cmp && find_reg_note (insn, REG_UNUSED, cmp))
12606 cmp = 0;
12607
12608 memmodel_attr = get_attr_sync_memmodel (insn);
12609 switch (memmodel_attr)
12610 {
12611 case 10:
12612 model = MEMMODEL_ACQ_REL;
12613 break;
12614 case 11:
12615 model = MEMMODEL_ACQUIRE;
12616 break;
12617 default:
12618 model = (enum memmodel) INTVAL (operands[memmodel_attr]);
12619 }
12620
12621 mips_multi_start ();
12622
12623 /* Output the release side of the memory barrier. */
12624 if (need_atomic_barrier_p (model, true))
12625 {
12626 if (required_oldval == 0 && TARGET_OCTEON)
12627 {
12628 /* Octeon doesn't reorder reads, so a full barrier can be
12629 created by using SYNCW to order writes combined with the
12630 write from the following SC. When the SC successfully
12631 completes, we know that all preceding writes are also
12632 committed to the coherent memory system. It is possible
12633 for a single SYNCW to fail, but a pair of them will never
12634 fail, so we use two. */
12635 mips_multi_add_insn ("syncw", NULL);
12636 mips_multi_add_insn ("syncw", NULL);
12637 }
12638 else
12639 mips_multi_add_insn ("sync", NULL);
12640 }
12641
12642 /* Output the branch-back label. */
12643 mips_multi_add_label ("1:");
12644
12645 /* OLDVAL = *MEM. */
12646 mips_multi_add_insn (is_64bit_p ? "lld\t%0,%1" : "ll\t%0,%1",
12647 oldval, mem, NULL);
12648
12649 /* if ((OLDVAL & INCLUSIVE_MASK) != REQUIRED_OLDVAL) goto 2. */
12650 if (required_oldval)
12651 {
12652 if (inclusive_mask == 0)
12653 tmp1 = oldval;
12654 else
12655 {
12656 gcc_assert (oldval != at);
12657 mips_multi_add_insn ("and\t%0,%1,%2",
12658 at, oldval, inclusive_mask, NULL);
12659 tmp1 = at;
12660 }
12661 mips_multi_add_insn ("bne\t%0,%z1,2f", tmp1, required_oldval, NULL);
12662
12663 /* CMP = 0 [delay slot]. */
12664 if (cmp)
12665 mips_multi_add_insn ("li\t%0,0", cmp, NULL);
12666 }
12667
12668 /* $TMP1 = OLDVAL & EXCLUSIVE_MASK. */
12669 if (exclusive_mask == 0)
12670 tmp1 = const0_rtx;
12671 else
12672 {
12673 gcc_assert (oldval != at);
12674 mips_multi_add_insn ("and\t%0,%1,%z2",
12675 at, oldval, exclusive_mask, NULL);
12676 tmp1 = at;
12677 }
12678
12679 /* $TMP2 = INSN1 (OLDVAL, INSN1_OP2).
12680
12681 We can ignore moves if $TMP4 != INSN1_OP2, since we'll still emit
12682 at least one instruction in that case. */
12683 if (insn1 == SYNC_INSN1_MOVE
12684 && (tmp1 != const0_rtx || insn2 != SYNC_INSN2_NOP))
12685 tmp2 = insn1_op2;
12686 else
12687 {
12688 mips_multi_add_insn (mips_sync_insn1_template (insn1, is_64bit_p),
12689 newval, oldval, insn1_op2, NULL);
12690 tmp2 = newval;
12691 }
12692
12693 /* $TMP3 = INSN2 ($TMP2, INCLUSIVE_MASK). */
12694 if (insn2 == SYNC_INSN2_NOP)
12695 tmp3 = tmp2;
12696 else
12697 {
12698 mips_multi_add_insn (mips_sync_insn2_template (insn2),
12699 newval, tmp2, inclusive_mask, NULL);
12700 tmp3 = newval;
12701 }
12702 tmp3_insn = mips_multi_last_index ();
12703
12704 /* $AT = $TMP1 | $TMP3. */
12705 if (tmp1 == const0_rtx || tmp3 == const0_rtx)
12706 {
12707 mips_multi_set_operand (tmp3_insn, 0, at);
12708 tmp3 = at;
12709 }
12710 else
12711 {
12712 gcc_assert (tmp1 != tmp3);
12713 mips_multi_add_insn ("or\t%0,%1,%2", at, tmp1, tmp3, NULL);
12714 }
12715
12716 /* if (!commit (*MEM = $AT)) goto 1.
12717
12718 This will sometimes be a delayed branch; see the write code below
12719 for details. */
12720 mips_multi_add_insn (is_64bit_p ? "scd\t%0,%1" : "sc\t%0,%1", at, mem, NULL);
12721 mips_multi_add_insn ("beq%?\t%0,%.,1b", at, NULL);
12722
12723 /* if (INSN1 != MOVE && INSN1 != LI) NEWVAL = $TMP3 [delay slot]. */
12724 if (insn1 != SYNC_INSN1_MOVE && insn1 != SYNC_INSN1_LI && tmp3 != newval)
12725 {
12726 mips_multi_copy_insn (tmp3_insn);
12727 mips_multi_set_operand (mips_multi_last_index (), 0, newval);
12728 }
12729 else if (!(required_oldval && cmp))
12730 mips_multi_add_insn ("nop", NULL);
12731
12732 /* CMP = 1 -- either standalone or in a delay slot. */
12733 if (required_oldval && cmp)
12734 mips_multi_add_insn ("li\t%0,1", cmp, NULL);
12735
12736 /* Output the acquire side of the memory barrier. */
12737 if (TARGET_SYNC_AFTER_SC && need_atomic_barrier_p (model, false))
12738 mips_multi_add_insn ("sync", NULL);
12739
12740 /* Output the exit label, if needed. */
12741 if (required_oldval)
12742 mips_multi_add_label ("2:");
12743
12744 #undef READ_OPERAND
12745 }
12746
12747 /* Output and/or return the asm template for sync loop INSN, which has
12748 the operands given by OPERANDS. */
12749
12750 const char *
12751 mips_output_sync_loop (rtx insn, rtx *operands)
12752 {
12753 mips_process_sync_loop (insn, operands);
12754
12755 /* Use branch-likely instructions to work around the LL/SC R10000
12756 errata. */
12757 mips_branch_likely = TARGET_FIX_R10000;
12758
12759 mips_push_asm_switch (&mips_noreorder);
12760 mips_push_asm_switch (&mips_nomacro);
12761 mips_push_asm_switch (&mips_noat);
12762 mips_start_ll_sc_sync_block ();
12763
12764 mips_multi_write ();
12765
12766 mips_end_ll_sc_sync_block ();
12767 mips_pop_asm_switch (&mips_noat);
12768 mips_pop_asm_switch (&mips_nomacro);
12769 mips_pop_asm_switch (&mips_noreorder);
12770
12771 return "";
12772 }
12773
12774 /* Return the number of individual instructions in sync loop INSN,
12775 which has the operands given by OPERANDS. */
12776
12777 unsigned int
12778 mips_sync_loop_insns (rtx insn, rtx *operands)
12779 {
12780 mips_process_sync_loop (insn, operands);
12781 return mips_multi_num_insns;
12782 }
12783 \f
12784 /* Return the assembly code for DIV or DDIV instruction DIVISION, which has
12785 the operands given by OPERANDS. Add in a divide-by-zero check if needed.
12786
12787 When working around R4000 and R4400 errata, we need to make sure that
12788 the division is not immediately followed by a shift[1][2]. We also
12789 need to stop the division from being put into a branch delay slot[3].
12790 The easiest way to avoid both problems is to add a nop after the
12791 division. When a divide-by-zero check is needed, this nop can be
12792 used to fill the branch delay slot.
12793
12794 [1] If a double-word or a variable shift executes immediately
12795 after starting an integer division, the shift may give an
12796 incorrect result. See quotations of errata #16 and #28 from
12797 "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
12798 in mips.md for details.
12799
12800 [2] A similar bug to [1] exists for all revisions of the
12801 R4000 and the R4400 when run in an MC configuration.
12802 From "MIPS R4000MC Errata, Processor Revision 2.2 and 3.0":
12803
12804 "19. In this following sequence:
12805
12806 ddiv (or ddivu or div or divu)
12807 dsll32 (or dsrl32, dsra32)
12808
12809 if an MPT stall occurs, while the divide is slipping the cpu
12810 pipeline, then the following double shift would end up with an
12811 incorrect result.
12812
12813 Workaround: The compiler needs to avoid generating any
12814 sequence with divide followed by extended double shift."
12815
12816 This erratum is also present in "MIPS R4400MC Errata, Processor
12817 Revision 1.0" and "MIPS R4400MC Errata, Processor Revision 2.0
12818 & 3.0" as errata #10 and #4, respectively.
12819
12820 [3] From "MIPS R4000PC/SC Errata, Processor Revision 2.2 and 3.0"
12821 (also valid for MIPS R4000MC processors):
12822
12823 "52. R4000SC: This bug does not apply for the R4000PC.
12824
12825 There are two flavors of this bug:
12826
12827 1) If the instruction just after divide takes an RF exception
12828 (tlb-refill, tlb-invalid) and gets an instruction cache
12829 miss (both primary and secondary) and the line which is
12830 currently in secondary cache at this index had the first
12831 data word, where the bits 5..2 are set, then R4000 would
12832 get a wrong result for the div.
12833
12834 ##1
12835 nop
12836 div r8, r9
12837 ------------------- # end-of page. -tlb-refill
12838 nop
12839 ##2
12840 nop
12841 div r8, r9
12842 ------------------- # end-of page. -tlb-invalid
12843 nop
12844
12845 2) If the divide is in the taken branch delay slot, where the
12846 target takes RF exception and gets an I-cache miss for the
12847 exception vector or where I-cache miss occurs for the
12848 target address, under the above mentioned scenarios, the
12849 div would get wrong results.
12850
12851 ##1
12852 j r2 # to next page mapped or unmapped
12853 div r8,r9 # this bug would be there as long
12854 # as there is an ICache miss and
12855 nop # the "data pattern" is present
12856
12857 ##2
12858 beq r0, r0, NextPage # to Next page
12859 div r8,r9
12860 nop
12861
12862 This bug is present for div, divu, ddiv, and ddivu
12863 instructions.
12864
12865 Workaround: For item 1), OS could make sure that the next page
12866 after the divide instruction is also mapped. For item 2), the
12867 compiler could make sure that the divide instruction is not in
12868 the branch delay slot."
12869
12870 These processors have PRId values of 0x00004220 and 0x00004300 for
12871 the R4000 and 0x00004400, 0x00004500 and 0x00004600 for the R4400. */
12872
12873 const char *
12874 mips_output_division (const char *division, rtx *operands)
12875 {
12876 const char *s;
12877
12878 s = division;
12879 if (TARGET_FIX_R4000 || TARGET_FIX_R4400)
12880 {
12881 output_asm_insn (s, operands);
12882 s = "nop";
12883 }
12884 if (TARGET_CHECK_ZERO_DIV)
12885 {
12886 if (TARGET_MIPS16)
12887 {
12888 output_asm_insn (s, operands);
12889 s = "bnez\t%2,1f\n\tbreak\t7\n1:";
12890 }
12891 else if (GENERATE_DIVIDE_TRAPS)
12892 {
12893 /* Avoid long replay penalty on load miss by putting the trap before
12894 the divide. */
12895 if (TUNE_74K)
12896 output_asm_insn ("teq\t%2,%.,7", operands);
12897 else
12898 {
12899 output_asm_insn (s, operands);
12900 s = "teq\t%2,%.,7";
12901 }
12902 }
12903 else
12904 {
12905 output_asm_insn ("%(bne\t%2,%.,1f", operands);
12906 output_asm_insn (s, operands);
12907 s = "break\t7%)\n1:";
12908 }
12909 }
12910 return s;
12911 }
12912 \f
12913 /* Return true if IN_INSN is a multiply-add or multiply-subtract
12914 instruction and if OUT_INSN assigns to the accumulator operand. */
12915
12916 bool
12917 mips_linked_madd_p (rtx out_insn, rtx in_insn)
12918 {
12919 enum attr_accum_in accum_in;
12920 int accum_in_opnum;
12921 rtx accum_in_op;
12922
12923 if (recog_memoized (in_insn) < 0)
12924 return false;
12925
12926 accum_in = get_attr_accum_in (in_insn);
12927 if (accum_in == ACCUM_IN_NONE)
12928 return false;
12929
12930 accum_in_opnum = accum_in - ACCUM_IN_0;
12931
12932 extract_insn (in_insn);
12933 gcc_assert (accum_in_opnum < recog_data.n_operands);
12934 accum_in_op = recog_data.operand[accum_in_opnum];
12935
12936 return reg_set_p (accum_in_op, out_insn);
12937 }
12938
12939 /* True if the dependency between OUT_INSN and IN_INSN is on the store
12940 data rather than the address. We need this because the cprestore
12941 pattern is type "store", but is defined using an UNSPEC_VOLATILE,
12942 which causes the default routine to abort. We just return false
12943 for that case. */
12944
12945 bool
12946 mips_store_data_bypass_p (rtx out_insn, rtx in_insn)
12947 {
12948 if (GET_CODE (PATTERN (in_insn)) == UNSPEC_VOLATILE)
12949 return false;
12950
12951 return !store_data_bypass_p (out_insn, in_insn);
12952 }
12953 \f
12954
12955 /* Variables and flags used in scheduler hooks when tuning for
12956 Loongson 2E/2F. */
12957 static struct
12958 {
12959 /* Variables to support Loongson 2E/2F round-robin [F]ALU1/2 dispatch
12960 strategy. */
12961
12962 /* If true, then next ALU1/2 instruction will go to ALU1. */
12963 bool alu1_turn_p;
12964
12965 /* If true, then next FALU1/2 unstruction will go to FALU1. */
12966 bool falu1_turn_p;
12967
12968 /* Codes to query if [f]alu{1,2}_core units are subscribed or not. */
12969 int alu1_core_unit_code;
12970 int alu2_core_unit_code;
12971 int falu1_core_unit_code;
12972 int falu2_core_unit_code;
12973
12974 /* True if current cycle has a multi instruction.
12975 This flag is used in mips_ls2_dfa_post_advance_cycle. */
12976 bool cycle_has_multi_p;
12977
12978 /* Instructions to subscribe ls2_[f]alu{1,2}_turn_enabled units.
12979 These are used in mips_ls2_dfa_post_advance_cycle to initialize
12980 DFA state.
12981 E.g., when alu1_turn_enabled_insn is issued it makes next ALU1/2
12982 instruction to go ALU1. */
12983 rtx alu1_turn_enabled_insn;
12984 rtx alu2_turn_enabled_insn;
12985 rtx falu1_turn_enabled_insn;
12986 rtx falu2_turn_enabled_insn;
12987 } mips_ls2;
12988
12989 /* Implement TARGET_SCHED_ADJUST_COST. We assume that anti and output
12990 dependencies have no cost, except on the 20Kc where output-dependence
12991 is treated like input-dependence. */
12992
12993 static int
12994 mips_adjust_cost (rtx insn ATTRIBUTE_UNUSED, rtx link,
12995 rtx dep ATTRIBUTE_UNUSED, int cost)
12996 {
12997 if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT
12998 && TUNE_20KC)
12999 return cost;
13000 if (REG_NOTE_KIND (link) != 0)
13001 return 0;
13002 return cost;
13003 }
13004
13005 /* Return the number of instructions that can be issued per cycle. */
13006
13007 static int
13008 mips_issue_rate (void)
13009 {
13010 switch (mips_tune)
13011 {
13012 case PROCESSOR_74KC:
13013 case PROCESSOR_74KF2_1:
13014 case PROCESSOR_74KF1_1:
13015 case PROCESSOR_74KF3_2:
13016 /* The 74k is not strictly quad-issue cpu, but can be seen as one
13017 by the scheduler. It can issue 1 ALU, 1 AGEN and 2 FPU insns,
13018 but in reality only a maximum of 3 insns can be issued as
13019 floating-point loads and stores also require a slot in the
13020 AGEN pipe. */
13021 case PROCESSOR_R10000:
13022 /* All R10K Processors are quad-issue (being the first MIPS
13023 processors to support this feature). */
13024 return 4;
13025
13026 case PROCESSOR_20KC:
13027 case PROCESSOR_R4130:
13028 case PROCESSOR_R5400:
13029 case PROCESSOR_R5500:
13030 case PROCESSOR_R5900:
13031 case PROCESSOR_R7000:
13032 case PROCESSOR_R9000:
13033 case PROCESSOR_OCTEON:
13034 case PROCESSOR_OCTEON2:
13035 return 2;
13036
13037 case PROCESSOR_SB1:
13038 case PROCESSOR_SB1A:
13039 /* This is actually 4, but we get better performance if we claim 3.
13040 This is partly because of unwanted speculative code motion with the
13041 larger number, and partly because in most common cases we can't
13042 reach the theoretical max of 4. */
13043 return 3;
13044
13045 case PROCESSOR_LOONGSON_2E:
13046 case PROCESSOR_LOONGSON_2F:
13047 case PROCESSOR_LOONGSON_3A:
13048 return 4;
13049
13050 case PROCESSOR_XLP:
13051 return (reload_completed ? 4 : 3);
13052
13053 default:
13054 return 1;
13055 }
13056 }
13057
13058 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook for Loongson2. */
13059
13060 static void
13061 mips_ls2_init_dfa_post_cycle_insn (void)
13062 {
13063 start_sequence ();
13064 emit_insn (gen_ls2_alu1_turn_enabled_insn ());
13065 mips_ls2.alu1_turn_enabled_insn = get_insns ();
13066 end_sequence ();
13067
13068 start_sequence ();
13069 emit_insn (gen_ls2_alu2_turn_enabled_insn ());
13070 mips_ls2.alu2_turn_enabled_insn = get_insns ();
13071 end_sequence ();
13072
13073 start_sequence ();
13074 emit_insn (gen_ls2_falu1_turn_enabled_insn ());
13075 mips_ls2.falu1_turn_enabled_insn = get_insns ();
13076 end_sequence ();
13077
13078 start_sequence ();
13079 emit_insn (gen_ls2_falu2_turn_enabled_insn ());
13080 mips_ls2.falu2_turn_enabled_insn = get_insns ();
13081 end_sequence ();
13082
13083 mips_ls2.alu1_core_unit_code = get_cpu_unit_code ("ls2_alu1_core");
13084 mips_ls2.alu2_core_unit_code = get_cpu_unit_code ("ls2_alu2_core");
13085 mips_ls2.falu1_core_unit_code = get_cpu_unit_code ("ls2_falu1_core");
13086 mips_ls2.falu2_core_unit_code = get_cpu_unit_code ("ls2_falu2_core");
13087 }
13088
13089 /* Implement TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN hook.
13090 Init data used in mips_dfa_post_advance_cycle. */
13091
13092 static void
13093 mips_init_dfa_post_cycle_insn (void)
13094 {
13095 if (TUNE_LOONGSON_2EF)
13096 mips_ls2_init_dfa_post_cycle_insn ();
13097 }
13098
13099 /* Initialize STATE when scheduling for Loongson 2E/2F.
13100 Support round-robin dispatch scheme by enabling only one of
13101 ALU1/ALU2 and one of FALU1/FALU2 units for ALU1/2 and FALU1/2 instructions
13102 respectively. */
13103
13104 static void
13105 mips_ls2_dfa_post_advance_cycle (state_t state)
13106 {
13107 if (cpu_unit_reservation_p (state, mips_ls2.alu1_core_unit_code))
13108 {
13109 /* Though there are no non-pipelined ALU1 insns,
13110 we can get an instruction of type 'multi' before reload. */
13111 gcc_assert (mips_ls2.cycle_has_multi_p);
13112 mips_ls2.alu1_turn_p = false;
13113 }
13114
13115 mips_ls2.cycle_has_multi_p = false;
13116
13117 if (cpu_unit_reservation_p (state, mips_ls2.alu2_core_unit_code))
13118 /* We have a non-pipelined alu instruction in the core,
13119 adjust round-robin counter. */
13120 mips_ls2.alu1_turn_p = true;
13121
13122 if (mips_ls2.alu1_turn_p)
13123 {
13124 if (state_transition (state, mips_ls2.alu1_turn_enabled_insn) >= 0)
13125 gcc_unreachable ();
13126 }
13127 else
13128 {
13129 if (state_transition (state, mips_ls2.alu2_turn_enabled_insn) >= 0)
13130 gcc_unreachable ();
13131 }
13132
13133 if (cpu_unit_reservation_p (state, mips_ls2.falu1_core_unit_code))
13134 {
13135 /* There are no non-pipelined FALU1 insns. */
13136 gcc_unreachable ();
13137 mips_ls2.falu1_turn_p = false;
13138 }
13139
13140 if (cpu_unit_reservation_p (state, mips_ls2.falu2_core_unit_code))
13141 /* We have a non-pipelined falu instruction in the core,
13142 adjust round-robin counter. */
13143 mips_ls2.falu1_turn_p = true;
13144
13145 if (mips_ls2.falu1_turn_p)
13146 {
13147 if (state_transition (state, mips_ls2.falu1_turn_enabled_insn) >= 0)
13148 gcc_unreachable ();
13149 }
13150 else
13151 {
13152 if (state_transition (state, mips_ls2.falu2_turn_enabled_insn) >= 0)
13153 gcc_unreachable ();
13154 }
13155 }
13156
13157 /* Implement TARGET_SCHED_DFA_POST_ADVANCE_CYCLE.
13158 This hook is being called at the start of each cycle. */
13159
13160 static void
13161 mips_dfa_post_advance_cycle (void)
13162 {
13163 if (TUNE_LOONGSON_2EF)
13164 mips_ls2_dfa_post_advance_cycle (curr_state);
13165 }
13166
13167 /* Implement TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD. This should
13168 be as wide as the scheduling freedom in the DFA. */
13169
13170 static int
13171 mips_multipass_dfa_lookahead (void)
13172 {
13173 /* Can schedule up to 4 of the 6 function units in any one cycle. */
13174 if (TUNE_SB1)
13175 return 4;
13176
13177 if (TUNE_LOONGSON_2EF || TUNE_LOONGSON_3A)
13178 return 4;
13179
13180 if (TUNE_OCTEON)
13181 return 2;
13182
13183 return 0;
13184 }
13185 \f
13186 /* Remove the instruction at index LOWER from ready queue READY and
13187 reinsert it in front of the instruction at index HIGHER. LOWER must
13188 be <= HIGHER. */
13189
13190 static void
13191 mips_promote_ready (rtx *ready, int lower, int higher)
13192 {
13193 rtx new_head;
13194 int i;
13195
13196 new_head = ready[lower];
13197 for (i = lower; i < higher; i++)
13198 ready[i] = ready[i + 1];
13199 ready[i] = new_head;
13200 }
13201
13202 /* If the priority of the instruction at POS2 in the ready queue READY
13203 is within LIMIT units of that of the instruction at POS1, swap the
13204 instructions if POS2 is not already less than POS1. */
13205
13206 static void
13207 mips_maybe_swap_ready (rtx *ready, int pos1, int pos2, int limit)
13208 {
13209 if (pos1 < pos2
13210 && INSN_PRIORITY (ready[pos1]) + limit >= INSN_PRIORITY (ready[pos2]))
13211 {
13212 rtx temp;
13213
13214 temp = ready[pos1];
13215 ready[pos1] = ready[pos2];
13216 ready[pos2] = temp;
13217 }
13218 }
13219 \f
13220 /* Used by TUNE_MACC_CHAINS to record the last scheduled instruction
13221 that may clobber hi or lo. */
13222 static rtx mips_macc_chains_last_hilo;
13223
13224 /* A TUNE_MACC_CHAINS helper function. Record that instruction INSN has
13225 been scheduled, updating mips_macc_chains_last_hilo appropriately. */
13226
13227 static void
13228 mips_macc_chains_record (rtx insn)
13229 {
13230 if (get_attr_may_clobber_hilo (insn))
13231 mips_macc_chains_last_hilo = insn;
13232 }
13233
13234 /* A TUNE_MACC_CHAINS helper function. Search ready queue READY, which
13235 has NREADY elements, looking for a multiply-add or multiply-subtract
13236 instruction that is cumulative with mips_macc_chains_last_hilo.
13237 If there is one, promote it ahead of anything else that might
13238 clobber hi or lo. */
13239
13240 static void
13241 mips_macc_chains_reorder (rtx *ready, int nready)
13242 {
13243 int i, j;
13244
13245 if (mips_macc_chains_last_hilo != 0)
13246 for (i = nready - 1; i >= 0; i--)
13247 if (mips_linked_madd_p (mips_macc_chains_last_hilo, ready[i]))
13248 {
13249 for (j = nready - 1; j > i; j--)
13250 if (recog_memoized (ready[j]) >= 0
13251 && get_attr_may_clobber_hilo (ready[j]))
13252 {
13253 mips_promote_ready (ready, i, j);
13254 break;
13255 }
13256 break;
13257 }
13258 }
13259 \f
13260 /* The last instruction to be scheduled. */
13261 static rtx vr4130_last_insn;
13262
13263 /* A note_stores callback used by vr4130_true_reg_dependence_p. DATA
13264 points to an rtx that is initially an instruction. Nullify the rtx
13265 if the instruction uses the value of register X. */
13266
13267 static void
13268 vr4130_true_reg_dependence_p_1 (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
13269 void *data)
13270 {
13271 rtx *insn_ptr;
13272
13273 insn_ptr = (rtx *) data;
13274 if (REG_P (x)
13275 && *insn_ptr != 0
13276 && reg_referenced_p (x, PATTERN (*insn_ptr)))
13277 *insn_ptr = 0;
13278 }
13279
13280 /* Return true if there is true register dependence between vr4130_last_insn
13281 and INSN. */
13282
13283 static bool
13284 vr4130_true_reg_dependence_p (rtx insn)
13285 {
13286 note_stores (PATTERN (vr4130_last_insn),
13287 vr4130_true_reg_dependence_p_1, &insn);
13288 return insn == 0;
13289 }
13290
13291 /* A TUNE_MIPS4130 helper function. Given that INSN1 is at the head of
13292 the ready queue and that INSN2 is the instruction after it, return
13293 true if it is worth promoting INSN2 ahead of INSN1. Look for cases
13294 in which INSN1 and INSN2 can probably issue in parallel, but for
13295 which (INSN2, INSN1) should be less sensitive to instruction
13296 alignment than (INSN1, INSN2). See 4130.md for more details. */
13297
13298 static bool
13299 vr4130_swap_insns_p (rtx insn1, rtx insn2)
13300 {
13301 sd_iterator_def sd_it;
13302 dep_t dep;
13303
13304 /* Check for the following case:
13305
13306 1) there is some other instruction X with an anti dependence on INSN1;
13307 2) X has a higher priority than INSN2; and
13308 3) X is an arithmetic instruction (and thus has no unit restrictions).
13309
13310 If INSN1 is the last instruction blocking X, it would better to
13311 choose (INSN1, X) over (INSN2, INSN1). */
13312 FOR_EACH_DEP (insn1, SD_LIST_FORW, sd_it, dep)
13313 if (DEP_TYPE (dep) == REG_DEP_ANTI
13314 && INSN_PRIORITY (DEP_CON (dep)) > INSN_PRIORITY (insn2)
13315 && recog_memoized (DEP_CON (dep)) >= 0
13316 && get_attr_vr4130_class (DEP_CON (dep)) == VR4130_CLASS_ALU)
13317 return false;
13318
13319 if (vr4130_last_insn != 0
13320 && recog_memoized (insn1) >= 0
13321 && recog_memoized (insn2) >= 0)
13322 {
13323 /* See whether INSN1 and INSN2 use different execution units,
13324 or if they are both ALU-type instructions. If so, they can
13325 probably execute in parallel. */
13326 enum attr_vr4130_class class1 = get_attr_vr4130_class (insn1);
13327 enum attr_vr4130_class class2 = get_attr_vr4130_class (insn2);
13328 if (class1 != class2 || class1 == VR4130_CLASS_ALU)
13329 {
13330 /* If only one of the instructions has a dependence on
13331 vr4130_last_insn, prefer to schedule the other one first. */
13332 bool dep1_p = vr4130_true_reg_dependence_p (insn1);
13333 bool dep2_p = vr4130_true_reg_dependence_p (insn2);
13334 if (dep1_p != dep2_p)
13335 return dep1_p;
13336
13337 /* Prefer to schedule INSN2 ahead of INSN1 if vr4130_last_insn
13338 is not an ALU-type instruction and if INSN1 uses the same
13339 execution unit. (Note that if this condition holds, we already
13340 know that INSN2 uses a different execution unit.) */
13341 if (class1 != VR4130_CLASS_ALU
13342 && recog_memoized (vr4130_last_insn) >= 0
13343 && class1 == get_attr_vr4130_class (vr4130_last_insn))
13344 return true;
13345 }
13346 }
13347 return false;
13348 }
13349
13350 /* A TUNE_MIPS4130 helper function. (READY, NREADY) describes a ready
13351 queue with at least two instructions. Swap the first two if
13352 vr4130_swap_insns_p says that it could be worthwhile. */
13353
13354 static void
13355 vr4130_reorder (rtx *ready, int nready)
13356 {
13357 if (vr4130_swap_insns_p (ready[nready - 1], ready[nready - 2]))
13358 mips_promote_ready (ready, nready - 2, nready - 1);
13359 }
13360 \f
13361 /* Record whether last 74k AGEN instruction was a load or store. */
13362 static enum attr_type mips_last_74k_agen_insn = TYPE_UNKNOWN;
13363
13364 /* Initialize mips_last_74k_agen_insn from INSN. A null argument
13365 resets to TYPE_UNKNOWN state. */
13366
13367 static void
13368 mips_74k_agen_init (rtx insn)
13369 {
13370 if (!insn || CALL_P (insn) || JUMP_P (insn))
13371 mips_last_74k_agen_insn = TYPE_UNKNOWN;
13372 else
13373 {
13374 enum attr_type type = get_attr_type (insn);
13375 if (type == TYPE_LOAD || type == TYPE_STORE)
13376 mips_last_74k_agen_insn = type;
13377 }
13378 }
13379
13380 /* A TUNE_74K helper function. The 74K AGEN pipeline likes multiple
13381 loads to be grouped together, and multiple stores to be grouped
13382 together. Swap things around in the ready queue to make this happen. */
13383
13384 static void
13385 mips_74k_agen_reorder (rtx *ready, int nready)
13386 {
13387 int i;
13388 int store_pos, load_pos;
13389
13390 store_pos = -1;
13391 load_pos = -1;
13392
13393 for (i = nready - 1; i >= 0; i--)
13394 {
13395 rtx insn = ready[i];
13396 if (USEFUL_INSN_P (insn))
13397 switch (get_attr_type (insn))
13398 {
13399 case TYPE_STORE:
13400 if (store_pos == -1)
13401 store_pos = i;
13402 break;
13403
13404 case TYPE_LOAD:
13405 if (load_pos == -1)
13406 load_pos = i;
13407 break;
13408
13409 default:
13410 break;
13411 }
13412 }
13413
13414 if (load_pos == -1 || store_pos == -1)
13415 return;
13416
13417 switch (mips_last_74k_agen_insn)
13418 {
13419 case TYPE_UNKNOWN:
13420 /* Prefer to schedule loads since they have a higher latency. */
13421 case TYPE_LOAD:
13422 /* Swap loads to the front of the queue. */
13423 mips_maybe_swap_ready (ready, load_pos, store_pos, 4);
13424 break;
13425 case TYPE_STORE:
13426 /* Swap stores to the front of the queue. */
13427 mips_maybe_swap_ready (ready, store_pos, load_pos, 4);
13428 break;
13429 default:
13430 break;
13431 }
13432 }
13433 \f
13434 /* Implement TARGET_SCHED_INIT. */
13435
13436 static void
13437 mips_sched_init (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13438 int max_ready ATTRIBUTE_UNUSED)
13439 {
13440 mips_macc_chains_last_hilo = 0;
13441 vr4130_last_insn = 0;
13442 mips_74k_agen_init (NULL_RTX);
13443
13444 /* When scheduling for Loongson2, branch instructions go to ALU1,
13445 therefore basic block is most likely to start with round-robin counter
13446 pointed to ALU2. */
13447 mips_ls2.alu1_turn_p = false;
13448 mips_ls2.falu1_turn_p = true;
13449 }
13450
13451 /* Subroutine used by TARGET_SCHED_REORDER and TARGET_SCHED_REORDER2. */
13452
13453 static void
13454 mips_sched_reorder_1 (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13455 rtx *ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13456 {
13457 if (!reload_completed
13458 && TUNE_MACC_CHAINS
13459 && *nreadyp > 0)
13460 mips_macc_chains_reorder (ready, *nreadyp);
13461
13462 if (reload_completed
13463 && TUNE_MIPS4130
13464 && !TARGET_VR4130_ALIGN
13465 && *nreadyp > 1)
13466 vr4130_reorder (ready, *nreadyp);
13467
13468 if (TUNE_74K)
13469 mips_74k_agen_reorder (ready, *nreadyp);
13470 }
13471
13472 /* Implement TARGET_SCHED_REORDER. */
13473
13474 static int
13475 mips_sched_reorder (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13476 rtx *ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13477 {
13478 mips_sched_reorder_1 (file, verbose, ready, nreadyp, cycle);
13479 return mips_issue_rate ();
13480 }
13481
13482 /* Implement TARGET_SCHED_REORDER2. */
13483
13484 static int
13485 mips_sched_reorder2 (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13486 rtx *ready, int *nreadyp, int cycle ATTRIBUTE_UNUSED)
13487 {
13488 mips_sched_reorder_1 (file, verbose, ready, nreadyp, cycle);
13489 return cached_can_issue_more;
13490 }
13491
13492 /* Update round-robin counters for ALU1/2 and FALU1/2. */
13493
13494 static void
13495 mips_ls2_variable_issue (rtx insn)
13496 {
13497 if (mips_ls2.alu1_turn_p)
13498 {
13499 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu1_core_unit_code))
13500 mips_ls2.alu1_turn_p = false;
13501 }
13502 else
13503 {
13504 if (cpu_unit_reservation_p (curr_state, mips_ls2.alu2_core_unit_code))
13505 mips_ls2.alu1_turn_p = true;
13506 }
13507
13508 if (mips_ls2.falu1_turn_p)
13509 {
13510 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu1_core_unit_code))
13511 mips_ls2.falu1_turn_p = false;
13512 }
13513 else
13514 {
13515 if (cpu_unit_reservation_p (curr_state, mips_ls2.falu2_core_unit_code))
13516 mips_ls2.falu1_turn_p = true;
13517 }
13518
13519 if (recog_memoized (insn) >= 0)
13520 mips_ls2.cycle_has_multi_p |= (get_attr_type (insn) == TYPE_MULTI);
13521 }
13522
13523 /* Implement TARGET_SCHED_VARIABLE_ISSUE. */
13524
13525 static int
13526 mips_variable_issue (FILE *file ATTRIBUTE_UNUSED, int verbose ATTRIBUTE_UNUSED,
13527 rtx insn, int more)
13528 {
13529 /* Ignore USEs and CLOBBERs; don't count them against the issue rate. */
13530 if (USEFUL_INSN_P (insn))
13531 {
13532 if (get_attr_type (insn) != TYPE_GHOST)
13533 more--;
13534 if (!reload_completed && TUNE_MACC_CHAINS)
13535 mips_macc_chains_record (insn);
13536 vr4130_last_insn = insn;
13537 if (TUNE_74K)
13538 mips_74k_agen_init (insn);
13539 else if (TUNE_LOONGSON_2EF)
13540 mips_ls2_variable_issue (insn);
13541 }
13542
13543 /* Instructions of type 'multi' should all be split before
13544 the second scheduling pass. */
13545 gcc_assert (!reload_completed
13546 || recog_memoized (insn) < 0
13547 || get_attr_type (insn) != TYPE_MULTI);
13548
13549 cached_can_issue_more = more;
13550 return more;
13551 }
13552 \f
13553 /* Given that we have an rtx of the form (prefetch ... WRITE LOCALITY),
13554 return the first operand of the associated PREF or PREFX insn. */
13555
13556 rtx
13557 mips_prefetch_cookie (rtx write, rtx locality)
13558 {
13559 /* store_streamed / load_streamed. */
13560 if (INTVAL (locality) <= 0)
13561 return GEN_INT (INTVAL (write) + 4);
13562
13563 /* store / load. */
13564 if (INTVAL (locality) <= 2)
13565 return write;
13566
13567 /* store_retained / load_retained. */
13568 return GEN_INT (INTVAL (write) + 6);
13569 }
13570 \f
13571 /* Flags that indicate when a built-in function is available.
13572
13573 BUILTIN_AVAIL_NON_MIPS16
13574 The function is available on the current target, but only
13575 in non-MIPS16 mode. */
13576 #define BUILTIN_AVAIL_NON_MIPS16 1
13577
13578 /* Declare an availability predicate for built-in functions that
13579 require non-MIPS16 mode and also require COND to be true.
13580 NAME is the main part of the predicate's name. */
13581 #define AVAIL_NON_MIPS16(NAME, COND) \
13582 static unsigned int \
13583 mips_builtin_avail_##NAME (void) \
13584 { \
13585 return (COND) ? BUILTIN_AVAIL_NON_MIPS16 : 0; \
13586 }
13587
13588 /* This structure describes a single built-in function. */
13589 struct mips_builtin_description {
13590 /* The code of the main .md file instruction. See mips_builtin_type
13591 for more information. */
13592 enum insn_code icode;
13593
13594 /* The floating-point comparison code to use with ICODE, if any. */
13595 enum mips_fp_condition cond;
13596
13597 /* The name of the built-in function. */
13598 const char *name;
13599
13600 /* Specifies how the function should be expanded. */
13601 enum mips_builtin_type builtin_type;
13602
13603 /* The function's prototype. */
13604 enum mips_function_type function_type;
13605
13606 /* Whether the function is available. */
13607 unsigned int (*avail) (void);
13608 };
13609
13610 AVAIL_NON_MIPS16 (paired_single, TARGET_PAIRED_SINGLE_FLOAT)
13611 AVAIL_NON_MIPS16 (sb1_paired_single, TARGET_SB1 && TARGET_PAIRED_SINGLE_FLOAT)
13612 AVAIL_NON_MIPS16 (mips3d, TARGET_MIPS3D)
13613 AVAIL_NON_MIPS16 (dsp, TARGET_DSP)
13614 AVAIL_NON_MIPS16 (dspr2, TARGET_DSPR2)
13615 AVAIL_NON_MIPS16 (dsp_32, !TARGET_64BIT && TARGET_DSP)
13616 AVAIL_NON_MIPS16 (dsp_64, TARGET_64BIT && TARGET_DSP)
13617 AVAIL_NON_MIPS16 (dspr2_32, !TARGET_64BIT && TARGET_DSPR2)
13618 AVAIL_NON_MIPS16 (loongson, TARGET_LOONGSON_VECTORS)
13619 AVAIL_NON_MIPS16 (cache, TARGET_CACHE_BUILTIN)
13620
13621 /* Construct a mips_builtin_description from the given arguments.
13622
13623 INSN is the name of the associated instruction pattern, without the
13624 leading CODE_FOR_mips_.
13625
13626 CODE is the floating-point condition code associated with the
13627 function. It can be 'f' if the field is not applicable.
13628
13629 NAME is the name of the function itself, without the leading
13630 "__builtin_mips_".
13631
13632 BUILTIN_TYPE and FUNCTION_TYPE are mips_builtin_description fields.
13633
13634 AVAIL is the name of the availability predicate, without the leading
13635 mips_builtin_avail_. */
13636 #define MIPS_BUILTIN(INSN, COND, NAME, BUILTIN_TYPE, \
13637 FUNCTION_TYPE, AVAIL) \
13638 { CODE_FOR_mips_ ## INSN, MIPS_FP_COND_ ## COND, \
13639 "__builtin_mips_" NAME, BUILTIN_TYPE, FUNCTION_TYPE, \
13640 mips_builtin_avail_ ## AVAIL }
13641
13642 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT function
13643 mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE and AVAIL
13644 are as for MIPS_BUILTIN. */
13645 #define DIRECT_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
13646 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT, FUNCTION_TYPE, AVAIL)
13647
13648 /* Define __builtin_mips_<INSN>_<COND>_{s,d} functions, both of which
13649 are subject to mips_builtin_avail_<AVAIL>. */
13650 #define CMP_SCALAR_BUILTINS(INSN, COND, AVAIL) \
13651 MIPS_BUILTIN (INSN ## _cond_s, COND, #INSN "_" #COND "_s", \
13652 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_SF_SF, AVAIL), \
13653 MIPS_BUILTIN (INSN ## _cond_d, COND, #INSN "_" #COND "_d", \
13654 MIPS_BUILTIN_CMP_SINGLE, MIPS_INT_FTYPE_DF_DF, AVAIL)
13655
13656 /* Define __builtin_mips_{any,all,upper,lower}_<INSN>_<COND>_ps.
13657 The lower and upper forms are subject to mips_builtin_avail_<AVAIL>
13658 while the any and all forms are subject to mips_builtin_avail_mips3d. */
13659 #define CMP_PS_BUILTINS(INSN, COND, AVAIL) \
13660 MIPS_BUILTIN (INSN ## _cond_ps, COND, "any_" #INSN "_" #COND "_ps", \
13661 MIPS_BUILTIN_CMP_ANY, MIPS_INT_FTYPE_V2SF_V2SF, \
13662 mips3d), \
13663 MIPS_BUILTIN (INSN ## _cond_ps, COND, "all_" #INSN "_" #COND "_ps", \
13664 MIPS_BUILTIN_CMP_ALL, MIPS_INT_FTYPE_V2SF_V2SF, \
13665 mips3d), \
13666 MIPS_BUILTIN (INSN ## _cond_ps, COND, "lower_" #INSN "_" #COND "_ps", \
13667 MIPS_BUILTIN_CMP_LOWER, MIPS_INT_FTYPE_V2SF_V2SF, \
13668 AVAIL), \
13669 MIPS_BUILTIN (INSN ## _cond_ps, COND, "upper_" #INSN "_" #COND "_ps", \
13670 MIPS_BUILTIN_CMP_UPPER, MIPS_INT_FTYPE_V2SF_V2SF, \
13671 AVAIL)
13672
13673 /* Define __builtin_mips_{any,all}_<INSN>_<COND>_4s. The functions
13674 are subject to mips_builtin_avail_mips3d. */
13675 #define CMP_4S_BUILTINS(INSN, COND) \
13676 MIPS_BUILTIN (INSN ## _cond_4s, COND, "any_" #INSN "_" #COND "_4s", \
13677 MIPS_BUILTIN_CMP_ANY, \
13678 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d), \
13679 MIPS_BUILTIN (INSN ## _cond_4s, COND, "all_" #INSN "_" #COND "_4s", \
13680 MIPS_BUILTIN_CMP_ALL, \
13681 MIPS_INT_FTYPE_V2SF_V2SF_V2SF_V2SF, mips3d)
13682
13683 /* Define __builtin_mips_mov{t,f}_<INSN>_<COND>_ps. The comparison
13684 instruction requires mips_builtin_avail_<AVAIL>. */
13685 #define MOVTF_BUILTINS(INSN, COND, AVAIL) \
13686 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movt_" #INSN "_" #COND "_ps", \
13687 MIPS_BUILTIN_MOVT, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
13688 AVAIL), \
13689 MIPS_BUILTIN (INSN ## _cond_ps, COND, "movf_" #INSN "_" #COND "_ps", \
13690 MIPS_BUILTIN_MOVF, MIPS_V2SF_FTYPE_V2SF_V2SF_V2SF_V2SF, \
13691 AVAIL)
13692
13693 /* Define all the built-in functions related to C.cond.fmt condition COND. */
13694 #define CMP_BUILTINS(COND) \
13695 MOVTF_BUILTINS (c, COND, paired_single), \
13696 MOVTF_BUILTINS (cabs, COND, mips3d), \
13697 CMP_SCALAR_BUILTINS (cabs, COND, mips3d), \
13698 CMP_PS_BUILTINS (c, COND, paired_single), \
13699 CMP_PS_BUILTINS (cabs, COND, mips3d), \
13700 CMP_4S_BUILTINS (c, COND), \
13701 CMP_4S_BUILTINS (cabs, COND)
13702
13703 /* Define __builtin_mips_<INSN>, which is a MIPS_BUILTIN_DIRECT_NO_TARGET
13704 function mapped to instruction CODE_FOR_mips_<INSN>, FUNCTION_TYPE
13705 and AVAIL are as for MIPS_BUILTIN. */
13706 #define DIRECT_NO_TARGET_BUILTIN(INSN, FUNCTION_TYPE, AVAIL) \
13707 MIPS_BUILTIN (INSN, f, #INSN, MIPS_BUILTIN_DIRECT_NO_TARGET, \
13708 FUNCTION_TYPE, AVAIL)
13709
13710 /* Define __builtin_mips_bposge<VALUE>. <VALUE> is 32 for the MIPS32 DSP
13711 branch instruction. AVAIL is as for MIPS_BUILTIN. */
13712 #define BPOSGE_BUILTIN(VALUE, AVAIL) \
13713 MIPS_BUILTIN (bposge, f, "bposge" #VALUE, \
13714 MIPS_BUILTIN_BPOSGE ## VALUE, MIPS_SI_FTYPE_VOID, AVAIL)
13715
13716 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<FN_NAME>
13717 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
13718 builtin_description field. */
13719 #define LOONGSON_BUILTIN_ALIAS(INSN, FN_NAME, FUNCTION_TYPE) \
13720 { CODE_FOR_loongson_ ## INSN, MIPS_FP_COND_f, \
13721 "__builtin_loongson_" #FN_NAME, MIPS_BUILTIN_DIRECT, \
13722 FUNCTION_TYPE, mips_builtin_avail_loongson }
13723
13724 /* Define a Loongson MIPS_BUILTIN_DIRECT function __builtin_loongson_<INSN>
13725 for instruction CODE_FOR_loongson_<INSN>. FUNCTION_TYPE is a
13726 builtin_description field. */
13727 #define LOONGSON_BUILTIN(INSN, FUNCTION_TYPE) \
13728 LOONGSON_BUILTIN_ALIAS (INSN, INSN, FUNCTION_TYPE)
13729
13730 /* Like LOONGSON_BUILTIN, but add _<SUFFIX> to the end of the function name.
13731 We use functions of this form when the same insn can be usefully applied
13732 to more than one datatype. */
13733 #define LOONGSON_BUILTIN_SUFFIX(INSN, SUFFIX, FUNCTION_TYPE) \
13734 LOONGSON_BUILTIN_ALIAS (INSN, INSN ## _ ## SUFFIX, FUNCTION_TYPE)
13735
13736 #define CODE_FOR_mips_sqrt_ps CODE_FOR_sqrtv2sf2
13737 #define CODE_FOR_mips_addq_ph CODE_FOR_addv2hi3
13738 #define CODE_FOR_mips_addu_qb CODE_FOR_addv4qi3
13739 #define CODE_FOR_mips_subq_ph CODE_FOR_subv2hi3
13740 #define CODE_FOR_mips_subu_qb CODE_FOR_subv4qi3
13741 #define CODE_FOR_mips_mul_ph CODE_FOR_mulv2hi3
13742 #define CODE_FOR_mips_mult CODE_FOR_mulsidi3_32bit
13743 #define CODE_FOR_mips_multu CODE_FOR_umulsidi3_32bit
13744
13745 #define CODE_FOR_loongson_packsswh CODE_FOR_vec_pack_ssat_v2si
13746 #define CODE_FOR_loongson_packsshb CODE_FOR_vec_pack_ssat_v4hi
13747 #define CODE_FOR_loongson_packushb CODE_FOR_vec_pack_usat_v4hi
13748 #define CODE_FOR_loongson_paddw CODE_FOR_addv2si3
13749 #define CODE_FOR_loongson_paddh CODE_FOR_addv4hi3
13750 #define CODE_FOR_loongson_paddb CODE_FOR_addv8qi3
13751 #define CODE_FOR_loongson_paddsh CODE_FOR_ssaddv4hi3
13752 #define CODE_FOR_loongson_paddsb CODE_FOR_ssaddv8qi3
13753 #define CODE_FOR_loongson_paddush CODE_FOR_usaddv4hi3
13754 #define CODE_FOR_loongson_paddusb CODE_FOR_usaddv8qi3
13755 #define CODE_FOR_loongson_pmaxsh CODE_FOR_smaxv4hi3
13756 #define CODE_FOR_loongson_pmaxub CODE_FOR_umaxv8qi3
13757 #define CODE_FOR_loongson_pminsh CODE_FOR_sminv4hi3
13758 #define CODE_FOR_loongson_pminub CODE_FOR_uminv8qi3
13759 #define CODE_FOR_loongson_pmulhuh CODE_FOR_umulv4hi3_highpart
13760 #define CODE_FOR_loongson_pmulhh CODE_FOR_smulv4hi3_highpart
13761 #define CODE_FOR_loongson_pmullh CODE_FOR_mulv4hi3
13762 #define CODE_FOR_loongson_psllh CODE_FOR_ashlv4hi3
13763 #define CODE_FOR_loongson_psllw CODE_FOR_ashlv2si3
13764 #define CODE_FOR_loongson_psrlh CODE_FOR_lshrv4hi3
13765 #define CODE_FOR_loongson_psrlw CODE_FOR_lshrv2si3
13766 #define CODE_FOR_loongson_psrah CODE_FOR_ashrv4hi3
13767 #define CODE_FOR_loongson_psraw CODE_FOR_ashrv2si3
13768 #define CODE_FOR_loongson_psubw CODE_FOR_subv2si3
13769 #define CODE_FOR_loongson_psubh CODE_FOR_subv4hi3
13770 #define CODE_FOR_loongson_psubb CODE_FOR_subv8qi3
13771 #define CODE_FOR_loongson_psubsh CODE_FOR_sssubv4hi3
13772 #define CODE_FOR_loongson_psubsb CODE_FOR_sssubv8qi3
13773 #define CODE_FOR_loongson_psubush CODE_FOR_ussubv4hi3
13774 #define CODE_FOR_loongson_psubusb CODE_FOR_ussubv8qi3
13775
13776 static const struct mips_builtin_description mips_builtins[] = {
13777 DIRECT_BUILTIN (pll_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13778 DIRECT_BUILTIN (pul_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13779 DIRECT_BUILTIN (plu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13780 DIRECT_BUILTIN (puu_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, paired_single),
13781 DIRECT_BUILTIN (cvt_ps_s, MIPS_V2SF_FTYPE_SF_SF, paired_single),
13782 DIRECT_BUILTIN (cvt_s_pl, MIPS_SF_FTYPE_V2SF, paired_single),
13783 DIRECT_BUILTIN (cvt_s_pu, MIPS_SF_FTYPE_V2SF, paired_single),
13784 DIRECT_BUILTIN (abs_ps, MIPS_V2SF_FTYPE_V2SF, paired_single),
13785
13786 DIRECT_BUILTIN (alnv_ps, MIPS_V2SF_FTYPE_V2SF_V2SF_INT, paired_single),
13787 DIRECT_BUILTIN (addr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13788 DIRECT_BUILTIN (mulr_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13789 DIRECT_BUILTIN (cvt_pw_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13790 DIRECT_BUILTIN (cvt_ps_pw, MIPS_V2SF_FTYPE_V2SF, mips3d),
13791
13792 DIRECT_BUILTIN (recip1_s, MIPS_SF_FTYPE_SF, mips3d),
13793 DIRECT_BUILTIN (recip1_d, MIPS_DF_FTYPE_DF, mips3d),
13794 DIRECT_BUILTIN (recip1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13795 DIRECT_BUILTIN (recip2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
13796 DIRECT_BUILTIN (recip2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
13797 DIRECT_BUILTIN (recip2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13798
13799 DIRECT_BUILTIN (rsqrt1_s, MIPS_SF_FTYPE_SF, mips3d),
13800 DIRECT_BUILTIN (rsqrt1_d, MIPS_DF_FTYPE_DF, mips3d),
13801 DIRECT_BUILTIN (rsqrt1_ps, MIPS_V2SF_FTYPE_V2SF, mips3d),
13802 DIRECT_BUILTIN (rsqrt2_s, MIPS_SF_FTYPE_SF_SF, mips3d),
13803 DIRECT_BUILTIN (rsqrt2_d, MIPS_DF_FTYPE_DF_DF, mips3d),
13804 DIRECT_BUILTIN (rsqrt2_ps, MIPS_V2SF_FTYPE_V2SF_V2SF, mips3d),
13805
13806 MIPS_FP_CONDITIONS (CMP_BUILTINS),
13807
13808 /* Built-in functions for the SB-1 processor. */
13809 DIRECT_BUILTIN (sqrt_ps, MIPS_V2SF_FTYPE_V2SF, sb1_paired_single),
13810
13811 /* Built-in functions for the DSP ASE (32-bit and 64-bit). */
13812 DIRECT_BUILTIN (addq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13813 DIRECT_BUILTIN (addq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13814 DIRECT_BUILTIN (addq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
13815 DIRECT_BUILTIN (addu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13816 DIRECT_BUILTIN (addu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13817 DIRECT_BUILTIN (subq_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13818 DIRECT_BUILTIN (subq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13819 DIRECT_BUILTIN (subq_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
13820 DIRECT_BUILTIN (subu_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13821 DIRECT_BUILTIN (subu_s_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13822 DIRECT_BUILTIN (addsc, MIPS_SI_FTYPE_SI_SI, dsp),
13823 DIRECT_BUILTIN (addwc, MIPS_SI_FTYPE_SI_SI, dsp),
13824 DIRECT_BUILTIN (modsub, MIPS_SI_FTYPE_SI_SI, dsp),
13825 DIRECT_BUILTIN (raddu_w_qb, MIPS_SI_FTYPE_V4QI, dsp),
13826 DIRECT_BUILTIN (absq_s_ph, MIPS_V2HI_FTYPE_V2HI, dsp),
13827 DIRECT_BUILTIN (absq_s_w, MIPS_SI_FTYPE_SI, dsp),
13828 DIRECT_BUILTIN (precrq_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
13829 DIRECT_BUILTIN (precrq_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
13830 DIRECT_BUILTIN (precrq_rs_ph_w, MIPS_V2HI_FTYPE_SI_SI, dsp),
13831 DIRECT_BUILTIN (precrqu_s_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dsp),
13832 DIRECT_BUILTIN (preceq_w_phl, MIPS_SI_FTYPE_V2HI, dsp),
13833 DIRECT_BUILTIN (preceq_w_phr, MIPS_SI_FTYPE_V2HI, dsp),
13834 DIRECT_BUILTIN (precequ_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
13835 DIRECT_BUILTIN (precequ_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
13836 DIRECT_BUILTIN (precequ_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
13837 DIRECT_BUILTIN (precequ_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
13838 DIRECT_BUILTIN (preceu_ph_qbl, MIPS_V2HI_FTYPE_V4QI, dsp),
13839 DIRECT_BUILTIN (preceu_ph_qbr, MIPS_V2HI_FTYPE_V4QI, dsp),
13840 DIRECT_BUILTIN (preceu_ph_qbla, MIPS_V2HI_FTYPE_V4QI, dsp),
13841 DIRECT_BUILTIN (preceu_ph_qbra, MIPS_V2HI_FTYPE_V4QI, dsp),
13842 DIRECT_BUILTIN (shll_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
13843 DIRECT_BUILTIN (shll_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
13844 DIRECT_BUILTIN (shll_s_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
13845 DIRECT_BUILTIN (shll_s_w, MIPS_SI_FTYPE_SI_SI, dsp),
13846 DIRECT_BUILTIN (shrl_qb, MIPS_V4QI_FTYPE_V4QI_SI, dsp),
13847 DIRECT_BUILTIN (shra_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
13848 DIRECT_BUILTIN (shra_r_ph, MIPS_V2HI_FTYPE_V2HI_SI, dsp),
13849 DIRECT_BUILTIN (shra_r_w, MIPS_SI_FTYPE_SI_SI, dsp),
13850 DIRECT_BUILTIN (muleu_s_ph_qbl, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
13851 DIRECT_BUILTIN (muleu_s_ph_qbr, MIPS_V2HI_FTYPE_V4QI_V2HI, dsp),
13852 DIRECT_BUILTIN (mulq_rs_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13853 DIRECT_BUILTIN (muleq_s_w_phl, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
13854 DIRECT_BUILTIN (muleq_s_w_phr, MIPS_SI_FTYPE_V2HI_V2HI, dsp),
13855 DIRECT_BUILTIN (bitrev, MIPS_SI_FTYPE_SI, dsp),
13856 DIRECT_BUILTIN (insv, MIPS_SI_FTYPE_SI_SI, dsp),
13857 DIRECT_BUILTIN (repl_qb, MIPS_V4QI_FTYPE_SI, dsp),
13858 DIRECT_BUILTIN (repl_ph, MIPS_V2HI_FTYPE_SI, dsp),
13859 DIRECT_NO_TARGET_BUILTIN (cmpu_eq_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
13860 DIRECT_NO_TARGET_BUILTIN (cmpu_lt_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
13861 DIRECT_NO_TARGET_BUILTIN (cmpu_le_qb, MIPS_VOID_FTYPE_V4QI_V4QI, dsp),
13862 DIRECT_BUILTIN (cmpgu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
13863 DIRECT_BUILTIN (cmpgu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
13864 DIRECT_BUILTIN (cmpgu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dsp),
13865 DIRECT_NO_TARGET_BUILTIN (cmp_eq_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
13866 DIRECT_NO_TARGET_BUILTIN (cmp_lt_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
13867 DIRECT_NO_TARGET_BUILTIN (cmp_le_ph, MIPS_VOID_FTYPE_V2HI_V2HI, dsp),
13868 DIRECT_BUILTIN (pick_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dsp),
13869 DIRECT_BUILTIN (pick_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13870 DIRECT_BUILTIN (packrl_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dsp),
13871 DIRECT_NO_TARGET_BUILTIN (wrdsp, MIPS_VOID_FTYPE_SI_SI, dsp),
13872 DIRECT_BUILTIN (rddsp, MIPS_SI_FTYPE_SI, dsp),
13873 DIRECT_BUILTIN (lbux, MIPS_SI_FTYPE_POINTER_SI, dsp),
13874 DIRECT_BUILTIN (lhx, MIPS_SI_FTYPE_POINTER_SI, dsp),
13875 DIRECT_BUILTIN (lwx, MIPS_SI_FTYPE_POINTER_SI, dsp),
13876 BPOSGE_BUILTIN (32, dsp),
13877
13878 /* The following are for the MIPS DSP ASE REV 2 (32-bit and 64-bit). */
13879 DIRECT_BUILTIN (absq_s_qb, MIPS_V4QI_FTYPE_V4QI, dspr2),
13880 DIRECT_BUILTIN (addu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13881 DIRECT_BUILTIN (addu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13882 DIRECT_BUILTIN (adduh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
13883 DIRECT_BUILTIN (adduh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
13884 DIRECT_BUILTIN (append, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
13885 DIRECT_BUILTIN (balign, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
13886 DIRECT_BUILTIN (cmpgdu_eq_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
13887 DIRECT_BUILTIN (cmpgdu_lt_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
13888 DIRECT_BUILTIN (cmpgdu_le_qb, MIPS_SI_FTYPE_V4QI_V4QI, dspr2),
13889 DIRECT_BUILTIN (mul_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13890 DIRECT_BUILTIN (mul_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13891 DIRECT_BUILTIN (mulq_rs_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13892 DIRECT_BUILTIN (mulq_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13893 DIRECT_BUILTIN (mulq_s_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13894 DIRECT_BUILTIN (precr_qb_ph, MIPS_V4QI_FTYPE_V2HI_V2HI, dspr2),
13895 DIRECT_BUILTIN (precr_sra_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
13896 DIRECT_BUILTIN (precr_sra_r_ph_w, MIPS_V2HI_FTYPE_SI_SI_SI, dspr2),
13897 DIRECT_BUILTIN (prepend, MIPS_SI_FTYPE_SI_SI_SI, dspr2),
13898 DIRECT_BUILTIN (shra_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
13899 DIRECT_BUILTIN (shra_r_qb, MIPS_V4QI_FTYPE_V4QI_SI, dspr2),
13900 DIRECT_BUILTIN (shrl_ph, MIPS_V2HI_FTYPE_V2HI_SI, dspr2),
13901 DIRECT_BUILTIN (subu_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13902 DIRECT_BUILTIN (subu_s_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13903 DIRECT_BUILTIN (subuh_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
13904 DIRECT_BUILTIN (subuh_r_qb, MIPS_V4QI_FTYPE_V4QI_V4QI, dspr2),
13905 DIRECT_BUILTIN (addqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13906 DIRECT_BUILTIN (addqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13907 DIRECT_BUILTIN (addqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13908 DIRECT_BUILTIN (addqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13909 DIRECT_BUILTIN (subqh_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13910 DIRECT_BUILTIN (subqh_r_ph, MIPS_V2HI_FTYPE_V2HI_V2HI, dspr2),
13911 DIRECT_BUILTIN (subqh_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13912 DIRECT_BUILTIN (subqh_r_w, MIPS_SI_FTYPE_SI_SI, dspr2),
13913
13914 /* Built-in functions for the DSP ASE (32-bit only). */
13915 DIRECT_BUILTIN (dpau_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
13916 DIRECT_BUILTIN (dpau_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
13917 DIRECT_BUILTIN (dpsu_h_qbl, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
13918 DIRECT_BUILTIN (dpsu_h_qbr, MIPS_DI_FTYPE_DI_V4QI_V4QI, dsp_32),
13919 DIRECT_BUILTIN (dpaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13920 DIRECT_BUILTIN (dpsq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13921 DIRECT_BUILTIN (mulsaq_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13922 DIRECT_BUILTIN (dpaq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
13923 DIRECT_BUILTIN (dpsq_sa_l_w, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
13924 DIRECT_BUILTIN (maq_s_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13925 DIRECT_BUILTIN (maq_s_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13926 DIRECT_BUILTIN (maq_sa_w_phl, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13927 DIRECT_BUILTIN (maq_sa_w_phr, MIPS_DI_FTYPE_DI_V2HI_V2HI, dsp_32),
13928 DIRECT_BUILTIN (extr_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
13929 DIRECT_BUILTIN (extr_r_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
13930 DIRECT_BUILTIN (extr_rs_w, MIPS_SI_FTYPE_DI_SI, dsp_32),
13931 DIRECT_BUILTIN (extr_s_h, MIPS_SI_FTYPE_DI_SI, dsp_32),
13932 DIRECT_BUILTIN (extp, MIPS_SI_FTYPE_DI_SI, dsp_32),
13933 DIRECT_BUILTIN (extpdp, MIPS_SI_FTYPE_DI_SI, dsp_32),
13934 DIRECT_BUILTIN (shilo, MIPS_DI_FTYPE_DI_SI, dsp_32),
13935 DIRECT_BUILTIN (mthlip, MIPS_DI_FTYPE_DI_SI, dsp_32),
13936 DIRECT_BUILTIN (madd, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
13937 DIRECT_BUILTIN (maddu, MIPS_DI_FTYPE_DI_USI_USI, dsp_32),
13938 DIRECT_BUILTIN (msub, MIPS_DI_FTYPE_DI_SI_SI, dsp_32),
13939 DIRECT_BUILTIN (msubu, MIPS_DI_FTYPE_DI_USI_USI, dsp_32),
13940 DIRECT_BUILTIN (mult, MIPS_DI_FTYPE_SI_SI, dsp_32),
13941 DIRECT_BUILTIN (multu, MIPS_DI_FTYPE_USI_USI, dsp_32),
13942
13943 /* Built-in functions for the DSP ASE (64-bit only). */
13944 DIRECT_BUILTIN (ldx, MIPS_DI_FTYPE_POINTER_SI, dsp_64),
13945
13946 /* The following are for the MIPS DSP ASE REV 2 (32-bit only). */
13947 DIRECT_BUILTIN (dpa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13948 DIRECT_BUILTIN (dps_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13949 DIRECT_BUILTIN (mulsa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13950 DIRECT_BUILTIN (dpax_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13951 DIRECT_BUILTIN (dpsx_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13952 DIRECT_BUILTIN (dpaqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13953 DIRECT_BUILTIN (dpaqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13954 DIRECT_BUILTIN (dpsqx_s_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13955 DIRECT_BUILTIN (dpsqx_sa_w_ph, MIPS_DI_FTYPE_DI_V2HI_V2HI, dspr2_32),
13956
13957 /* Builtin functions for ST Microelectronics Loongson-2E/2F cores. */
13958 LOONGSON_BUILTIN (packsswh, MIPS_V4HI_FTYPE_V2SI_V2SI),
13959 LOONGSON_BUILTIN (packsshb, MIPS_V8QI_FTYPE_V4HI_V4HI),
13960 LOONGSON_BUILTIN (packushb, MIPS_UV8QI_FTYPE_UV4HI_UV4HI),
13961 LOONGSON_BUILTIN_SUFFIX (paddw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
13962 LOONGSON_BUILTIN_SUFFIX (paddh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13963 LOONGSON_BUILTIN_SUFFIX (paddb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13964 LOONGSON_BUILTIN_SUFFIX (paddw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
13965 LOONGSON_BUILTIN_SUFFIX (paddh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
13966 LOONGSON_BUILTIN_SUFFIX (paddb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
13967 LOONGSON_BUILTIN_SUFFIX (paddd, u, MIPS_UDI_FTYPE_UDI_UDI),
13968 LOONGSON_BUILTIN_SUFFIX (paddd, s, MIPS_DI_FTYPE_DI_DI),
13969 LOONGSON_BUILTIN (paddsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
13970 LOONGSON_BUILTIN (paddsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
13971 LOONGSON_BUILTIN (paddush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13972 LOONGSON_BUILTIN (paddusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13973 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_ud, MIPS_UDI_FTYPE_UDI_UDI),
13974 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_uw, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
13975 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_uh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13976 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_ub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13977 LOONGSON_BUILTIN_ALIAS (pandn_d, pandn_sd, MIPS_DI_FTYPE_DI_DI),
13978 LOONGSON_BUILTIN_ALIAS (pandn_w, pandn_sw, MIPS_V2SI_FTYPE_V2SI_V2SI),
13979 LOONGSON_BUILTIN_ALIAS (pandn_h, pandn_sh, MIPS_V4HI_FTYPE_V4HI_V4HI),
13980 LOONGSON_BUILTIN_ALIAS (pandn_b, pandn_sb, MIPS_V8QI_FTYPE_V8QI_V8QI),
13981 LOONGSON_BUILTIN (pavgh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13982 LOONGSON_BUILTIN (pavgb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13983 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
13984 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13985 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13986 LOONGSON_BUILTIN_SUFFIX (pcmpeqw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
13987 LOONGSON_BUILTIN_SUFFIX (pcmpeqh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
13988 LOONGSON_BUILTIN_SUFFIX (pcmpeqb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
13989 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
13990 LOONGSON_BUILTIN_SUFFIX (pcmpgth, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13991 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
13992 LOONGSON_BUILTIN_SUFFIX (pcmpgtw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
13993 LOONGSON_BUILTIN_SUFFIX (pcmpgth, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
13994 LOONGSON_BUILTIN_SUFFIX (pcmpgtb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
13995 LOONGSON_BUILTIN_SUFFIX (pextrh, u, MIPS_UV4HI_FTYPE_UV4HI_USI),
13996 LOONGSON_BUILTIN_SUFFIX (pextrh, s, MIPS_V4HI_FTYPE_V4HI_USI),
13997 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13998 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
13999 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14000 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14001 LOONGSON_BUILTIN_SUFFIX (pinsrh_0, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14002 LOONGSON_BUILTIN_SUFFIX (pinsrh_1, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14003 LOONGSON_BUILTIN_SUFFIX (pinsrh_2, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14004 LOONGSON_BUILTIN_SUFFIX (pinsrh_3, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14005 LOONGSON_BUILTIN (pmaddhw, MIPS_V2SI_FTYPE_V4HI_V4HI),
14006 LOONGSON_BUILTIN (pmaxsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14007 LOONGSON_BUILTIN (pmaxub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14008 LOONGSON_BUILTIN (pminsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14009 LOONGSON_BUILTIN (pminub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14010 LOONGSON_BUILTIN_SUFFIX (pmovmskb, u, MIPS_UV8QI_FTYPE_UV8QI),
14011 LOONGSON_BUILTIN_SUFFIX (pmovmskb, s, MIPS_V8QI_FTYPE_V8QI),
14012 LOONGSON_BUILTIN (pmulhuh, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14013 LOONGSON_BUILTIN (pmulhh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14014 LOONGSON_BUILTIN (pmullh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14015 LOONGSON_BUILTIN (pmuluw, MIPS_UDI_FTYPE_UV2SI_UV2SI),
14016 LOONGSON_BUILTIN (pasubub, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14017 LOONGSON_BUILTIN (biadd, MIPS_UV4HI_FTYPE_UV8QI),
14018 LOONGSON_BUILTIN (psadbh, MIPS_UV4HI_FTYPE_UV8QI_UV8QI),
14019 LOONGSON_BUILTIN_SUFFIX (pshufh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14020 LOONGSON_BUILTIN_SUFFIX (pshufh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14021 LOONGSON_BUILTIN_SUFFIX (psllh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14022 LOONGSON_BUILTIN_SUFFIX (psllh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14023 LOONGSON_BUILTIN_SUFFIX (psllw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14024 LOONGSON_BUILTIN_SUFFIX (psllw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14025 LOONGSON_BUILTIN_SUFFIX (psrah, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14026 LOONGSON_BUILTIN_SUFFIX (psrah, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14027 LOONGSON_BUILTIN_SUFFIX (psraw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14028 LOONGSON_BUILTIN_SUFFIX (psraw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14029 LOONGSON_BUILTIN_SUFFIX (psrlh, u, MIPS_UV4HI_FTYPE_UV4HI_UQI),
14030 LOONGSON_BUILTIN_SUFFIX (psrlh, s, MIPS_V4HI_FTYPE_V4HI_UQI),
14031 LOONGSON_BUILTIN_SUFFIX (psrlw, u, MIPS_UV2SI_FTYPE_UV2SI_UQI),
14032 LOONGSON_BUILTIN_SUFFIX (psrlw, s, MIPS_V2SI_FTYPE_V2SI_UQI),
14033 LOONGSON_BUILTIN_SUFFIX (psubw, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14034 LOONGSON_BUILTIN_SUFFIX (psubh, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14035 LOONGSON_BUILTIN_SUFFIX (psubb, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14036 LOONGSON_BUILTIN_SUFFIX (psubw, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14037 LOONGSON_BUILTIN_SUFFIX (psubh, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14038 LOONGSON_BUILTIN_SUFFIX (psubb, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14039 LOONGSON_BUILTIN_SUFFIX (psubd, u, MIPS_UDI_FTYPE_UDI_UDI),
14040 LOONGSON_BUILTIN_SUFFIX (psubd, s, MIPS_DI_FTYPE_DI_DI),
14041 LOONGSON_BUILTIN (psubsh, MIPS_V4HI_FTYPE_V4HI_V4HI),
14042 LOONGSON_BUILTIN (psubsb, MIPS_V8QI_FTYPE_V8QI_V8QI),
14043 LOONGSON_BUILTIN (psubush, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14044 LOONGSON_BUILTIN (psubusb, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14045 LOONGSON_BUILTIN_SUFFIX (punpckhbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14046 LOONGSON_BUILTIN_SUFFIX (punpckhhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14047 LOONGSON_BUILTIN_SUFFIX (punpckhwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14048 LOONGSON_BUILTIN_SUFFIX (punpckhbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14049 LOONGSON_BUILTIN_SUFFIX (punpckhhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14050 LOONGSON_BUILTIN_SUFFIX (punpckhwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14051 LOONGSON_BUILTIN_SUFFIX (punpcklbh, u, MIPS_UV8QI_FTYPE_UV8QI_UV8QI),
14052 LOONGSON_BUILTIN_SUFFIX (punpcklhw, u, MIPS_UV4HI_FTYPE_UV4HI_UV4HI),
14053 LOONGSON_BUILTIN_SUFFIX (punpcklwd, u, MIPS_UV2SI_FTYPE_UV2SI_UV2SI),
14054 LOONGSON_BUILTIN_SUFFIX (punpcklbh, s, MIPS_V8QI_FTYPE_V8QI_V8QI),
14055 LOONGSON_BUILTIN_SUFFIX (punpcklhw, s, MIPS_V4HI_FTYPE_V4HI_V4HI),
14056 LOONGSON_BUILTIN_SUFFIX (punpcklwd, s, MIPS_V2SI_FTYPE_V2SI_V2SI),
14057
14058 /* Sundry other built-in functions. */
14059 DIRECT_NO_TARGET_BUILTIN (cache, MIPS_VOID_FTYPE_SI_CVPOINTER, cache)
14060 };
14061
14062 /* Index I is the function declaration for mips_builtins[I], or null if the
14063 function isn't defined on this target. */
14064 static GTY(()) tree mips_builtin_decls[ARRAY_SIZE (mips_builtins)];
14065
14066 /* MODE is a vector mode whose elements have type TYPE. Return the type
14067 of the vector itself. */
14068
14069 static tree
14070 mips_builtin_vector_type (tree type, enum machine_mode mode)
14071 {
14072 static tree types[2 * (int) MAX_MACHINE_MODE];
14073 int mode_index;
14074
14075 mode_index = (int) mode;
14076
14077 if (TREE_CODE (type) == INTEGER_TYPE && TYPE_UNSIGNED (type))
14078 mode_index += MAX_MACHINE_MODE;
14079
14080 if (types[mode_index] == NULL_TREE)
14081 types[mode_index] = build_vector_type_for_mode (type, mode);
14082 return types[mode_index];
14083 }
14084
14085 /* Return a type for 'const volatile void *'. */
14086
14087 static tree
14088 mips_build_cvpointer_type (void)
14089 {
14090 static tree cache;
14091
14092 if (cache == NULL_TREE)
14093 cache = build_pointer_type (build_qualified_type
14094 (void_type_node,
14095 TYPE_QUAL_CONST | TYPE_QUAL_VOLATILE));
14096 return cache;
14097 }
14098
14099 /* Source-level argument types. */
14100 #define MIPS_ATYPE_VOID void_type_node
14101 #define MIPS_ATYPE_INT integer_type_node
14102 #define MIPS_ATYPE_POINTER ptr_type_node
14103 #define MIPS_ATYPE_CVPOINTER mips_build_cvpointer_type ()
14104
14105 /* Standard mode-based argument types. */
14106 #define MIPS_ATYPE_UQI unsigned_intQI_type_node
14107 #define MIPS_ATYPE_SI intSI_type_node
14108 #define MIPS_ATYPE_USI unsigned_intSI_type_node
14109 #define MIPS_ATYPE_DI intDI_type_node
14110 #define MIPS_ATYPE_UDI unsigned_intDI_type_node
14111 #define MIPS_ATYPE_SF float_type_node
14112 #define MIPS_ATYPE_DF double_type_node
14113
14114 /* Vector argument types. */
14115 #define MIPS_ATYPE_V2SF mips_builtin_vector_type (float_type_node, V2SFmode)
14116 #define MIPS_ATYPE_V2HI mips_builtin_vector_type (intHI_type_node, V2HImode)
14117 #define MIPS_ATYPE_V2SI mips_builtin_vector_type (intSI_type_node, V2SImode)
14118 #define MIPS_ATYPE_V4QI mips_builtin_vector_type (intQI_type_node, V4QImode)
14119 #define MIPS_ATYPE_V4HI mips_builtin_vector_type (intHI_type_node, V4HImode)
14120 #define MIPS_ATYPE_V8QI mips_builtin_vector_type (intQI_type_node, V8QImode)
14121 #define MIPS_ATYPE_UV2SI \
14122 mips_builtin_vector_type (unsigned_intSI_type_node, V2SImode)
14123 #define MIPS_ATYPE_UV4HI \
14124 mips_builtin_vector_type (unsigned_intHI_type_node, V4HImode)
14125 #define MIPS_ATYPE_UV8QI \
14126 mips_builtin_vector_type (unsigned_intQI_type_node, V8QImode)
14127
14128 /* MIPS_FTYPE_ATYPESN takes N MIPS_FTYPES-like type codes and lists
14129 their associated MIPS_ATYPEs. */
14130 #define MIPS_FTYPE_ATYPES1(A, B) \
14131 MIPS_ATYPE_##A, MIPS_ATYPE_##B
14132
14133 #define MIPS_FTYPE_ATYPES2(A, B, C) \
14134 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C
14135
14136 #define MIPS_FTYPE_ATYPES3(A, B, C, D) \
14137 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D
14138
14139 #define MIPS_FTYPE_ATYPES4(A, B, C, D, E) \
14140 MIPS_ATYPE_##A, MIPS_ATYPE_##B, MIPS_ATYPE_##C, MIPS_ATYPE_##D, \
14141 MIPS_ATYPE_##E
14142
14143 /* Return the function type associated with function prototype TYPE. */
14144
14145 static tree
14146 mips_build_function_type (enum mips_function_type type)
14147 {
14148 static tree types[(int) MIPS_MAX_FTYPE_MAX];
14149
14150 if (types[(int) type] == NULL_TREE)
14151 switch (type)
14152 {
14153 #define DEF_MIPS_FTYPE(NUM, ARGS) \
14154 case MIPS_FTYPE_NAME##NUM ARGS: \
14155 types[(int) type] \
14156 = build_function_type_list (MIPS_FTYPE_ATYPES##NUM ARGS, \
14157 NULL_TREE); \
14158 break;
14159 #include "config/mips/mips-ftypes.def"
14160 #undef DEF_MIPS_FTYPE
14161 default:
14162 gcc_unreachable ();
14163 }
14164
14165 return types[(int) type];
14166 }
14167
14168 /* Implement TARGET_INIT_BUILTINS. */
14169
14170 static void
14171 mips_init_builtins (void)
14172 {
14173 const struct mips_builtin_description *d;
14174 unsigned int i;
14175
14176 /* Iterate through all of the bdesc arrays, initializing all of the
14177 builtin functions. */
14178 for (i = 0; i < ARRAY_SIZE (mips_builtins); i++)
14179 {
14180 d = &mips_builtins[i];
14181 if (d->avail ())
14182 mips_builtin_decls[i]
14183 = add_builtin_function (d->name,
14184 mips_build_function_type (d->function_type),
14185 i, BUILT_IN_MD, NULL, NULL);
14186 }
14187 }
14188
14189 /* Implement TARGET_BUILTIN_DECL. */
14190
14191 static tree
14192 mips_builtin_decl (unsigned int code, bool initialize_p ATTRIBUTE_UNUSED)
14193 {
14194 if (code >= ARRAY_SIZE (mips_builtins))
14195 return error_mark_node;
14196 return mips_builtin_decls[code];
14197 }
14198
14199 /* Take argument ARGNO from EXP's argument list and convert it into
14200 an expand operand. Store the operand in *OP. */
14201
14202 static void
14203 mips_prepare_builtin_arg (struct expand_operand *op, tree exp,
14204 unsigned int argno)
14205 {
14206 tree arg;
14207 rtx value;
14208
14209 arg = CALL_EXPR_ARG (exp, argno);
14210 value = expand_normal (arg);
14211 create_input_operand (op, value, TYPE_MODE (TREE_TYPE (arg)));
14212 }
14213
14214 /* Expand instruction ICODE as part of a built-in function sequence.
14215 Use the first NOPS elements of OPS as the instruction's operands.
14216 HAS_TARGET_P is true if operand 0 is a target; it is false if the
14217 instruction has no target.
14218
14219 Return the target rtx if HAS_TARGET_P, otherwise return const0_rtx. */
14220
14221 static rtx
14222 mips_expand_builtin_insn (enum insn_code icode, unsigned int nops,
14223 struct expand_operand *ops, bool has_target_p)
14224 {
14225 if (!maybe_expand_insn (icode, nops, ops))
14226 {
14227 error ("invalid argument to built-in function");
14228 return has_target_p ? gen_reg_rtx (ops[0].mode) : const0_rtx;
14229 }
14230 return has_target_p ? ops[0].value : const0_rtx;
14231 }
14232
14233 /* Expand a floating-point comparison for built-in function call EXP.
14234 The first NARGS arguments are the values to be compared. ICODE is
14235 the .md pattern that does the comparison and COND is the condition
14236 that is being tested. Return an rtx for the result. */
14237
14238 static rtx
14239 mips_expand_builtin_compare_1 (enum insn_code icode,
14240 enum mips_fp_condition cond,
14241 tree exp, int nargs)
14242 {
14243 struct expand_operand ops[MAX_RECOG_OPERANDS];
14244 rtx output;
14245 int opno, argno;
14246
14247 /* The instruction should have a target operand, an operand for each
14248 argument, and an operand for COND. */
14249 gcc_assert (nargs + 2 == insn_data[(int) icode].n_generator_args);
14250
14251 output = mips_allocate_fcc (insn_data[(int) icode].operand[0].mode);
14252 opno = 0;
14253 create_fixed_operand (&ops[opno++], output);
14254 for (argno = 0; argno < nargs; argno++)
14255 mips_prepare_builtin_arg (&ops[opno++], exp, argno);
14256 create_integer_operand (&ops[opno++], (int) cond);
14257 return mips_expand_builtin_insn (icode, opno, ops, true);
14258 }
14259
14260 /* Expand a MIPS_BUILTIN_DIRECT or MIPS_BUILTIN_DIRECT_NO_TARGET function;
14261 HAS_TARGET_P says which. EXP is the CALL_EXPR that calls the function
14262 and ICODE is the code of the associated .md pattern. TARGET, if nonnull,
14263 suggests a good place to put the result. */
14264
14265 static rtx
14266 mips_expand_builtin_direct (enum insn_code icode, rtx target, tree exp,
14267 bool has_target_p)
14268 {
14269 struct expand_operand ops[MAX_RECOG_OPERANDS];
14270 int opno, argno;
14271
14272 /* Map any target to operand 0. */
14273 opno = 0;
14274 if (has_target_p)
14275 create_output_operand (&ops[opno++], target, TYPE_MODE (TREE_TYPE (exp)));
14276
14277 /* Map the arguments to the other operands. */
14278 gcc_assert (opno + call_expr_nargs (exp)
14279 == insn_data[icode].n_generator_args);
14280 for (argno = 0; argno < call_expr_nargs (exp); argno++)
14281 mips_prepare_builtin_arg (&ops[opno++], exp, argno);
14282
14283 return mips_expand_builtin_insn (icode, opno, ops, has_target_p);
14284 }
14285
14286 /* Expand a __builtin_mips_movt_*_ps or __builtin_mips_movf_*_ps
14287 function; TYPE says which. EXP is the CALL_EXPR that calls the
14288 function, ICODE is the instruction that should be used to compare
14289 the first two arguments, and COND is the condition it should test.
14290 TARGET, if nonnull, suggests a good place to put the result. */
14291
14292 static rtx
14293 mips_expand_builtin_movtf (enum mips_builtin_type type,
14294 enum insn_code icode, enum mips_fp_condition cond,
14295 rtx target, tree exp)
14296 {
14297 struct expand_operand ops[4];
14298 rtx cmp_result;
14299
14300 cmp_result = mips_expand_builtin_compare_1 (icode, cond, exp, 2);
14301 create_output_operand (&ops[0], target, TYPE_MODE (TREE_TYPE (exp)));
14302 if (type == MIPS_BUILTIN_MOVT)
14303 {
14304 mips_prepare_builtin_arg (&ops[2], exp, 2);
14305 mips_prepare_builtin_arg (&ops[1], exp, 3);
14306 }
14307 else
14308 {
14309 mips_prepare_builtin_arg (&ops[1], exp, 2);
14310 mips_prepare_builtin_arg (&ops[2], exp, 3);
14311 }
14312 create_fixed_operand (&ops[3], cmp_result);
14313 return mips_expand_builtin_insn (CODE_FOR_mips_cond_move_tf_ps,
14314 4, ops, true);
14315 }
14316
14317 /* Move VALUE_IF_TRUE into TARGET if CONDITION is true; move VALUE_IF_FALSE
14318 into TARGET otherwise. Return TARGET. */
14319
14320 static rtx
14321 mips_builtin_branch_and_move (rtx condition, rtx target,
14322 rtx value_if_true, rtx value_if_false)
14323 {
14324 rtx true_label, done_label;
14325
14326 true_label = gen_label_rtx ();
14327 done_label = gen_label_rtx ();
14328
14329 /* First assume that CONDITION is false. */
14330 mips_emit_move (target, value_if_false);
14331
14332 /* Branch to TRUE_LABEL if CONDITION is true and DONE_LABEL otherwise. */
14333 emit_jump_insn (gen_condjump (condition, true_label));
14334 emit_jump_insn (gen_jump (done_label));
14335 emit_barrier ();
14336
14337 /* Fix TARGET if CONDITION is true. */
14338 emit_label (true_label);
14339 mips_emit_move (target, value_if_true);
14340
14341 emit_label (done_label);
14342 return target;
14343 }
14344
14345 /* Expand a comparison built-in function of type BUILTIN_TYPE. EXP is
14346 the CALL_EXPR that calls the function, ICODE is the code of the
14347 comparison instruction, and COND is the condition it should test.
14348 TARGET, if nonnull, suggests a good place to put the boolean result. */
14349
14350 static rtx
14351 mips_expand_builtin_compare (enum mips_builtin_type builtin_type,
14352 enum insn_code icode, enum mips_fp_condition cond,
14353 rtx target, tree exp)
14354 {
14355 rtx offset, condition, cmp_result;
14356
14357 if (target == 0 || GET_MODE (target) != SImode)
14358 target = gen_reg_rtx (SImode);
14359 cmp_result = mips_expand_builtin_compare_1 (icode, cond, exp,
14360 call_expr_nargs (exp));
14361
14362 /* If the comparison sets more than one register, we define the result
14363 to be 0 if all registers are false and -1 if all registers are true.
14364 The value of the complete result is indeterminate otherwise. */
14365 switch (builtin_type)
14366 {
14367 case MIPS_BUILTIN_CMP_ALL:
14368 condition = gen_rtx_NE (VOIDmode, cmp_result, constm1_rtx);
14369 return mips_builtin_branch_and_move (condition, target,
14370 const0_rtx, const1_rtx);
14371
14372 case MIPS_BUILTIN_CMP_UPPER:
14373 case MIPS_BUILTIN_CMP_LOWER:
14374 offset = GEN_INT (builtin_type == MIPS_BUILTIN_CMP_UPPER);
14375 condition = gen_single_cc (cmp_result, offset);
14376 return mips_builtin_branch_and_move (condition, target,
14377 const1_rtx, const0_rtx);
14378
14379 default:
14380 condition = gen_rtx_NE (VOIDmode, cmp_result, const0_rtx);
14381 return mips_builtin_branch_and_move (condition, target,
14382 const1_rtx, const0_rtx);
14383 }
14384 }
14385
14386 /* Expand a bposge built-in function of type BUILTIN_TYPE. TARGET,
14387 if nonnull, suggests a good place to put the boolean result. */
14388
14389 static rtx
14390 mips_expand_builtin_bposge (enum mips_builtin_type builtin_type, rtx target)
14391 {
14392 rtx condition, cmp_result;
14393 int cmp_value;
14394
14395 if (target == 0 || GET_MODE (target) != SImode)
14396 target = gen_reg_rtx (SImode);
14397
14398 cmp_result = gen_rtx_REG (CCDSPmode, CCDSP_PO_REGNUM);
14399
14400 if (builtin_type == MIPS_BUILTIN_BPOSGE32)
14401 cmp_value = 32;
14402 else
14403 gcc_assert (0);
14404
14405 condition = gen_rtx_GE (VOIDmode, cmp_result, GEN_INT (cmp_value));
14406 return mips_builtin_branch_and_move (condition, target,
14407 const1_rtx, const0_rtx);
14408 }
14409
14410 /* Implement TARGET_EXPAND_BUILTIN. */
14411
14412 static rtx
14413 mips_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED,
14414 enum machine_mode mode, int ignore)
14415 {
14416 tree fndecl;
14417 unsigned int fcode, avail;
14418 const struct mips_builtin_description *d;
14419
14420 fndecl = TREE_OPERAND (CALL_EXPR_FN (exp), 0);
14421 fcode = DECL_FUNCTION_CODE (fndecl);
14422 gcc_assert (fcode < ARRAY_SIZE (mips_builtins));
14423 d = &mips_builtins[fcode];
14424 avail = d->avail ();
14425 gcc_assert (avail != 0);
14426 if (TARGET_MIPS16)
14427 {
14428 error ("built-in function %qE not supported for MIPS16",
14429 DECL_NAME (fndecl));
14430 return ignore ? const0_rtx : CONST0_RTX (mode);
14431 }
14432 switch (d->builtin_type)
14433 {
14434 case MIPS_BUILTIN_DIRECT:
14435 return mips_expand_builtin_direct (d->icode, target, exp, true);
14436
14437 case MIPS_BUILTIN_DIRECT_NO_TARGET:
14438 return mips_expand_builtin_direct (d->icode, target, exp, false);
14439
14440 case MIPS_BUILTIN_MOVT:
14441 case MIPS_BUILTIN_MOVF:
14442 return mips_expand_builtin_movtf (d->builtin_type, d->icode,
14443 d->cond, target, exp);
14444
14445 case MIPS_BUILTIN_CMP_ANY:
14446 case MIPS_BUILTIN_CMP_ALL:
14447 case MIPS_BUILTIN_CMP_UPPER:
14448 case MIPS_BUILTIN_CMP_LOWER:
14449 case MIPS_BUILTIN_CMP_SINGLE:
14450 return mips_expand_builtin_compare (d->builtin_type, d->icode,
14451 d->cond, target, exp);
14452
14453 case MIPS_BUILTIN_BPOSGE32:
14454 return mips_expand_builtin_bposge (d->builtin_type, target);
14455 }
14456 gcc_unreachable ();
14457 }
14458 \f
14459 /* An entry in the MIPS16 constant pool. VALUE is the pool constant,
14460 MODE is its mode, and LABEL is the CODE_LABEL associated with it. */
14461 struct mips16_constant {
14462 struct mips16_constant *next;
14463 rtx value;
14464 rtx label;
14465 enum machine_mode mode;
14466 };
14467
14468 /* Information about an incomplete MIPS16 constant pool. FIRST is the
14469 first constant, HIGHEST_ADDRESS is the highest address that the first
14470 byte of the pool can have, and INSN_ADDRESS is the current instruction
14471 address. */
14472 struct mips16_constant_pool {
14473 struct mips16_constant *first;
14474 int highest_address;
14475 int insn_address;
14476 };
14477
14478 /* Add constant VALUE to POOL and return its label. MODE is the
14479 value's mode (used for CONST_INTs, etc.). */
14480
14481 static rtx
14482 mips16_add_constant (struct mips16_constant_pool *pool,
14483 rtx value, enum machine_mode mode)
14484 {
14485 struct mips16_constant **p, *c;
14486 bool first_of_size_p;
14487
14488 /* See whether the constant is already in the pool. If so, return the
14489 existing label, otherwise leave P pointing to the place where the
14490 constant should be added.
14491
14492 Keep the pool sorted in increasing order of mode size so that we can
14493 reduce the number of alignments needed. */
14494 first_of_size_p = true;
14495 for (p = &pool->first; *p != 0; p = &(*p)->next)
14496 {
14497 if (mode == (*p)->mode && rtx_equal_p (value, (*p)->value))
14498 return (*p)->label;
14499 if (GET_MODE_SIZE (mode) < GET_MODE_SIZE ((*p)->mode))
14500 break;
14501 if (GET_MODE_SIZE (mode) == GET_MODE_SIZE ((*p)->mode))
14502 first_of_size_p = false;
14503 }
14504
14505 /* In the worst case, the constant needed by the earliest instruction
14506 will end up at the end of the pool. The entire pool must then be
14507 accessible from that instruction.
14508
14509 When adding the first constant, set the pool's highest address to
14510 the address of the first out-of-range byte. Adjust this address
14511 downwards each time a new constant is added. */
14512 if (pool->first == 0)
14513 /* For LWPC, ADDIUPC and DADDIUPC, the base PC value is the address
14514 of the instruction with the lowest two bits clear. The base PC
14515 value for LDPC has the lowest three bits clear. Assume the worst
14516 case here; namely that the PC-relative instruction occupies the
14517 last 2 bytes in an aligned word. */
14518 pool->highest_address = pool->insn_address - (UNITS_PER_WORD - 2) + 0x8000;
14519 pool->highest_address -= GET_MODE_SIZE (mode);
14520 if (first_of_size_p)
14521 /* Take into account the worst possible padding due to alignment. */
14522 pool->highest_address -= GET_MODE_SIZE (mode) - 1;
14523
14524 /* Create a new entry. */
14525 c = XNEW (struct mips16_constant);
14526 c->value = value;
14527 c->mode = mode;
14528 c->label = gen_label_rtx ();
14529 c->next = *p;
14530 *p = c;
14531
14532 return c->label;
14533 }
14534
14535 /* Output constant VALUE after instruction INSN and return the last
14536 instruction emitted. MODE is the mode of the constant. */
14537
14538 static rtx
14539 mips16_emit_constants_1 (enum machine_mode mode, rtx value, rtx insn)
14540 {
14541 if (SCALAR_INT_MODE_P (mode) || ALL_SCALAR_FIXED_POINT_MODE_P (mode))
14542 {
14543 rtx size = GEN_INT (GET_MODE_SIZE (mode));
14544 return emit_insn_after (gen_consttable_int (value, size), insn);
14545 }
14546
14547 if (SCALAR_FLOAT_MODE_P (mode))
14548 return emit_insn_after (gen_consttable_float (value), insn);
14549
14550 if (VECTOR_MODE_P (mode))
14551 {
14552 int i;
14553
14554 for (i = 0; i < CONST_VECTOR_NUNITS (value); i++)
14555 insn = mips16_emit_constants_1 (GET_MODE_INNER (mode),
14556 CONST_VECTOR_ELT (value, i), insn);
14557 return insn;
14558 }
14559
14560 gcc_unreachable ();
14561 }
14562
14563 /* Dump out the constants in CONSTANTS after INSN. */
14564
14565 static void
14566 mips16_emit_constants (struct mips16_constant *constants, rtx insn)
14567 {
14568 struct mips16_constant *c, *next;
14569 int align;
14570
14571 align = 0;
14572 for (c = constants; c != NULL; c = next)
14573 {
14574 /* If necessary, increase the alignment of PC. */
14575 if (align < GET_MODE_SIZE (c->mode))
14576 {
14577 int align_log = floor_log2 (GET_MODE_SIZE (c->mode));
14578 insn = emit_insn_after (gen_align (GEN_INT (align_log)), insn);
14579 }
14580 align = GET_MODE_SIZE (c->mode);
14581
14582 insn = emit_label_after (c->label, insn);
14583 insn = mips16_emit_constants_1 (c->mode, c->value, insn);
14584
14585 next = c->next;
14586 free (c);
14587 }
14588
14589 emit_barrier_after (insn);
14590 }
14591
14592 /* Return the length of instruction INSN. */
14593
14594 static int
14595 mips16_insn_length (rtx insn)
14596 {
14597 if (JUMP_TABLE_DATA_P (insn))
14598 {
14599 rtx body = PATTERN (insn);
14600 if (GET_CODE (body) == ADDR_VEC)
14601 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 0);
14602 else if (GET_CODE (body) == ADDR_DIFF_VEC)
14603 return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, 1);
14604 else
14605 gcc_unreachable ();
14606 }
14607 return get_attr_length (insn);
14608 }
14609
14610 /* If *X is a symbolic constant that refers to the constant pool, add
14611 the constant to POOL and rewrite *X to use the constant's label. */
14612
14613 static void
14614 mips16_rewrite_pool_constant (struct mips16_constant_pool *pool, rtx *x)
14615 {
14616 rtx base, offset, label;
14617
14618 split_const (*x, &base, &offset);
14619 if (GET_CODE (base) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (base))
14620 {
14621 label = mips16_add_constant (pool, copy_rtx (get_pool_constant (base)),
14622 get_pool_mode (base));
14623 base = gen_rtx_LABEL_REF (Pmode, label);
14624 *x = mips_unspec_address_offset (base, offset, SYMBOL_PC_RELATIVE);
14625 }
14626 }
14627
14628 /* This structure is used to communicate with mips16_rewrite_pool_refs.
14629 INSN is the instruction we're rewriting and POOL points to the current
14630 constant pool. */
14631 struct mips16_rewrite_pool_refs_info {
14632 rtx insn;
14633 struct mips16_constant_pool *pool;
14634 };
14635
14636 /* Rewrite *X so that constant pool references refer to the constant's
14637 label instead. DATA points to a mips16_rewrite_pool_refs_info
14638 structure. */
14639
14640 static int
14641 mips16_rewrite_pool_refs (rtx *x, void *data)
14642 {
14643 struct mips16_rewrite_pool_refs_info *info =
14644 (struct mips16_rewrite_pool_refs_info *) data;
14645
14646 if (force_to_mem_operand (*x, Pmode))
14647 {
14648 rtx mem = force_const_mem (GET_MODE (*x), *x);
14649 validate_change (info->insn, x, mem, false);
14650 }
14651
14652 if (MEM_P (*x))
14653 {
14654 mips16_rewrite_pool_constant (info->pool, &XEXP (*x, 0));
14655 return -1;
14656 }
14657
14658 /* Don't rewrite the __mips16_rdwr symbol. */
14659 if (GET_CODE (*x) == UNSPEC && XINT (*x, 1) == UNSPEC_TLS_GET_TP)
14660 return -1;
14661
14662 if (TARGET_MIPS16_TEXT_LOADS)
14663 mips16_rewrite_pool_constant (info->pool, x);
14664
14665 return GET_CODE (*x) == CONST ? -1 : 0;
14666 }
14667
14668 /* Return whether CFG is used in mips_reorg. */
14669
14670 static bool
14671 mips_cfg_in_reorg (void)
14672 {
14673 return (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE
14674 || TARGET_RELAX_PIC_CALLS);
14675 }
14676
14677 /* Build MIPS16 constant pools. Split the instructions if SPLIT_P,
14678 otherwise assume that they are already split. */
14679
14680 static void
14681 mips16_lay_out_constants (bool split_p)
14682 {
14683 struct mips16_constant_pool pool;
14684 struct mips16_rewrite_pool_refs_info info;
14685 rtx insn, barrier;
14686
14687 if (!TARGET_MIPS16_PCREL_LOADS)
14688 return;
14689
14690 if (split_p)
14691 {
14692 if (mips_cfg_in_reorg ())
14693 split_all_insns ();
14694 else
14695 split_all_insns_noflow ();
14696 }
14697 barrier = 0;
14698 memset (&pool, 0, sizeof (pool));
14699 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
14700 {
14701 /* Rewrite constant pool references in INSN. */
14702 if (USEFUL_INSN_P (insn))
14703 {
14704 info.insn = insn;
14705 info.pool = &pool;
14706 for_each_rtx (&PATTERN (insn), mips16_rewrite_pool_refs, &info);
14707 }
14708
14709 pool.insn_address += mips16_insn_length (insn);
14710
14711 if (pool.first != NULL)
14712 {
14713 /* If there are no natural barriers between the first user of
14714 the pool and the highest acceptable address, we'll need to
14715 create a new instruction to jump around the constant pool.
14716 In the worst case, this instruction will be 4 bytes long.
14717
14718 If it's too late to do this transformation after INSN,
14719 do it immediately before INSN. */
14720 if (barrier == 0 && pool.insn_address + 4 > pool.highest_address)
14721 {
14722 rtx label, jump;
14723
14724 label = gen_label_rtx ();
14725
14726 jump = emit_jump_insn_before (gen_jump (label), insn);
14727 JUMP_LABEL (jump) = label;
14728 LABEL_NUSES (label) = 1;
14729 barrier = emit_barrier_after (jump);
14730
14731 emit_label_after (label, barrier);
14732 pool.insn_address += 4;
14733 }
14734
14735 /* See whether the constant pool is now out of range of the first
14736 user. If so, output the constants after the previous barrier.
14737 Note that any instructions between BARRIER and INSN (inclusive)
14738 will use negative offsets to refer to the pool. */
14739 if (pool.insn_address > pool.highest_address)
14740 {
14741 mips16_emit_constants (pool.first, barrier);
14742 pool.first = NULL;
14743 barrier = 0;
14744 }
14745 else if (BARRIER_P (insn))
14746 barrier = insn;
14747 }
14748 }
14749 mips16_emit_constants (pool.first, get_last_insn ());
14750 }
14751 \f
14752 /* Return true if it is worth r10k_simplify_address's while replacing
14753 an address with X. We are looking for constants, and for addresses
14754 at a known offset from the incoming stack pointer. */
14755
14756 static bool
14757 r10k_simplified_address_p (rtx x)
14758 {
14759 if (GET_CODE (x) == PLUS && CONST_INT_P (XEXP (x, 1)))
14760 x = XEXP (x, 0);
14761 return x == virtual_incoming_args_rtx || CONSTANT_P (x);
14762 }
14763
14764 /* X is an expression that appears in INSN. Try to use the UD chains
14765 to simplify it, returning the simplified form on success and the
14766 original form otherwise. Replace the incoming value of $sp with
14767 virtual_incoming_args_rtx (which should never occur in X otherwise). */
14768
14769 static rtx
14770 r10k_simplify_address (rtx x, rtx insn)
14771 {
14772 rtx newx, op0, op1, set, def_insn, note;
14773 df_ref use, def;
14774 struct df_link *defs;
14775
14776 newx = NULL_RTX;
14777 if (UNARY_P (x))
14778 {
14779 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14780 if (op0 != XEXP (x, 0))
14781 newx = simplify_gen_unary (GET_CODE (x), GET_MODE (x),
14782 op0, GET_MODE (XEXP (x, 0)));
14783 }
14784 else if (BINARY_P (x))
14785 {
14786 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14787 op1 = r10k_simplify_address (XEXP (x, 1), insn);
14788 if (op0 != XEXP (x, 0) || op1 != XEXP (x, 1))
14789 newx = simplify_gen_binary (GET_CODE (x), GET_MODE (x), op0, op1);
14790 }
14791 else if (GET_CODE (x) == LO_SUM)
14792 {
14793 /* LO_SUMs can be offset from HIGHs, if we know they won't
14794 overflow. See mips_classify_address for the rationale behind
14795 the lax check. */
14796 op0 = r10k_simplify_address (XEXP (x, 0), insn);
14797 if (GET_CODE (op0) == HIGH)
14798 newx = XEXP (x, 1);
14799 }
14800 else if (REG_P (x))
14801 {
14802 /* Uses are recorded by regno_reg_rtx, not X itself. */
14803 use = df_find_use (insn, regno_reg_rtx[REGNO (x)]);
14804 gcc_assert (use);
14805 defs = DF_REF_CHAIN (use);
14806
14807 /* Require a single definition. */
14808 if (defs && defs->next == NULL)
14809 {
14810 def = defs->ref;
14811 if (DF_REF_IS_ARTIFICIAL (def))
14812 {
14813 /* Replace the incoming value of $sp with
14814 virtual_incoming_args_rtx. */
14815 if (x == stack_pointer_rtx
14816 && DF_REF_BB (def) == ENTRY_BLOCK_PTR)
14817 newx = virtual_incoming_args_rtx;
14818 }
14819 else if (dominated_by_p (CDI_DOMINATORS, DF_REF_BB (use),
14820 DF_REF_BB (def)))
14821 {
14822 /* Make sure that DEF_INSN is a single set of REG. */
14823 def_insn = DF_REF_INSN (def);
14824 if (NONJUMP_INSN_P (def_insn))
14825 {
14826 set = single_set (def_insn);
14827 if (set && rtx_equal_p (SET_DEST (set), x))
14828 {
14829 /* Prefer to use notes, since the def-use chains
14830 are often shorter. */
14831 note = find_reg_equal_equiv_note (def_insn);
14832 if (note)
14833 newx = XEXP (note, 0);
14834 else
14835 newx = SET_SRC (set);
14836 newx = r10k_simplify_address (newx, def_insn);
14837 }
14838 }
14839 }
14840 }
14841 }
14842 if (newx && r10k_simplified_address_p (newx))
14843 return newx;
14844 return x;
14845 }
14846
14847 /* Return true if ADDRESS is known to be an uncached address
14848 on R10K systems. */
14849
14850 static bool
14851 r10k_uncached_address_p (unsigned HOST_WIDE_INT address)
14852 {
14853 unsigned HOST_WIDE_INT upper;
14854
14855 /* Check for KSEG1. */
14856 if (address + 0x60000000 < 0x20000000)
14857 return true;
14858
14859 /* Check for uncached XKPHYS addresses. */
14860 if (Pmode == DImode)
14861 {
14862 upper = (address >> 40) & 0xf9ffff;
14863 if (upper == 0x900000 || upper == 0xb80000)
14864 return true;
14865 }
14866 return false;
14867 }
14868
14869 /* Return true if we can prove that an access to address X in instruction
14870 INSN would be safe from R10K speculation. This X is a general
14871 expression; it might not be a legitimate address. */
14872
14873 static bool
14874 r10k_safe_address_p (rtx x, rtx insn)
14875 {
14876 rtx base, offset;
14877 HOST_WIDE_INT offset_val;
14878
14879 x = r10k_simplify_address (x, insn);
14880
14881 /* Check for references to the stack frame. It doesn't really matter
14882 how much of the frame has been allocated at INSN; -mr10k-cache-barrier
14883 allows us to assume that accesses to any part of the eventual frame
14884 is safe from speculation at any point in the function. */
14885 mips_split_plus (x, &base, &offset_val);
14886 if (base == virtual_incoming_args_rtx
14887 && offset_val >= -cfun->machine->frame.total_size
14888 && offset_val < cfun->machine->frame.args_size)
14889 return true;
14890
14891 /* Check for uncached addresses. */
14892 if (CONST_INT_P (x))
14893 return r10k_uncached_address_p (INTVAL (x));
14894
14895 /* Check for accesses to a static object. */
14896 split_const (x, &base, &offset);
14897 return offset_within_block_p (base, INTVAL (offset));
14898 }
14899
14900 /* Return true if a MEM with MEM_EXPR EXPR and MEM_OFFSET OFFSET is
14901 an in-range access to an automatic variable, or to an object with
14902 a link-time-constant address. */
14903
14904 static bool
14905 r10k_safe_mem_expr_p (tree expr, HOST_WIDE_INT offset)
14906 {
14907 HOST_WIDE_INT bitoffset, bitsize;
14908 tree inner, var_offset;
14909 enum machine_mode mode;
14910 int unsigned_p, volatile_p;
14911
14912 inner = get_inner_reference (expr, &bitsize, &bitoffset, &var_offset, &mode,
14913 &unsigned_p, &volatile_p, false);
14914 if (!DECL_P (inner) || !DECL_SIZE_UNIT (inner) || var_offset)
14915 return false;
14916
14917 offset += bitoffset / BITS_PER_UNIT;
14918 return offset >= 0 && offset < tree_low_cst (DECL_SIZE_UNIT (inner), 1);
14919 }
14920
14921 /* A for_each_rtx callback for which DATA points to the instruction
14922 containing *X. Stop the search if we find a MEM that is not safe
14923 from R10K speculation. */
14924
14925 static int
14926 r10k_needs_protection_p_1 (rtx *loc, void *data)
14927 {
14928 rtx mem;
14929
14930 mem = *loc;
14931 if (!MEM_P (mem))
14932 return 0;
14933
14934 if (MEM_EXPR (mem)
14935 && MEM_OFFSET_KNOWN_P (mem)
14936 && r10k_safe_mem_expr_p (MEM_EXPR (mem), MEM_OFFSET (mem)))
14937 return -1;
14938
14939 if (r10k_safe_address_p (XEXP (mem, 0), (rtx) data))
14940 return -1;
14941
14942 return 1;
14943 }
14944
14945 /* A note_stores callback for which DATA points to an instruction pointer.
14946 If *DATA is nonnull, make it null if it X contains a MEM that is not
14947 safe from R10K speculation. */
14948
14949 static void
14950 r10k_needs_protection_p_store (rtx x, const_rtx pat ATTRIBUTE_UNUSED,
14951 void *data)
14952 {
14953 rtx *insn_ptr;
14954
14955 insn_ptr = (rtx *) data;
14956 if (*insn_ptr && for_each_rtx (&x, r10k_needs_protection_p_1, *insn_ptr))
14957 *insn_ptr = NULL_RTX;
14958 }
14959
14960 /* A for_each_rtx callback that iterates over the pattern of a CALL_INSN.
14961 Return nonzero if the call is not to a declared function. */
14962
14963 static int
14964 r10k_needs_protection_p_call (rtx *loc, void *data ATTRIBUTE_UNUSED)
14965 {
14966 rtx x;
14967
14968 x = *loc;
14969 if (!MEM_P (x))
14970 return 0;
14971
14972 x = XEXP (x, 0);
14973 if (GET_CODE (x) == SYMBOL_REF && SYMBOL_REF_DECL (x))
14974 return -1;
14975
14976 return 1;
14977 }
14978
14979 /* Return true if instruction INSN needs to be protected by an R10K
14980 cache barrier. */
14981
14982 static bool
14983 r10k_needs_protection_p (rtx insn)
14984 {
14985 if (CALL_P (insn))
14986 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_call, NULL);
14987
14988 if (mips_r10k_cache_barrier == R10K_CACHE_BARRIER_STORE)
14989 {
14990 note_stores (PATTERN (insn), r10k_needs_protection_p_store, &insn);
14991 return insn == NULL_RTX;
14992 }
14993
14994 return for_each_rtx (&PATTERN (insn), r10k_needs_protection_p_1, insn);
14995 }
14996
14997 /* Return true if BB is only reached by blocks in PROTECTED_BBS and if every
14998 edge is unconditional. */
14999
15000 static bool
15001 r10k_protected_bb_p (basic_block bb, sbitmap protected_bbs)
15002 {
15003 edge_iterator ei;
15004 edge e;
15005
15006 FOR_EACH_EDGE (e, ei, bb->preds)
15007 if (!single_succ_p (e->src)
15008 || !bitmap_bit_p (protected_bbs, e->src->index)
15009 || (e->flags & EDGE_COMPLEX) != 0)
15010 return false;
15011 return true;
15012 }
15013
15014 /* Implement -mr10k-cache-barrier= for the current function. */
15015
15016 static void
15017 r10k_insert_cache_barriers (void)
15018 {
15019 int *rev_post_order;
15020 unsigned int i, n;
15021 basic_block bb;
15022 sbitmap protected_bbs;
15023 rtx insn, end, unprotected_region;
15024
15025 if (TARGET_MIPS16)
15026 {
15027 sorry ("%qs does not support MIPS16 code", "-mr10k-cache-barrier");
15028 return;
15029 }
15030
15031 /* Calculate dominators. */
15032 calculate_dominance_info (CDI_DOMINATORS);
15033
15034 /* Bit X of PROTECTED_BBS is set if the last operation in basic block
15035 X is protected by a cache barrier. */
15036 protected_bbs = sbitmap_alloc (last_basic_block);
15037 bitmap_clear (protected_bbs);
15038
15039 /* Iterate over the basic blocks in reverse post-order. */
15040 rev_post_order = XNEWVEC (int, last_basic_block);
15041 n = pre_and_rev_post_order_compute (NULL, rev_post_order, false);
15042 for (i = 0; i < n; i++)
15043 {
15044 bb = BASIC_BLOCK (rev_post_order[i]);
15045
15046 /* If this block is only reached by unconditional edges, and if the
15047 source of every edge is protected, the beginning of the block is
15048 also protected. */
15049 if (r10k_protected_bb_p (bb, protected_bbs))
15050 unprotected_region = NULL_RTX;
15051 else
15052 unprotected_region = pc_rtx;
15053 end = NEXT_INSN (BB_END (bb));
15054
15055 /* UNPROTECTED_REGION is:
15056
15057 - null if we are processing a protected region,
15058 - pc_rtx if we are processing an unprotected region but have
15059 not yet found the first instruction in it
15060 - the first instruction in an unprotected region otherwise. */
15061 for (insn = BB_HEAD (bb); insn != end; insn = NEXT_INSN (insn))
15062 {
15063 if (unprotected_region && USEFUL_INSN_P (insn))
15064 {
15065 if (recog_memoized (insn) == CODE_FOR_mips_cache)
15066 /* This CACHE instruction protects the following code. */
15067 unprotected_region = NULL_RTX;
15068 else
15069 {
15070 /* See if INSN is the first instruction in this
15071 unprotected region. */
15072 if (unprotected_region == pc_rtx)
15073 unprotected_region = insn;
15074
15075 /* See if INSN needs to be protected. If so,
15076 we must insert a cache barrier somewhere between
15077 PREV_INSN (UNPROTECTED_REGION) and INSN. It isn't
15078 clear which position is better performance-wise,
15079 but as a tie-breaker, we assume that it is better
15080 to allow delay slots to be back-filled where
15081 possible, and that it is better not to insert
15082 barriers in the middle of already-scheduled code.
15083 We therefore insert the barrier at the beginning
15084 of the region. */
15085 if (r10k_needs_protection_p (insn))
15086 {
15087 emit_insn_before (gen_r10k_cache_barrier (),
15088 unprotected_region);
15089 unprotected_region = NULL_RTX;
15090 }
15091 }
15092 }
15093
15094 if (CALL_P (insn))
15095 /* The called function is not required to protect the exit path.
15096 The code that follows a call is therefore unprotected. */
15097 unprotected_region = pc_rtx;
15098 }
15099
15100 /* Record whether the end of this block is protected. */
15101 if (unprotected_region == NULL_RTX)
15102 bitmap_set_bit (protected_bbs, bb->index);
15103 }
15104 XDELETEVEC (rev_post_order);
15105
15106 sbitmap_free (protected_bbs);
15107
15108 free_dominance_info (CDI_DOMINATORS);
15109 }
15110 \f
15111 /* If INSN is a call, return the underlying CALL expr. Return NULL_RTX
15112 otherwise. If INSN has two call rtx, then store the second one in
15113 SECOND_CALL. */
15114
15115 static rtx
15116 mips_call_expr_from_insn (rtx insn, rtx *second_call)
15117 {
15118 rtx x;
15119 rtx x2;
15120
15121 if (!CALL_P (insn))
15122 return NULL_RTX;
15123
15124 x = PATTERN (insn);
15125 if (GET_CODE (x) == PARALLEL)
15126 {
15127 /* Calls returning complex values have two CALL rtx. Look for the second
15128 one here, and return it via the SECOND_CALL arg. */
15129 x2 = XVECEXP (x, 0, 1);
15130 if (GET_CODE (x2) == SET)
15131 x2 = XEXP (x2, 1);
15132 if (GET_CODE (x2) == CALL)
15133 *second_call = x2;
15134
15135 x = XVECEXP (x, 0, 0);
15136 }
15137 if (GET_CODE (x) == SET)
15138 x = XEXP (x, 1);
15139 gcc_assert (GET_CODE (x) == CALL);
15140
15141 return x;
15142 }
15143
15144 /* REG is set in DEF. See if the definition is one of the ways we load a
15145 register with a symbol address for a mips_use_pic_fn_addr_reg_p call.
15146 If it is, return the symbol reference of the function, otherwise return
15147 NULL_RTX.
15148
15149 If RECURSE_P is true, use mips_find_pic_call_symbol to interpret
15150 the values of source registers, otherwise treat such registers as
15151 having an unknown value. */
15152
15153 static rtx
15154 mips_pic_call_symbol_from_set (df_ref def, rtx reg, bool recurse_p)
15155 {
15156 rtx def_insn, set;
15157
15158 if (DF_REF_IS_ARTIFICIAL (def))
15159 return NULL_RTX;
15160
15161 def_insn = DF_REF_INSN (def);
15162 set = single_set (def_insn);
15163 if (set && rtx_equal_p (SET_DEST (set), reg))
15164 {
15165 rtx note, src, symbol;
15166
15167 /* First see whether the source is a plain symbol. This is used
15168 when calling symbols that are not lazily bound. */
15169 src = SET_SRC (set);
15170 if (GET_CODE (src) == SYMBOL_REF)
15171 return src;
15172
15173 /* Handle %call16 references. */
15174 symbol = mips_strip_unspec_call (src);
15175 if (symbol)
15176 {
15177 gcc_assert (GET_CODE (symbol) == SYMBOL_REF);
15178 return symbol;
15179 }
15180
15181 /* If we have something more complicated, look for a
15182 REG_EQUAL or REG_EQUIV note. */
15183 note = find_reg_equal_equiv_note (def_insn);
15184 if (note && GET_CODE (XEXP (note, 0)) == SYMBOL_REF)
15185 return XEXP (note, 0);
15186
15187 /* Follow at most one simple register copy. Such copies are
15188 interesting in cases like:
15189
15190 for (...)
15191 {
15192 locally_binding_fn (...);
15193 }
15194
15195 and:
15196
15197 locally_binding_fn (...);
15198 ...
15199 locally_binding_fn (...);
15200
15201 where the load of locally_binding_fn can legitimately be
15202 hoisted or shared. However, we do not expect to see complex
15203 chains of copies, so a full worklist solution to the problem
15204 would probably be overkill. */
15205 if (recurse_p && REG_P (src))
15206 return mips_find_pic_call_symbol (def_insn, src, false);
15207 }
15208
15209 return NULL_RTX;
15210 }
15211
15212 /* Find the definition of the use of REG in INSN. See if the definition
15213 is one of the ways we load a register with a symbol address for a
15214 mips_use_pic_fn_addr_reg_p call. If it is return the symbol reference
15215 of the function, otherwise return NULL_RTX. RECURSE_P is as for
15216 mips_pic_call_symbol_from_set. */
15217
15218 static rtx
15219 mips_find_pic_call_symbol (rtx insn, rtx reg, bool recurse_p)
15220 {
15221 df_ref use;
15222 struct df_link *defs;
15223 rtx symbol;
15224
15225 use = df_find_use (insn, regno_reg_rtx[REGNO (reg)]);
15226 if (!use)
15227 return NULL_RTX;
15228 defs = DF_REF_CHAIN (use);
15229 if (!defs)
15230 return NULL_RTX;
15231 symbol = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p);
15232 if (!symbol)
15233 return NULL_RTX;
15234
15235 /* If we have more than one definition, they need to be identical. */
15236 for (defs = defs->next; defs; defs = defs->next)
15237 {
15238 rtx other;
15239
15240 other = mips_pic_call_symbol_from_set (defs->ref, reg, recurse_p);
15241 if (!rtx_equal_p (symbol, other))
15242 return NULL_RTX;
15243 }
15244
15245 return symbol;
15246 }
15247
15248 /* Replace the args_size operand of the call expression CALL with the
15249 call-attribute UNSPEC and fill in SYMBOL as the function symbol. */
15250
15251 static void
15252 mips_annotate_pic_call_expr (rtx call, rtx symbol)
15253 {
15254 rtx args_size;
15255
15256 args_size = XEXP (call, 1);
15257 XEXP (call, 1) = gen_rtx_UNSPEC (GET_MODE (args_size),
15258 gen_rtvec (2, args_size, symbol),
15259 UNSPEC_CALL_ATTR);
15260 }
15261
15262 /* OPERANDS[ARGS_SIZE_OPNO] is the arg_size operand of a CALL expression. See
15263 if instead of the arg_size argument it contains the call attributes. If
15264 yes return true along with setting OPERANDS[ARGS_SIZE_OPNO] to the function
15265 symbol from the call attributes. Also return false if ARGS_SIZE_OPNO is
15266 -1. */
15267
15268 bool
15269 mips_get_pic_call_symbol (rtx *operands, int args_size_opno)
15270 {
15271 rtx args_size, symbol;
15272
15273 if (!TARGET_RELAX_PIC_CALLS || args_size_opno == -1)
15274 return false;
15275
15276 args_size = operands[args_size_opno];
15277 if (GET_CODE (args_size) != UNSPEC)
15278 return false;
15279 gcc_assert (XINT (args_size, 1) == UNSPEC_CALL_ATTR);
15280
15281 symbol = XVECEXP (args_size, 0, 1);
15282 gcc_assert (GET_CODE (symbol) == SYMBOL_REF);
15283
15284 operands[args_size_opno] = symbol;
15285 return true;
15286 }
15287
15288 /* Use DF to annotate PIC indirect calls with the function symbol they
15289 dispatch to. */
15290
15291 static void
15292 mips_annotate_pic_calls (void)
15293 {
15294 basic_block bb;
15295 rtx insn;
15296
15297 FOR_EACH_BB (bb)
15298 FOR_BB_INSNS (bb, insn)
15299 {
15300 rtx call, reg, symbol, second_call;
15301
15302 second_call = 0;
15303 call = mips_call_expr_from_insn (insn, &second_call);
15304 if (!call)
15305 continue;
15306 gcc_assert (MEM_P (XEXP (call, 0)));
15307 reg = XEXP (XEXP (call, 0), 0);
15308 if (!REG_P (reg))
15309 continue;
15310
15311 symbol = mips_find_pic_call_symbol (insn, reg, true);
15312 if (symbol)
15313 {
15314 mips_annotate_pic_call_expr (call, symbol);
15315 if (second_call)
15316 mips_annotate_pic_call_expr (second_call, symbol);
15317 }
15318 }
15319 }
15320 \f
15321 /* A temporary variable used by for_each_rtx callbacks, etc. */
15322 static rtx mips_sim_insn;
15323
15324 /* A structure representing the state of the processor pipeline.
15325 Used by the mips_sim_* family of functions. */
15326 struct mips_sim {
15327 /* The maximum number of instructions that can be issued in a cycle.
15328 (Caches mips_issue_rate.) */
15329 unsigned int issue_rate;
15330
15331 /* The current simulation time. */
15332 unsigned int time;
15333
15334 /* How many more instructions can be issued in the current cycle. */
15335 unsigned int insns_left;
15336
15337 /* LAST_SET[X].INSN is the last instruction to set register X.
15338 LAST_SET[X].TIME is the time at which that instruction was issued.
15339 INSN is null if no instruction has yet set register X. */
15340 struct {
15341 rtx insn;
15342 unsigned int time;
15343 } last_set[FIRST_PSEUDO_REGISTER];
15344
15345 /* The pipeline's current DFA state. */
15346 state_t dfa_state;
15347 };
15348
15349 /* Reset STATE to the initial simulation state. */
15350
15351 static void
15352 mips_sim_reset (struct mips_sim *state)
15353 {
15354 curr_state = state->dfa_state;
15355
15356 state->time = 0;
15357 state->insns_left = state->issue_rate;
15358 memset (&state->last_set, 0, sizeof (state->last_set));
15359 state_reset (curr_state);
15360
15361 targetm.sched.init (0, false, 0);
15362 advance_state (curr_state);
15363 }
15364
15365 /* Initialize STATE before its first use. DFA_STATE points to an
15366 allocated but uninitialized DFA state. */
15367
15368 static void
15369 mips_sim_init (struct mips_sim *state, state_t dfa_state)
15370 {
15371 if (targetm.sched.init_dfa_pre_cycle_insn)
15372 targetm.sched.init_dfa_pre_cycle_insn ();
15373
15374 if (targetm.sched.init_dfa_post_cycle_insn)
15375 targetm.sched.init_dfa_post_cycle_insn ();
15376
15377 state->issue_rate = mips_issue_rate ();
15378 state->dfa_state = dfa_state;
15379 mips_sim_reset (state);
15380 }
15381
15382 /* Advance STATE by one clock cycle. */
15383
15384 static void
15385 mips_sim_next_cycle (struct mips_sim *state)
15386 {
15387 curr_state = state->dfa_state;
15388
15389 state->time++;
15390 state->insns_left = state->issue_rate;
15391 advance_state (curr_state);
15392 }
15393
15394 /* Advance simulation state STATE until instruction INSN can read
15395 register REG. */
15396
15397 static void
15398 mips_sim_wait_reg (struct mips_sim *state, rtx insn, rtx reg)
15399 {
15400 unsigned int regno, end_regno;
15401
15402 end_regno = END_REGNO (reg);
15403 for (regno = REGNO (reg); regno < end_regno; regno++)
15404 if (state->last_set[regno].insn != 0)
15405 {
15406 unsigned int t;
15407
15408 t = (state->last_set[regno].time
15409 + insn_latency (state->last_set[regno].insn, insn));
15410 while (state->time < t)
15411 mips_sim_next_cycle (state);
15412 }
15413 }
15414
15415 /* A for_each_rtx callback. If *X is a register, advance simulation state
15416 DATA until mips_sim_insn can read the register's value. */
15417
15418 static int
15419 mips_sim_wait_regs_2 (rtx *x, void *data)
15420 {
15421 if (REG_P (*x))
15422 mips_sim_wait_reg ((struct mips_sim *) data, mips_sim_insn, *x);
15423 return 0;
15424 }
15425
15426 /* Call mips_sim_wait_regs_2 (R, DATA) for each register R mentioned in *X. */
15427
15428 static void
15429 mips_sim_wait_regs_1 (rtx *x, void *data)
15430 {
15431 for_each_rtx (x, mips_sim_wait_regs_2, data);
15432 }
15433
15434 /* Advance simulation state STATE until all of INSN's register
15435 dependencies are satisfied. */
15436
15437 static void
15438 mips_sim_wait_regs (struct mips_sim *state, rtx insn)
15439 {
15440 mips_sim_insn = insn;
15441 note_uses (&PATTERN (insn), mips_sim_wait_regs_1, state);
15442 }
15443
15444 /* Advance simulation state STATE until the units required by
15445 instruction INSN are available. */
15446
15447 static void
15448 mips_sim_wait_units (struct mips_sim *state, rtx insn)
15449 {
15450 state_t tmp_state;
15451
15452 tmp_state = alloca (state_size ());
15453 while (state->insns_left == 0
15454 || (memcpy (tmp_state, state->dfa_state, state_size ()),
15455 state_transition (tmp_state, insn) >= 0))
15456 mips_sim_next_cycle (state);
15457 }
15458
15459 /* Advance simulation state STATE until INSN is ready to issue. */
15460
15461 static void
15462 mips_sim_wait_insn (struct mips_sim *state, rtx insn)
15463 {
15464 mips_sim_wait_regs (state, insn);
15465 mips_sim_wait_units (state, insn);
15466 }
15467
15468 /* mips_sim_insn has just set X. Update the LAST_SET array
15469 in simulation state DATA. */
15470
15471 static void
15472 mips_sim_record_set (rtx x, const_rtx pat ATTRIBUTE_UNUSED, void *data)
15473 {
15474 struct mips_sim *state;
15475
15476 state = (struct mips_sim *) data;
15477 if (REG_P (x))
15478 {
15479 unsigned int regno, end_regno;
15480
15481 end_regno = END_REGNO (x);
15482 for (regno = REGNO (x); regno < end_regno; regno++)
15483 {
15484 state->last_set[regno].insn = mips_sim_insn;
15485 state->last_set[regno].time = state->time;
15486 }
15487 }
15488 }
15489
15490 /* Issue instruction INSN in scheduler state STATE. Assume that INSN
15491 can issue immediately (i.e., that mips_sim_wait_insn has already
15492 been called). */
15493
15494 static void
15495 mips_sim_issue_insn (struct mips_sim *state, rtx insn)
15496 {
15497 curr_state = state->dfa_state;
15498
15499 state_transition (curr_state, insn);
15500 state->insns_left = targetm.sched.variable_issue (0, false, insn,
15501 state->insns_left);
15502
15503 mips_sim_insn = insn;
15504 note_stores (PATTERN (insn), mips_sim_record_set, state);
15505 }
15506
15507 /* Simulate issuing a NOP in state STATE. */
15508
15509 static void
15510 mips_sim_issue_nop (struct mips_sim *state)
15511 {
15512 if (state->insns_left == 0)
15513 mips_sim_next_cycle (state);
15514 state->insns_left--;
15515 }
15516
15517 /* Update simulation state STATE so that it's ready to accept the instruction
15518 after INSN. INSN should be part of the main rtl chain, not a member of a
15519 SEQUENCE. */
15520
15521 static void
15522 mips_sim_finish_insn (struct mips_sim *state, rtx insn)
15523 {
15524 /* If INSN is a jump with an implicit delay slot, simulate a nop. */
15525 if (JUMP_P (insn))
15526 mips_sim_issue_nop (state);
15527
15528 switch (GET_CODE (SEQ_BEGIN (insn)))
15529 {
15530 case CODE_LABEL:
15531 case CALL_INSN:
15532 /* We can't predict the processor state after a call or label. */
15533 mips_sim_reset (state);
15534 break;
15535
15536 case JUMP_INSN:
15537 /* The delay slots of branch likely instructions are only executed
15538 when the branch is taken. Therefore, if the caller has simulated
15539 the delay slot instruction, STATE does not really reflect the state
15540 of the pipeline for the instruction after the delay slot. Also,
15541 branch likely instructions tend to incur a penalty when not taken,
15542 so there will probably be an extra delay between the branch and
15543 the instruction after the delay slot. */
15544 if (INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (insn)))
15545 mips_sim_reset (state);
15546 break;
15547
15548 default:
15549 break;
15550 }
15551 }
15552
15553 /* Use simulator state STATE to calculate the execution time of
15554 instruction sequence SEQ. */
15555
15556 static unsigned int
15557 mips_seq_time (struct mips_sim *state, rtx seq)
15558 {
15559 mips_sim_reset (state);
15560 for (rtx insn = seq; insn; insn = NEXT_INSN (insn))
15561 {
15562 mips_sim_wait_insn (state, insn);
15563 mips_sim_issue_insn (state, insn);
15564 }
15565 return state->time;
15566 }
15567 \f
15568 /* Return the execution-time cost of mips_tuning_info.fast_mult_zero_zero_p
15569 setting SETTING, using STATE to simulate instruction sequences. */
15570
15571 static unsigned int
15572 mips_mult_zero_zero_cost (struct mips_sim *state, bool setting)
15573 {
15574 mips_tuning_info.fast_mult_zero_zero_p = setting;
15575 start_sequence ();
15576
15577 enum machine_mode dword_mode = TARGET_64BIT ? TImode : DImode;
15578 rtx hilo = gen_rtx_REG (dword_mode, MD_REG_FIRST);
15579 mips_emit_move_or_split (hilo, const0_rtx, SPLIT_FOR_SPEED);
15580
15581 /* If the target provides mulsidi3_32bit then that's the most likely
15582 consumer of the result. Test for bypasses. */
15583 if (dword_mode == DImode && HAVE_maddsidi4)
15584 {
15585 rtx gpr = gen_rtx_REG (SImode, GP_REG_FIRST + 4);
15586 emit_insn (gen_maddsidi4 (hilo, gpr, gpr, hilo));
15587 }
15588
15589 unsigned int time = mips_seq_time (state, get_insns ());
15590 end_sequence ();
15591 return time;
15592 }
15593
15594 /* Check the relative speeds of "MULT $0,$0" and "MTLO $0; MTHI $0"
15595 and set up mips_tuning_info.fast_mult_zero_zero_p accordingly.
15596 Prefer MULT -- which is shorter -- in the event of a tie. */
15597
15598 static void
15599 mips_set_fast_mult_zero_zero_p (struct mips_sim *state)
15600 {
15601 if (TARGET_MIPS16)
15602 /* No MTLO or MTHI available. */
15603 mips_tuning_info.fast_mult_zero_zero_p = true;
15604 else
15605 {
15606 unsigned int true_time = mips_mult_zero_zero_cost (state, true);
15607 unsigned int false_time = mips_mult_zero_zero_cost (state, false);
15608 mips_tuning_info.fast_mult_zero_zero_p = (true_time <= false_time);
15609 }
15610 }
15611
15612 /* Set up costs based on the current architecture and tuning settings. */
15613
15614 static void
15615 mips_set_tuning_info (void)
15616 {
15617 if (mips_tuning_info.initialized_p
15618 && mips_tuning_info.arch == mips_arch
15619 && mips_tuning_info.tune == mips_tune
15620 && mips_tuning_info.mips16_p == TARGET_MIPS16)
15621 return;
15622
15623 mips_tuning_info.arch = mips_arch;
15624 mips_tuning_info.tune = mips_tune;
15625 mips_tuning_info.mips16_p = TARGET_MIPS16;
15626 mips_tuning_info.initialized_p = true;
15627
15628 dfa_start ();
15629
15630 struct mips_sim state;
15631 mips_sim_init (&state, alloca (state_size ()));
15632
15633 mips_set_fast_mult_zero_zero_p (&state);
15634
15635 dfa_finish ();
15636 }
15637
15638 /* Implement TARGET_EXPAND_TO_RTL_HOOK. */
15639
15640 static void
15641 mips_expand_to_rtl_hook (void)
15642 {
15643 /* We need to call this at a point where we can safely create sequences
15644 of instructions, so TARGET_OVERRIDE_OPTIONS is too early. We also
15645 need to call it at a point where the DFA infrastructure is not
15646 already in use, so we can't just call it lazily on demand.
15647
15648 At present, mips_tuning_info is only needed during post-expand
15649 RTL passes such as split_insns, so this hook should be early enough.
15650 We may need to move the call elsewhere if mips_tuning_info starts
15651 to be used for other things (such as rtx_costs, or expanders that
15652 could be called during gimple optimization). */
15653 mips_set_tuning_info ();
15654 }
15655 \f
15656 /* The VR4130 pipeline issues aligned pairs of instructions together,
15657 but it stalls the second instruction if it depends on the first.
15658 In order to cut down the amount of logic required, this dependence
15659 check is not based on a full instruction decode. Instead, any non-SPECIAL
15660 instruction is assumed to modify the register specified by bits 20-16
15661 (which is usually the "rt" field).
15662
15663 In BEQ, BEQL, BNE and BNEL instructions, the rt field is actually an
15664 input, so we can end up with a false dependence between the branch
15665 and its delay slot. If this situation occurs in instruction INSN,
15666 try to avoid it by swapping rs and rt. */
15667
15668 static void
15669 vr4130_avoid_branch_rt_conflict (rtx insn)
15670 {
15671 rtx first, second;
15672
15673 first = SEQ_BEGIN (insn);
15674 second = SEQ_END (insn);
15675 if (JUMP_P (first)
15676 && NONJUMP_INSN_P (second)
15677 && GET_CODE (PATTERN (first)) == SET
15678 && GET_CODE (SET_DEST (PATTERN (first))) == PC
15679 && GET_CODE (SET_SRC (PATTERN (first))) == IF_THEN_ELSE)
15680 {
15681 /* Check for the right kind of condition. */
15682 rtx cond = XEXP (SET_SRC (PATTERN (first)), 0);
15683 if ((GET_CODE (cond) == EQ || GET_CODE (cond) == NE)
15684 && REG_P (XEXP (cond, 0))
15685 && REG_P (XEXP (cond, 1))
15686 && reg_referenced_p (XEXP (cond, 1), PATTERN (second))
15687 && !reg_referenced_p (XEXP (cond, 0), PATTERN (second)))
15688 {
15689 /* SECOND mentions the rt register but not the rs register. */
15690 rtx tmp = XEXP (cond, 0);
15691 XEXP (cond, 0) = XEXP (cond, 1);
15692 XEXP (cond, 1) = tmp;
15693 }
15694 }
15695 }
15696
15697 /* Implement -mvr4130-align. Go through each basic block and simulate the
15698 processor pipeline. If we find that a pair of instructions could execute
15699 in parallel, and the first of those instructions is not 8-byte aligned,
15700 insert a nop to make it aligned. */
15701
15702 static void
15703 vr4130_align_insns (void)
15704 {
15705 struct mips_sim state;
15706 rtx insn, subinsn, last, last2, next;
15707 bool aligned_p;
15708
15709 dfa_start ();
15710
15711 /* LAST is the last instruction before INSN to have a nonzero length.
15712 LAST2 is the last such instruction before LAST. */
15713 last = 0;
15714 last2 = 0;
15715
15716 /* ALIGNED_P is true if INSN is known to be at an aligned address. */
15717 aligned_p = true;
15718
15719 mips_sim_init (&state, alloca (state_size ()));
15720 for (insn = get_insns (); insn != 0; insn = next)
15721 {
15722 unsigned int length;
15723
15724 next = NEXT_INSN (insn);
15725
15726 /* See the comment above vr4130_avoid_branch_rt_conflict for details.
15727 This isn't really related to the alignment pass, but we do it on
15728 the fly to avoid a separate instruction walk. */
15729 vr4130_avoid_branch_rt_conflict (insn);
15730
15731 length = get_attr_length (insn);
15732 if (length > 0 && USEFUL_INSN_P (insn))
15733 FOR_EACH_SUBINSN (subinsn, insn)
15734 {
15735 mips_sim_wait_insn (&state, subinsn);
15736
15737 /* If we want this instruction to issue in parallel with the
15738 previous one, make sure that the previous instruction is
15739 aligned. There are several reasons why this isn't worthwhile
15740 when the second instruction is a call:
15741
15742 - Calls are less likely to be performance critical,
15743 - There's a good chance that the delay slot can execute
15744 in parallel with the call.
15745 - The return address would then be unaligned.
15746
15747 In general, if we're going to insert a nop between instructions
15748 X and Y, it's better to insert it immediately after X. That
15749 way, if the nop makes Y aligned, it will also align any labels
15750 between X and Y. */
15751 if (state.insns_left != state.issue_rate
15752 && !CALL_P (subinsn))
15753 {
15754 if (subinsn == SEQ_BEGIN (insn) && aligned_p)
15755 {
15756 /* SUBINSN is the first instruction in INSN and INSN is
15757 aligned. We want to align the previous instruction
15758 instead, so insert a nop between LAST2 and LAST.
15759
15760 Note that LAST could be either a single instruction
15761 or a branch with a delay slot. In the latter case,
15762 LAST, like INSN, is already aligned, but the delay
15763 slot must have some extra delay that stops it from
15764 issuing at the same time as the branch. We therefore
15765 insert a nop before the branch in order to align its
15766 delay slot. */
15767 gcc_assert (last2);
15768 emit_insn_after (gen_nop (), last2);
15769 aligned_p = false;
15770 }
15771 else if (subinsn != SEQ_BEGIN (insn) && !aligned_p)
15772 {
15773 /* SUBINSN is the delay slot of INSN, but INSN is
15774 currently unaligned. Insert a nop between
15775 LAST and INSN to align it. */
15776 gcc_assert (last);
15777 emit_insn_after (gen_nop (), last);
15778 aligned_p = true;
15779 }
15780 }
15781 mips_sim_issue_insn (&state, subinsn);
15782 }
15783 mips_sim_finish_insn (&state, insn);
15784
15785 /* Update LAST, LAST2 and ALIGNED_P for the next instruction. */
15786 length = get_attr_length (insn);
15787 if (length > 0)
15788 {
15789 /* If the instruction is an asm statement or multi-instruction
15790 mips.md patern, the length is only an estimate. Insert an
15791 8 byte alignment after it so that the following instructions
15792 can be handled correctly. */
15793 if (NONJUMP_INSN_P (SEQ_BEGIN (insn))
15794 && (recog_memoized (insn) < 0 || length >= 8))
15795 {
15796 next = emit_insn_after (gen_align (GEN_INT (3)), insn);
15797 next = NEXT_INSN (next);
15798 mips_sim_next_cycle (&state);
15799 aligned_p = true;
15800 }
15801 else if (length & 4)
15802 aligned_p = !aligned_p;
15803 last2 = last;
15804 last = insn;
15805 }
15806
15807 /* See whether INSN is an aligned label. */
15808 if (LABEL_P (insn) && label_to_alignment (insn) >= 3)
15809 aligned_p = true;
15810 }
15811 dfa_finish ();
15812 }
15813 \f
15814 /* This structure records that the current function has a LO_SUM
15815 involving SYMBOL_REF or LABEL_REF BASE and that MAX_OFFSET is
15816 the largest offset applied to BASE by all such LO_SUMs. */
15817 struct mips_lo_sum_offset {
15818 rtx base;
15819 HOST_WIDE_INT offset;
15820 };
15821
15822 /* Return a hash value for SYMBOL_REF or LABEL_REF BASE. */
15823
15824 static hashval_t
15825 mips_hash_base (rtx base)
15826 {
15827 int do_not_record_p;
15828
15829 return hash_rtx (base, GET_MODE (base), &do_not_record_p, NULL, false);
15830 }
15831
15832 /* Hashtable helpers. */
15833
15834 struct mips_lo_sum_offset_hasher : typed_free_remove <mips_lo_sum_offset>
15835 {
15836 typedef mips_lo_sum_offset value_type;
15837 typedef rtx_def compare_type;
15838 static inline hashval_t hash (const value_type *);
15839 static inline bool equal (const value_type *, const compare_type *);
15840 };
15841
15842 /* Hash-table callbacks for mips_lo_sum_offsets. */
15843
15844 inline hashval_t
15845 mips_lo_sum_offset_hasher::hash (const value_type *entry)
15846 {
15847 return mips_hash_base (entry->base);
15848 }
15849
15850 inline bool
15851 mips_lo_sum_offset_hasher::equal (const value_type *entry,
15852 const compare_type *value)
15853 {
15854 return rtx_equal_p (entry->base, value);
15855 }
15856
15857 typedef hash_table <mips_lo_sum_offset_hasher> mips_offset_table;
15858
15859 /* Look up symbolic constant X in HTAB, which is a hash table of
15860 mips_lo_sum_offsets. If OPTION is NO_INSERT, return true if X can be
15861 paired with a recorded LO_SUM, otherwise record X in the table. */
15862
15863 static bool
15864 mips_lo_sum_offset_lookup (mips_offset_table htab, rtx x,
15865 enum insert_option option)
15866 {
15867 rtx base, offset;
15868 mips_lo_sum_offset **slot;
15869 struct mips_lo_sum_offset *entry;
15870
15871 /* Split X into a base and offset. */
15872 split_const (x, &base, &offset);
15873 if (UNSPEC_ADDRESS_P (base))
15874 base = UNSPEC_ADDRESS (base);
15875
15876 /* Look up the base in the hash table. */
15877 slot = htab.find_slot_with_hash (base, mips_hash_base (base), option);
15878 if (slot == NULL)
15879 return false;
15880
15881 entry = (struct mips_lo_sum_offset *) *slot;
15882 if (option == INSERT)
15883 {
15884 if (entry == NULL)
15885 {
15886 entry = XNEW (struct mips_lo_sum_offset);
15887 entry->base = base;
15888 entry->offset = INTVAL (offset);
15889 *slot = entry;
15890 }
15891 else
15892 {
15893 if (INTVAL (offset) > entry->offset)
15894 entry->offset = INTVAL (offset);
15895 }
15896 }
15897 return INTVAL (offset) <= entry->offset;
15898 }
15899
15900 /* A for_each_rtx callback for which DATA is a mips_lo_sum_offset hash table.
15901 Record every LO_SUM in *LOC. */
15902
15903 static int
15904 mips_record_lo_sum (rtx *loc, void *data)
15905 {
15906 if (GET_CODE (*loc) == LO_SUM)
15907 mips_lo_sum_offset_lookup (*(mips_offset_table*) data,
15908 XEXP (*loc, 1), INSERT);
15909 return 0;
15910 }
15911
15912 /* Return true if INSN is a SET of an orphaned high-part relocation.
15913 HTAB is a hash table of mips_lo_sum_offsets that describes all the
15914 LO_SUMs in the current function. */
15915
15916 static bool
15917 mips_orphaned_high_part_p (mips_offset_table htab, rtx insn)
15918 {
15919 enum mips_symbol_type type;
15920 rtx x, set;
15921
15922 set = single_set (insn);
15923 if (set)
15924 {
15925 /* Check for %his. */
15926 x = SET_SRC (set);
15927 if (GET_CODE (x) == HIGH
15928 && absolute_symbolic_operand (XEXP (x, 0), VOIDmode))
15929 return !mips_lo_sum_offset_lookup (htab, XEXP (x, 0), NO_INSERT);
15930
15931 /* Check for local %gots (and %got_pages, which is redundant but OK). */
15932 if (GET_CODE (x) == UNSPEC
15933 && XINT (x, 1) == UNSPEC_LOAD_GOT
15934 && mips_symbolic_constant_p (XVECEXP (x, 0, 1),
15935 SYMBOL_CONTEXT_LEA, &type)
15936 && type == SYMBOL_GOTOFF_PAGE)
15937 return !mips_lo_sum_offset_lookup (htab, XVECEXP (x, 0, 1), NO_INSERT);
15938 }
15939 return false;
15940 }
15941
15942 /* Subroutine of mips_reorg_process_insns. If there is a hazard between
15943 INSN and a previous instruction, avoid it by inserting nops after
15944 instruction AFTER.
15945
15946 *DELAYED_REG and *HILO_DELAY describe the hazards that apply at
15947 this point. If *DELAYED_REG is non-null, INSN must wait a cycle
15948 before using the value of that register. *HILO_DELAY counts the
15949 number of instructions since the last hilo hazard (that is,
15950 the number of instructions since the last MFLO or MFHI).
15951
15952 After inserting nops for INSN, update *DELAYED_REG and *HILO_DELAY
15953 for the next instruction.
15954
15955 LO_REG is an rtx for the LO register, used in dependence checking. */
15956
15957 static void
15958 mips_avoid_hazard (rtx after, rtx insn, int *hilo_delay,
15959 rtx *delayed_reg, rtx lo_reg)
15960 {
15961 rtx pattern, set;
15962 int nops, ninsns;
15963
15964 pattern = PATTERN (insn);
15965
15966 /* Do not put the whole function in .set noreorder if it contains
15967 an asm statement. We don't know whether there will be hazards
15968 between the asm statement and the gcc-generated code. */
15969 if (GET_CODE (pattern) == ASM_INPUT || asm_noperands (pattern) >= 0)
15970 cfun->machine->all_noreorder_p = false;
15971
15972 /* Ignore zero-length instructions (barriers and the like). */
15973 ninsns = get_attr_length (insn) / 4;
15974 if (ninsns == 0)
15975 return;
15976
15977 /* Work out how many nops are needed. Note that we only care about
15978 registers that are explicitly mentioned in the instruction's pattern.
15979 It doesn't matter that calls use the argument registers or that they
15980 clobber hi and lo. */
15981 if (*hilo_delay < 2 && reg_set_p (lo_reg, pattern))
15982 nops = 2 - *hilo_delay;
15983 else if (*delayed_reg != 0 && reg_referenced_p (*delayed_reg, pattern))
15984 nops = 1;
15985 else
15986 nops = 0;
15987
15988 /* Insert the nops between this instruction and the previous one.
15989 Each new nop takes us further from the last hilo hazard. */
15990 *hilo_delay += nops;
15991 while (nops-- > 0)
15992 emit_insn_after (gen_hazard_nop (), after);
15993
15994 /* Set up the state for the next instruction. */
15995 *hilo_delay += ninsns;
15996 *delayed_reg = 0;
15997 if (INSN_CODE (insn) >= 0)
15998 switch (get_attr_hazard (insn))
15999 {
16000 case HAZARD_NONE:
16001 break;
16002
16003 case HAZARD_HILO:
16004 *hilo_delay = 0;
16005 break;
16006
16007 case HAZARD_DELAY:
16008 set = single_set (insn);
16009 gcc_assert (set);
16010 *delayed_reg = SET_DEST (set);
16011 break;
16012 }
16013 }
16014
16015 /* Go through the instruction stream and insert nops where necessary.
16016 Also delete any high-part relocations whose partnering low parts
16017 are now all dead. See if the whole function can then be put into
16018 .set noreorder and .set nomacro. */
16019
16020 static void
16021 mips_reorg_process_insns (void)
16022 {
16023 rtx insn, last_insn, subinsn, next_insn, lo_reg, delayed_reg;
16024 int hilo_delay;
16025 mips_offset_table htab;
16026
16027 /* Force all instructions to be split into their final form. */
16028 split_all_insns_noflow ();
16029
16030 /* Recalculate instruction lengths without taking nops into account. */
16031 cfun->machine->ignore_hazard_length_p = true;
16032 shorten_branches (get_insns ());
16033
16034 cfun->machine->all_noreorder_p = true;
16035
16036 /* We don't track MIPS16 PC-relative offsets closely enough to make
16037 a good job of "set .noreorder" code in MIPS16 mode. */
16038 if (TARGET_MIPS16)
16039 cfun->machine->all_noreorder_p = false;
16040
16041 /* Code that doesn't use explicit relocs can't be ".set nomacro". */
16042 if (!TARGET_EXPLICIT_RELOCS)
16043 cfun->machine->all_noreorder_p = false;
16044
16045 /* Profiled functions can't be all noreorder because the profiler
16046 support uses assembler macros. */
16047 if (crtl->profile)
16048 cfun->machine->all_noreorder_p = false;
16049
16050 /* Code compiled with -mfix-vr4120 or -mfix-24k can't be all noreorder
16051 because we rely on the assembler to work around some errata.
16052 The r5900 too has several bugs. */
16053 if (TARGET_FIX_VR4120 || TARGET_FIX_24K || TARGET_MIPS5900)
16054 cfun->machine->all_noreorder_p = false;
16055
16056 /* The same is true for -mfix-vr4130 if we might generate MFLO or
16057 MFHI instructions. Note that we avoid using MFLO and MFHI if
16058 the VR4130 MACC and DMACC instructions are available instead;
16059 see the *mfhilo_{si,di}_macc patterns. */
16060 if (TARGET_FIX_VR4130 && !ISA_HAS_MACCHI)
16061 cfun->machine->all_noreorder_p = false;
16062
16063 htab.create (37);
16064
16065 /* Make a first pass over the instructions, recording all the LO_SUMs. */
16066 for (insn = get_insns (); insn != 0; insn = NEXT_INSN (insn))
16067 FOR_EACH_SUBINSN (subinsn, insn)
16068 if (USEFUL_INSN_P (subinsn))
16069 for_each_rtx (&PATTERN (subinsn), mips_record_lo_sum, &htab);
16070
16071 last_insn = 0;
16072 hilo_delay = 2;
16073 delayed_reg = 0;
16074 lo_reg = gen_rtx_REG (SImode, LO_REGNUM);
16075
16076 /* Make a second pass over the instructions. Delete orphaned
16077 high-part relocations or turn them into NOPs. Avoid hazards
16078 by inserting NOPs. */
16079 for (insn = get_insns (); insn != 0; insn = next_insn)
16080 {
16081 next_insn = NEXT_INSN (insn);
16082 if (USEFUL_INSN_P (insn))
16083 {
16084 if (GET_CODE (PATTERN (insn)) == SEQUENCE)
16085 {
16086 /* If we find an orphaned high-part relocation in a delay
16087 slot, it's easier to turn that instruction into a NOP than
16088 to delete it. The delay slot will be a NOP either way. */
16089 FOR_EACH_SUBINSN (subinsn, insn)
16090 if (INSN_P (subinsn))
16091 {
16092 if (mips_orphaned_high_part_p (htab, subinsn))
16093 {
16094 PATTERN (subinsn) = gen_nop ();
16095 INSN_CODE (subinsn) = CODE_FOR_nop;
16096 }
16097 mips_avoid_hazard (last_insn, subinsn, &hilo_delay,
16098 &delayed_reg, lo_reg);
16099 }
16100 last_insn = insn;
16101 }
16102 else
16103 {
16104 /* INSN is a single instruction. Delete it if it's an
16105 orphaned high-part relocation. */
16106 if (mips_orphaned_high_part_p (htab, insn))
16107 delete_insn (insn);
16108 /* Also delete cache barriers if the last instruction
16109 was an annulled branch. INSN will not be speculatively
16110 executed. */
16111 else if (recog_memoized (insn) == CODE_FOR_r10k_cache_barrier
16112 && last_insn
16113 && JUMP_P (SEQ_BEGIN (last_insn))
16114 && INSN_ANNULLED_BRANCH_P (SEQ_BEGIN (last_insn)))
16115 delete_insn (insn);
16116 else
16117 {
16118 mips_avoid_hazard (last_insn, insn, &hilo_delay,
16119 &delayed_reg, lo_reg);
16120 last_insn = insn;
16121 }
16122 }
16123 }
16124 }
16125
16126 htab.dispose ();
16127 }
16128
16129 /* Return true if the function has a long branch instruction. */
16130
16131 static bool
16132 mips_has_long_branch_p (void)
16133 {
16134 rtx insn, subinsn;
16135 int normal_length;
16136
16137 /* We need up-to-date instruction lengths. */
16138 shorten_branches (get_insns ());
16139
16140 /* Look for a branch that is longer than normal. The normal length for
16141 non-MIPS16 branches is 8, because the length includes the delay slot.
16142 It is 4 for MIPS16, because MIPS16 branches are extended instructions,
16143 but they have no delay slot. */
16144 normal_length = (TARGET_MIPS16 ? 4 : 8);
16145 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
16146 FOR_EACH_SUBINSN (subinsn, insn)
16147 if (JUMP_P (subinsn)
16148 && get_attr_length (subinsn) > normal_length
16149 && (any_condjump_p (subinsn) || any_uncondjump_p (subinsn)))
16150 return true;
16151
16152 return false;
16153 }
16154
16155 /* If we are using a GOT, but have not decided to use a global pointer yet,
16156 see whether we need one to implement long branches. Convert the ghost
16157 global-pointer instructions into real ones if so. */
16158
16159 static bool
16160 mips_expand_ghost_gp_insns (void)
16161 {
16162 /* Quick exit if we already know that we will or won't need a
16163 global pointer. */
16164 if (!TARGET_USE_GOT
16165 || cfun->machine->global_pointer == INVALID_REGNUM
16166 || mips_must_initialize_gp_p ())
16167 return false;
16168
16169 /* Run a full check for long branches. */
16170 if (!mips_has_long_branch_p ())
16171 return false;
16172
16173 /* We've now established that we need $gp. */
16174 cfun->machine->must_initialize_gp_p = true;
16175 split_all_insns_noflow ();
16176
16177 return true;
16178 }
16179
16180 /* Subroutine of mips_reorg to manage passes that require DF. */
16181
16182 static void
16183 mips_df_reorg (void)
16184 {
16185 /* Create def-use chains. */
16186 df_set_flags (DF_EQ_NOTES);
16187 df_chain_add_problem (DF_UD_CHAIN);
16188 df_analyze ();
16189
16190 if (TARGET_RELAX_PIC_CALLS)
16191 mips_annotate_pic_calls ();
16192
16193 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE)
16194 r10k_insert_cache_barriers ();
16195
16196 df_finish_pass (false);
16197 }
16198
16199 /* Emit code to load LABEL_REF SRC into MIPS16 register DEST. This is
16200 called very late in mips_reorg, but the caller is required to run
16201 mips16_lay_out_constants on the result. */
16202
16203 static void
16204 mips16_load_branch_target (rtx dest, rtx src)
16205 {
16206 if (TARGET_ABICALLS && !TARGET_ABSOLUTE_ABICALLS)
16207 {
16208 rtx page, low;
16209
16210 if (mips_cfun_has_cprestore_slot_p ())
16211 mips_emit_move (dest, mips_cprestore_slot (dest, true));
16212 else
16213 mips_emit_move (dest, pic_offset_table_rtx);
16214 page = mips_unspec_address (src, SYMBOL_GOTOFF_PAGE);
16215 low = mips_unspec_address (src, SYMBOL_GOT_PAGE_OFST);
16216 emit_insn (gen_rtx_SET (VOIDmode, dest,
16217 PMODE_INSN (gen_unspec_got, (dest, page))));
16218 emit_insn (gen_rtx_SET (VOIDmode, dest,
16219 gen_rtx_LO_SUM (Pmode, dest, low)));
16220 }
16221 else
16222 {
16223 src = mips_unspec_address (src, SYMBOL_ABSOLUTE);
16224 mips_emit_move (dest, src);
16225 }
16226 }
16227
16228 /* If we're compiling a MIPS16 function, look for and split any long branches.
16229 This must be called after all other instruction modifications in
16230 mips_reorg. */
16231
16232 static void
16233 mips16_split_long_branches (void)
16234 {
16235 bool something_changed;
16236
16237 if (!TARGET_MIPS16)
16238 return;
16239
16240 /* Loop until the alignments for all targets are sufficient. */
16241 do
16242 {
16243 rtx insn;
16244
16245 shorten_branches (get_insns ());
16246 something_changed = false;
16247 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
16248 if (JUMP_P (insn)
16249 && get_attr_length (insn) > 4
16250 && (any_condjump_p (insn) || any_uncondjump_p (insn)))
16251 {
16252 rtx old_label, new_label, temp, saved_temp;
16253 rtx target, jump, jump_sequence;
16254
16255 start_sequence ();
16256
16257 /* Free up a MIPS16 register by saving it in $1. */
16258 saved_temp = gen_rtx_REG (Pmode, AT_REGNUM);
16259 temp = gen_rtx_REG (Pmode, GP_REG_FIRST + 2);
16260 emit_move_insn (saved_temp, temp);
16261
16262 /* Load the branch target into TEMP. */
16263 old_label = JUMP_LABEL (insn);
16264 target = gen_rtx_LABEL_REF (Pmode, old_label);
16265 mips16_load_branch_target (temp, target);
16266
16267 /* Jump to the target and restore the register's
16268 original value. */
16269 jump = emit_jump_insn (PMODE_INSN (gen_indirect_jump_and_restore,
16270 (temp, temp, saved_temp)));
16271 JUMP_LABEL (jump) = old_label;
16272 LABEL_NUSES (old_label)++;
16273
16274 /* Rewrite any symbolic references that are supposed to use
16275 a PC-relative constant pool. */
16276 mips16_lay_out_constants (false);
16277
16278 if (simplejump_p (insn))
16279 /* We're going to replace INSN with a longer form. */
16280 new_label = NULL_RTX;
16281 else
16282 {
16283 /* Create a branch-around label for the original
16284 instruction. */
16285 new_label = gen_label_rtx ();
16286 emit_label (new_label);
16287 }
16288
16289 jump_sequence = get_insns ();
16290 end_sequence ();
16291
16292 emit_insn_after (jump_sequence, insn);
16293 if (new_label)
16294 invert_jump (insn, new_label, false);
16295 else
16296 delete_insn (insn);
16297 something_changed = true;
16298 }
16299 }
16300 while (something_changed);
16301 }
16302
16303 /* Implement TARGET_MACHINE_DEPENDENT_REORG. */
16304
16305 static void
16306 mips_reorg (void)
16307 {
16308 /* Restore the BLOCK_FOR_INSN pointers, which are needed by DF. Also during
16309 insn splitting in mips16_lay_out_constants, DF insn info is only kept up
16310 to date if the CFG is available. */
16311 if (mips_cfg_in_reorg ())
16312 compute_bb_for_insn ();
16313 mips16_lay_out_constants (true);
16314 if (mips_cfg_in_reorg ())
16315 {
16316 mips_df_reorg ();
16317 free_bb_for_insn ();
16318 }
16319 }
16320
16321 /* We use a machine specific pass to do a second machine dependent reorg
16322 pass after delay branch scheduling. */
16323
16324 static unsigned int
16325 mips_machine_reorg2 (void)
16326 {
16327 mips_reorg_process_insns ();
16328 if (!TARGET_MIPS16
16329 && TARGET_EXPLICIT_RELOCS
16330 && TUNE_MIPS4130
16331 && TARGET_VR4130_ALIGN)
16332 vr4130_align_insns ();
16333 if (mips_expand_ghost_gp_insns ())
16334 /* The expansion could invalidate some of the VR4130 alignment
16335 optimizations, but this should be an extremely rare case anyhow. */
16336 mips_reorg_process_insns ();
16337 mips16_split_long_branches ();
16338 return 0;
16339 }
16340
16341 namespace {
16342
16343 const pass_data pass_data_mips_machine_reorg2 =
16344 {
16345 RTL_PASS, /* type */
16346 "mach2", /* name */
16347 OPTGROUP_NONE, /* optinfo_flags */
16348 false, /* has_gate */
16349 true, /* has_execute */
16350 TV_MACH_DEP, /* tv_id */
16351 0, /* properties_required */
16352 0, /* properties_provided */
16353 0, /* properties_destroyed */
16354 0, /* todo_flags_start */
16355 TODO_verify_rtl_sharing, /* todo_flags_finish */
16356 };
16357
16358 class pass_mips_machine_reorg2 : public rtl_opt_pass
16359 {
16360 public:
16361 pass_mips_machine_reorg2(gcc::context *ctxt)
16362 : rtl_opt_pass(pass_data_mips_machine_reorg2, ctxt)
16363 {}
16364
16365 /* opt_pass methods: */
16366 unsigned int execute () { return mips_machine_reorg2 (); }
16367
16368 }; // class pass_mips_machine_reorg2
16369
16370 } // anon namespace
16371
16372 rtl_opt_pass *
16373 make_pass_mips_machine_reorg2 (gcc::context *ctxt)
16374 {
16375 return new pass_mips_machine_reorg2 (ctxt);
16376 }
16377
16378 \f
16379 /* Implement TARGET_ASM_OUTPUT_MI_THUNK. Generate rtl rather than asm text
16380 in order to avoid duplicating too much logic from elsewhere. */
16381
16382 static void
16383 mips_output_mi_thunk (FILE *file, tree thunk_fndecl ATTRIBUTE_UNUSED,
16384 HOST_WIDE_INT delta, HOST_WIDE_INT vcall_offset,
16385 tree function)
16386 {
16387 rtx this_rtx, temp1, temp2, insn, fnaddr;
16388 bool use_sibcall_p;
16389
16390 /* Pretend to be a post-reload pass while generating rtl. */
16391 reload_completed = 1;
16392
16393 /* Mark the end of the (empty) prologue. */
16394 emit_note (NOTE_INSN_PROLOGUE_END);
16395
16396 /* Determine if we can use a sibcall to call FUNCTION directly. */
16397 fnaddr = XEXP (DECL_RTL (function), 0);
16398 use_sibcall_p = (mips_function_ok_for_sibcall (function, NULL)
16399 && const_call_insn_operand (fnaddr, Pmode));
16400
16401 /* Determine if we need to load FNADDR from the GOT. */
16402 if (!use_sibcall_p
16403 && (mips_got_symbol_type_p
16404 (mips_classify_symbol (fnaddr, SYMBOL_CONTEXT_LEA))))
16405 {
16406 /* Pick a global pointer. Use a call-clobbered register if
16407 TARGET_CALL_SAVED_GP. */
16408 cfun->machine->global_pointer
16409 = TARGET_CALL_SAVED_GP ? 15 : GLOBAL_POINTER_REGNUM;
16410 cfun->machine->must_initialize_gp_p = true;
16411 SET_REGNO (pic_offset_table_rtx, cfun->machine->global_pointer);
16412
16413 /* Set up the global pointer for n32 or n64 abicalls. */
16414 mips_emit_loadgp ();
16415 }
16416
16417 /* We need two temporary registers in some cases. */
16418 temp1 = gen_rtx_REG (Pmode, 2);
16419 temp2 = gen_rtx_REG (Pmode, 3);
16420
16421 /* Find out which register contains the "this" pointer. */
16422 if (aggregate_value_p (TREE_TYPE (TREE_TYPE (function)), function))
16423 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST + 1);
16424 else
16425 this_rtx = gen_rtx_REG (Pmode, GP_ARG_FIRST);
16426
16427 /* Add DELTA to THIS_RTX. */
16428 if (delta != 0)
16429 {
16430 rtx offset = GEN_INT (delta);
16431 if (!SMALL_OPERAND (delta))
16432 {
16433 mips_emit_move (temp1, offset);
16434 offset = temp1;
16435 }
16436 emit_insn (gen_add3_insn (this_rtx, this_rtx, offset));
16437 }
16438
16439 /* If needed, add *(*THIS_RTX + VCALL_OFFSET) to THIS_RTX. */
16440 if (vcall_offset != 0)
16441 {
16442 rtx addr;
16443
16444 /* Set TEMP1 to *THIS_RTX. */
16445 mips_emit_move (temp1, gen_rtx_MEM (Pmode, this_rtx));
16446
16447 /* Set ADDR to a legitimate address for *THIS_RTX + VCALL_OFFSET. */
16448 addr = mips_add_offset (temp2, temp1, vcall_offset);
16449
16450 /* Load the offset and add it to THIS_RTX. */
16451 mips_emit_move (temp1, gen_rtx_MEM (Pmode, addr));
16452 emit_insn (gen_add3_insn (this_rtx, this_rtx, temp1));
16453 }
16454
16455 /* Jump to the target function. Use a sibcall if direct jumps are
16456 allowed, otherwise load the address into a register first. */
16457 if (use_sibcall_p)
16458 {
16459 insn = emit_call_insn (gen_sibcall_internal (fnaddr, const0_rtx));
16460 SIBLING_CALL_P (insn) = 1;
16461 }
16462 else
16463 {
16464 /* This is messy. GAS treats "la $25,foo" as part of a call
16465 sequence and may allow a global "foo" to be lazily bound.
16466 The general move patterns therefore reject this combination.
16467
16468 In this context, lazy binding would actually be OK
16469 for TARGET_CALL_CLOBBERED_GP, but it's still wrong for
16470 TARGET_CALL_SAVED_GP; see mips_load_call_address.
16471 We must therefore load the address via a temporary
16472 register if mips_dangerous_for_la25_p.
16473
16474 If we jump to the temporary register rather than $25,
16475 the assembler can use the move insn to fill the jump's
16476 delay slot.
16477
16478 We can use the same technique for MIPS16 code, where $25
16479 is not a valid JR register. */
16480 if (TARGET_USE_PIC_FN_ADDR_REG
16481 && !TARGET_MIPS16
16482 && !mips_dangerous_for_la25_p (fnaddr))
16483 temp1 = gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM);
16484 mips_load_call_address (MIPS_CALL_SIBCALL, temp1, fnaddr);
16485
16486 if (TARGET_USE_PIC_FN_ADDR_REG
16487 && REGNO (temp1) != PIC_FUNCTION_ADDR_REGNUM)
16488 mips_emit_move (gen_rtx_REG (Pmode, PIC_FUNCTION_ADDR_REGNUM), temp1);
16489 emit_jump_insn (gen_indirect_jump (temp1));
16490 }
16491
16492 /* Run just enough of rest_of_compilation. This sequence was
16493 "borrowed" from alpha.c. */
16494 insn = get_insns ();
16495 split_all_insns_noflow ();
16496 mips16_lay_out_constants (true);
16497 shorten_branches (insn);
16498 final_start_function (insn, file, 1);
16499 final (insn, file, 1);
16500 final_end_function ();
16501
16502 /* Clean up the vars set above. Note that final_end_function resets
16503 the global pointer for us. */
16504 reload_completed = 0;
16505 }
16506 \f
16507
16508 /* The last argument passed to mips_set_compression_mode,
16509 or negative if the function hasn't been called yet. */
16510 static unsigned int old_compression_mode = -1;
16511
16512 /* Set up the target-dependent global state for ISA mode COMPRESSION_MODE,
16513 which is either MASK_MIPS16 or MASK_MICROMIPS. */
16514
16515 static void
16516 mips_set_compression_mode (unsigned int compression_mode)
16517 {
16518
16519 if (compression_mode == old_compression_mode)
16520 return;
16521
16522 /* Restore base settings of various flags. */
16523 target_flags = mips_base_target_flags;
16524 flag_schedule_insns = mips_base_schedule_insns;
16525 flag_reorder_blocks_and_partition = mips_base_reorder_blocks_and_partition;
16526 flag_move_loop_invariants = mips_base_move_loop_invariants;
16527 align_loops = mips_base_align_loops;
16528 align_jumps = mips_base_align_jumps;
16529 align_functions = mips_base_align_functions;
16530 target_flags &= ~(MASK_MIPS16 | MASK_MICROMIPS);
16531 target_flags |= compression_mode;
16532
16533 if (compression_mode & MASK_MIPS16)
16534 {
16535 /* Switch to MIPS16 mode. */
16536 target_flags |= MASK_MIPS16;
16537
16538 /* Turn off SYNCI if it was on, MIPS16 doesn't support it. */
16539 target_flags &= ~MASK_SYNCI;
16540
16541 /* Don't run the scheduler before reload, since it tends to
16542 increase register pressure. */
16543 flag_schedule_insns = 0;
16544
16545 /* Don't do hot/cold partitioning. mips16_lay_out_constants expects
16546 the whole function to be in a single section. */
16547 flag_reorder_blocks_and_partition = 0;
16548
16549 /* Don't move loop invariants, because it tends to increase
16550 register pressure. It also introduces an extra move in cases
16551 where the constant is the first operand in a two-operand binary
16552 instruction, or when it forms a register argument to a functon
16553 call. */
16554 flag_move_loop_invariants = 0;
16555
16556 target_flags |= MASK_EXPLICIT_RELOCS;
16557
16558 /* Experiments suggest we get the best overall section-anchor
16559 results from using the range of an unextended LW or SW. Code
16560 that makes heavy use of byte or short accesses can do better
16561 with ranges of 0...31 and 0...63 respectively, but most code is
16562 sensitive to the range of LW and SW instead. */
16563 targetm.min_anchor_offset = 0;
16564 targetm.max_anchor_offset = 127;
16565
16566 targetm.const_anchor = 0;
16567
16568 /* MIPS16 has no BAL instruction. */
16569 target_flags &= ~MASK_RELAX_PIC_CALLS;
16570
16571 /* The R4000 errata don't apply to any known MIPS16 cores.
16572 It's simpler to make the R4000 fixes and MIPS16 mode
16573 mutually exclusive. */
16574 target_flags &= ~MASK_FIX_R4000;
16575
16576 if (flag_pic && !TARGET_OLDABI)
16577 sorry ("MIPS16 PIC for ABIs other than o32 and o64");
16578
16579 if (TARGET_XGOT)
16580 sorry ("MIPS16 -mxgot code");
16581
16582 if (TARGET_HARD_FLOAT_ABI && !TARGET_OLDABI)
16583 sorry ("hard-float MIPS16 code for ABIs other than o32 and o64");
16584 }
16585 else
16586 {
16587 /* Switch to microMIPS or the standard encoding. */
16588
16589 if (TARGET_MICROMIPS)
16590 /* Avoid branch likely. */
16591 target_flags &= ~MASK_BRANCHLIKELY;
16592
16593 /* Provide default values for align_* for 64-bit targets. */
16594 if (TARGET_64BIT)
16595 {
16596 if (align_loops == 0)
16597 align_loops = 8;
16598 if (align_jumps == 0)
16599 align_jumps = 8;
16600 if (align_functions == 0)
16601 align_functions = 8;
16602 }
16603
16604 targetm.min_anchor_offset = -32768;
16605 targetm.max_anchor_offset = 32767;
16606
16607 targetm.const_anchor = 0x8000;
16608 }
16609
16610 /* (Re)initialize MIPS target internals for new ISA. */
16611 mips_init_relocs ();
16612
16613 if (compression_mode & MASK_MIPS16)
16614 {
16615 if (!mips16_globals)
16616 mips16_globals = save_target_globals_default_opts ();
16617 else
16618 restore_target_globals (mips16_globals);
16619 }
16620 else
16621 restore_target_globals (&default_target_globals);
16622
16623 old_compression_mode = compression_mode;
16624 }
16625
16626 /* Implement TARGET_SET_CURRENT_FUNCTION. Decide whether the current
16627 function should use the MIPS16 or microMIPS ISA and switch modes
16628 accordingly. */
16629
16630 static void
16631 mips_set_current_function (tree fndecl)
16632 {
16633 mips_set_compression_mode (mips_get_compress_mode (fndecl));
16634 }
16635 \f
16636 /* Allocate a chunk of memory for per-function machine-dependent data. */
16637
16638 static struct machine_function *
16639 mips_init_machine_status (void)
16640 {
16641 return ggc_alloc_cleared_machine_function ();
16642 }
16643
16644 /* Return the processor associated with the given ISA level, or null
16645 if the ISA isn't valid. */
16646
16647 static const struct mips_cpu_info *
16648 mips_cpu_info_from_isa (int isa)
16649 {
16650 unsigned int i;
16651
16652 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
16653 if (mips_cpu_info_table[i].isa == isa)
16654 return mips_cpu_info_table + i;
16655
16656 return NULL;
16657 }
16658
16659 /* Return a mips_cpu_info entry determined by an option valued
16660 OPT. */
16661
16662 static const struct mips_cpu_info *
16663 mips_cpu_info_from_opt (int opt)
16664 {
16665 switch (opt)
16666 {
16667 case MIPS_ARCH_OPTION_FROM_ABI:
16668 /* 'from-abi' selects the most compatible architecture for the
16669 given ABI: MIPS I for 32-bit ABIs and MIPS III for 64-bit
16670 ABIs. For the EABIs, we have to decide whether we're using
16671 the 32-bit or 64-bit version. */
16672 return mips_cpu_info_from_isa (ABI_NEEDS_32BIT_REGS ? 1
16673 : ABI_NEEDS_64BIT_REGS ? 3
16674 : (TARGET_64BIT ? 3 : 1));
16675
16676 case MIPS_ARCH_OPTION_NATIVE:
16677 gcc_unreachable ();
16678
16679 default:
16680 return &mips_cpu_info_table[opt];
16681 }
16682 }
16683
16684 /* Return a default mips_cpu_info entry, given that no -march= option
16685 was explicitly specified. */
16686
16687 static const struct mips_cpu_info *
16688 mips_default_arch (void)
16689 {
16690 #if defined (MIPS_CPU_STRING_DEFAULT)
16691 unsigned int i;
16692 for (i = 0; i < ARRAY_SIZE (mips_cpu_info_table); i++)
16693 if (strcmp (mips_cpu_info_table[i].name, MIPS_CPU_STRING_DEFAULT) == 0)
16694 return mips_cpu_info_table + i;
16695 gcc_unreachable ();
16696 #elif defined (MIPS_ISA_DEFAULT)
16697 return mips_cpu_info_from_isa (MIPS_ISA_DEFAULT);
16698 #else
16699 /* 'from-abi' makes a good default: you get whatever the ABI
16700 requires. */
16701 return mips_cpu_info_from_opt (MIPS_ARCH_OPTION_FROM_ABI);
16702 #endif
16703 }
16704
16705 /* Set up globals to generate code for the ISA or processor
16706 described by INFO. */
16707
16708 static void
16709 mips_set_architecture (const struct mips_cpu_info *info)
16710 {
16711 if (info != 0)
16712 {
16713 mips_arch_info = info;
16714 mips_arch = info->cpu;
16715 mips_isa = info->isa;
16716 }
16717 }
16718
16719 /* Likewise for tuning. */
16720
16721 static void
16722 mips_set_tune (const struct mips_cpu_info *info)
16723 {
16724 if (info != 0)
16725 {
16726 mips_tune_info = info;
16727 mips_tune = info->cpu;
16728 }
16729 }
16730
16731 /* Implement TARGET_OPTION_OVERRIDE. */
16732
16733 static void
16734 mips_option_override (void)
16735 {
16736 int i, start, regno, mode;
16737
16738 if (global_options_set.x_mips_isa_option)
16739 mips_isa_option_info = &mips_cpu_info_table[mips_isa_option];
16740
16741 #ifdef SUBTARGET_OVERRIDE_OPTIONS
16742 SUBTARGET_OVERRIDE_OPTIONS;
16743 #endif
16744
16745 /* MIPS16 and microMIPS cannot coexist. */
16746 if (TARGET_MICROMIPS && TARGET_MIPS16)
16747 error ("unsupported combination: %s", "-mips16 -mmicromips");
16748
16749 /* Save the base compression state and process flags as though we
16750 were generating uncompressed code. */
16751 mips_base_compression_flags = TARGET_COMPRESSION;
16752 target_flags &= ~TARGET_COMPRESSION;
16753
16754 /* -mno-float overrides -mhard-float and -msoft-float. */
16755 if (TARGET_NO_FLOAT)
16756 {
16757 target_flags |= MASK_SOFT_FLOAT_ABI;
16758 target_flags_explicit |= MASK_SOFT_FLOAT_ABI;
16759 }
16760
16761 if (TARGET_FLIP_MIPS16)
16762 TARGET_INTERLINK_COMPRESSED = 1;
16763
16764 /* Set the small data limit. */
16765 mips_small_data_threshold = (global_options_set.x_g_switch_value
16766 ? g_switch_value
16767 : MIPS_DEFAULT_GVALUE);
16768
16769 /* The following code determines the architecture and register size.
16770 Similar code was added to GAS 2.14 (see tc-mips.c:md_after_parse_args()).
16771 The GAS and GCC code should be kept in sync as much as possible. */
16772
16773 if (global_options_set.x_mips_arch_option)
16774 mips_set_architecture (mips_cpu_info_from_opt (mips_arch_option));
16775
16776 if (mips_isa_option_info != 0)
16777 {
16778 if (mips_arch_info == 0)
16779 mips_set_architecture (mips_isa_option_info);
16780 else if (mips_arch_info->isa != mips_isa_option_info->isa)
16781 error ("%<-%s%> conflicts with the other architecture options, "
16782 "which specify a %s processor",
16783 mips_isa_option_info->name,
16784 mips_cpu_info_from_isa (mips_arch_info->isa)->name);
16785 }
16786
16787 if (mips_arch_info == 0)
16788 mips_set_architecture (mips_default_arch ());
16789
16790 if (ABI_NEEDS_64BIT_REGS && !ISA_HAS_64BIT_REGS)
16791 error ("%<-march=%s%> is not compatible with the selected ABI",
16792 mips_arch_info->name);
16793
16794 /* Optimize for mips_arch, unless -mtune selects a different processor. */
16795 if (global_options_set.x_mips_tune_option)
16796 mips_set_tune (mips_cpu_info_from_opt (mips_tune_option));
16797
16798 if (mips_tune_info == 0)
16799 mips_set_tune (mips_arch_info);
16800
16801 if ((target_flags_explicit & MASK_64BIT) != 0)
16802 {
16803 /* The user specified the size of the integer registers. Make sure
16804 it agrees with the ABI and ISA. */
16805 if (TARGET_64BIT && !ISA_HAS_64BIT_REGS)
16806 error ("%<-mgp64%> used with a 32-bit processor");
16807 else if (!TARGET_64BIT && ABI_NEEDS_64BIT_REGS)
16808 error ("%<-mgp32%> used with a 64-bit ABI");
16809 else if (TARGET_64BIT && ABI_NEEDS_32BIT_REGS)
16810 error ("%<-mgp64%> used with a 32-bit ABI");
16811 }
16812 else
16813 {
16814 /* Infer the integer register size from the ABI and processor.
16815 Restrict ourselves to 32-bit registers if that's all the
16816 processor has, or if the ABI cannot handle 64-bit registers. */
16817 if (ABI_NEEDS_32BIT_REGS || !ISA_HAS_64BIT_REGS)
16818 target_flags &= ~MASK_64BIT;
16819 else
16820 target_flags |= MASK_64BIT;
16821 }
16822
16823 if ((target_flags_explicit & MASK_FLOAT64) != 0)
16824 {
16825 if (TARGET_SINGLE_FLOAT && TARGET_FLOAT64)
16826 error ("unsupported combination: %s", "-mfp64 -msingle-float");
16827 else if (TARGET_64BIT && TARGET_DOUBLE_FLOAT && !TARGET_FLOAT64)
16828 error ("unsupported combination: %s", "-mgp64 -mfp32 -mdouble-float");
16829 else if (!TARGET_64BIT && TARGET_FLOAT64)
16830 {
16831 if (!ISA_HAS_MXHC1)
16832 error ("%<-mgp32%> and %<-mfp64%> can only be combined if"
16833 " the target supports the mfhc1 and mthc1 instructions");
16834 else if (mips_abi != ABI_32)
16835 error ("%<-mgp32%> and %<-mfp64%> can only be combined when using"
16836 " the o32 ABI");
16837 }
16838 }
16839 else
16840 {
16841 /* -msingle-float selects 32-bit float registers. Otherwise the
16842 float registers should be the same size as the integer ones. */
16843 if (TARGET_64BIT && TARGET_DOUBLE_FLOAT)
16844 target_flags |= MASK_FLOAT64;
16845 else
16846 target_flags &= ~MASK_FLOAT64;
16847 }
16848
16849 /* End of code shared with GAS. */
16850
16851 /* The R5900 FPU only supports single precision. */
16852 if (TARGET_MIPS5900 && TARGET_HARD_FLOAT_ABI && TARGET_DOUBLE_FLOAT)
16853 error ("unsupported combination: %s",
16854 "-march=r5900 -mhard-float -mdouble-float");
16855
16856 /* If a -mlong* option was given, check that it matches the ABI,
16857 otherwise infer the -mlong* setting from the other options. */
16858 if ((target_flags_explicit & MASK_LONG64) != 0)
16859 {
16860 if (TARGET_LONG64)
16861 {
16862 if (mips_abi == ABI_N32)
16863 error ("%qs is incompatible with %qs", "-mabi=n32", "-mlong64");
16864 else if (mips_abi == ABI_32)
16865 error ("%qs is incompatible with %qs", "-mabi=32", "-mlong64");
16866 else if (mips_abi == ABI_O64 && TARGET_ABICALLS)
16867 /* We have traditionally allowed non-abicalls code to use
16868 an LP64 form of o64. However, it would take a bit more
16869 effort to support the combination of 32-bit GOT entries
16870 and 64-bit pointers, so we treat the abicalls case as
16871 an error. */
16872 error ("the combination of %qs and %qs is incompatible with %qs",
16873 "-mabi=o64", "-mabicalls", "-mlong64");
16874 }
16875 else
16876 {
16877 if (mips_abi == ABI_64)
16878 error ("%qs is incompatible with %qs", "-mabi=64", "-mlong32");
16879 }
16880 }
16881 else
16882 {
16883 if ((mips_abi == ABI_EABI && TARGET_64BIT) || mips_abi == ABI_64)
16884 target_flags |= MASK_LONG64;
16885 else
16886 target_flags &= ~MASK_LONG64;
16887 }
16888
16889 if (!TARGET_OLDABI)
16890 flag_pcc_struct_return = 0;
16891
16892 /* Decide which rtx_costs structure to use. */
16893 if (optimize_size)
16894 mips_cost = &mips_rtx_cost_optimize_size;
16895 else
16896 mips_cost = &mips_rtx_cost_data[mips_tune];
16897
16898 /* If the user hasn't specified a branch cost, use the processor's
16899 default. */
16900 if (mips_branch_cost == 0)
16901 mips_branch_cost = mips_cost->branch_cost;
16902
16903 /* If neither -mbranch-likely nor -mno-branch-likely was given
16904 on the command line, set MASK_BRANCHLIKELY based on the target
16905 architecture and tuning flags. Annulled delay slots are a
16906 size win, so we only consider the processor-specific tuning
16907 for !optimize_size. */
16908 if ((target_flags_explicit & MASK_BRANCHLIKELY) == 0)
16909 {
16910 if (ISA_HAS_BRANCHLIKELY
16911 && (optimize_size
16912 || (mips_tune_info->tune_flags & PTF_AVOID_BRANCHLIKELY) == 0))
16913 target_flags |= MASK_BRANCHLIKELY;
16914 else
16915 target_flags &= ~MASK_BRANCHLIKELY;
16916 }
16917 else if (TARGET_BRANCHLIKELY && !ISA_HAS_BRANCHLIKELY)
16918 warning (0, "the %qs architecture does not support branch-likely"
16919 " instructions", mips_arch_info->name);
16920
16921 /* If the user hasn't specified -mimadd or -mno-imadd set
16922 MASK_IMADD based on the target architecture and tuning
16923 flags. */
16924 if ((target_flags_explicit & MASK_IMADD) == 0)
16925 {
16926 if (ISA_HAS_MADD_MSUB &&
16927 (mips_tune_info->tune_flags & PTF_AVOID_IMADD) == 0)
16928 target_flags |= MASK_IMADD;
16929 else
16930 target_flags &= ~MASK_IMADD;
16931 }
16932 else if (TARGET_IMADD && !ISA_HAS_MADD_MSUB)
16933 warning (0, "the %qs architecture does not support madd or msub"
16934 " instructions", mips_arch_info->name);
16935
16936 /* The effect of -mabicalls isn't defined for the EABI. */
16937 if (mips_abi == ABI_EABI && TARGET_ABICALLS)
16938 {
16939 error ("unsupported combination: %s", "-mabicalls -mabi=eabi");
16940 target_flags &= ~MASK_ABICALLS;
16941 }
16942
16943 /* PIC requires -mabicalls. */
16944 if (flag_pic)
16945 {
16946 if (mips_abi == ABI_EABI)
16947 error ("cannot generate position-independent code for %qs",
16948 "-mabi=eabi");
16949 else if (!TARGET_ABICALLS)
16950 error ("position-independent code requires %qs", "-mabicalls");
16951 }
16952
16953 if (TARGET_ABICALLS_PIC2)
16954 /* We need to set flag_pic for executables as well as DSOs
16955 because we may reference symbols that are not defined in
16956 the final executable. (MIPS does not use things like
16957 copy relocs, for example.)
16958
16959 There is a body of code that uses __PIC__ to distinguish
16960 between -mabicalls and -mno-abicalls code. The non-__PIC__
16961 variant is usually appropriate for TARGET_ABICALLS_PIC0, as
16962 long as any indirect jumps use $25. */
16963 flag_pic = 1;
16964
16965 /* -mvr4130-align is a "speed over size" optimization: it usually produces
16966 faster code, but at the expense of more nops. Enable it at -O3 and
16967 above. */
16968 if (optimize > 2 && (target_flags_explicit & MASK_VR4130_ALIGN) == 0)
16969 target_flags |= MASK_VR4130_ALIGN;
16970
16971 /* Prefer a call to memcpy over inline code when optimizing for size,
16972 though see MOVE_RATIO in mips.h. */
16973 if (optimize_size && (target_flags_explicit & MASK_MEMCPY) == 0)
16974 target_flags |= MASK_MEMCPY;
16975
16976 /* If we have a nonzero small-data limit, check that the -mgpopt
16977 setting is consistent with the other target flags. */
16978 if (mips_small_data_threshold > 0)
16979 {
16980 if (!TARGET_GPOPT)
16981 {
16982 if (!TARGET_EXPLICIT_RELOCS)
16983 error ("%<-mno-gpopt%> needs %<-mexplicit-relocs%>");
16984
16985 TARGET_LOCAL_SDATA = false;
16986 TARGET_EXTERN_SDATA = false;
16987 }
16988 else
16989 {
16990 if (TARGET_VXWORKS_RTP)
16991 warning (0, "cannot use small-data accesses for %qs", "-mrtp");
16992
16993 if (TARGET_ABICALLS)
16994 warning (0, "cannot use small-data accesses for %qs",
16995 "-mabicalls");
16996 }
16997 }
16998
16999 /* Pre-IEEE 754-2008 MIPS hardware has a quirky almost-IEEE format
17000 for all its floating point. */
17001 if (mips_nan != MIPS_IEEE_754_2008)
17002 {
17003 REAL_MODE_FORMAT (SFmode) = &mips_single_format;
17004 REAL_MODE_FORMAT (DFmode) = &mips_double_format;
17005 REAL_MODE_FORMAT (TFmode) = &mips_quad_format;
17006 }
17007
17008 /* Make sure that the user didn't turn off paired single support when
17009 MIPS-3D support is requested. */
17010 if (TARGET_MIPS3D
17011 && (target_flags_explicit & MASK_PAIRED_SINGLE_FLOAT)
17012 && !TARGET_PAIRED_SINGLE_FLOAT)
17013 error ("%<-mips3d%> requires %<-mpaired-single%>");
17014
17015 /* If TARGET_MIPS3D, enable MASK_PAIRED_SINGLE_FLOAT. */
17016 if (TARGET_MIPS3D)
17017 target_flags |= MASK_PAIRED_SINGLE_FLOAT;
17018
17019 /* Make sure that when TARGET_PAIRED_SINGLE_FLOAT is true, TARGET_FLOAT64
17020 and TARGET_HARD_FLOAT_ABI are both true. */
17021 if (TARGET_PAIRED_SINGLE_FLOAT && !(TARGET_FLOAT64 && TARGET_HARD_FLOAT_ABI))
17022 error ("%qs must be used with %qs",
17023 TARGET_MIPS3D ? "-mips3d" : "-mpaired-single",
17024 TARGET_HARD_FLOAT_ABI ? "-mfp64" : "-mhard-float");
17025
17026 /* Make sure that the ISA supports TARGET_PAIRED_SINGLE_FLOAT when it is
17027 enabled. */
17028 if (TARGET_PAIRED_SINGLE_FLOAT && !ISA_HAS_PAIRED_SINGLE)
17029 warning (0, "the %qs architecture does not support paired-single"
17030 " instructions", mips_arch_info->name);
17031
17032 if (mips_r10k_cache_barrier != R10K_CACHE_BARRIER_NONE
17033 && !TARGET_CACHE_BUILTIN)
17034 {
17035 error ("%qs requires a target that provides the %qs instruction",
17036 "-mr10k-cache-barrier", "cache");
17037 mips_r10k_cache_barrier = R10K_CACHE_BARRIER_NONE;
17038 }
17039
17040 /* If TARGET_DSPR2, enable MASK_DSP. */
17041 if (TARGET_DSPR2)
17042 target_flags |= MASK_DSP;
17043
17044 /* .eh_frame addresses should be the same width as a C pointer.
17045 Most MIPS ABIs support only one pointer size, so the assembler
17046 will usually know exactly how big an .eh_frame address is.
17047
17048 Unfortunately, this is not true of the 64-bit EABI. The ABI was
17049 originally defined to use 64-bit pointers (i.e. it is LP64), and
17050 this is still the default mode. However, we also support an n32-like
17051 ILP32 mode, which is selected by -mlong32. The problem is that the
17052 assembler has traditionally not had an -mlong option, so it has
17053 traditionally not known whether we're using the ILP32 or LP64 form.
17054
17055 As it happens, gas versions up to and including 2.19 use _32-bit_
17056 addresses for EABI64 .cfi_* directives. This is wrong for the
17057 default LP64 mode, so we can't use the directives by default.
17058 Moreover, since gas's current behavior is at odds with gcc's
17059 default behavior, it seems unwise to rely on future versions
17060 of gas behaving the same way. We therefore avoid using .cfi
17061 directives for -mlong32 as well. */
17062 if (mips_abi == ABI_EABI && TARGET_64BIT)
17063 flag_dwarf2_cfi_asm = 0;
17064
17065 /* .cfi_* directives generate a read-only section, so fall back on
17066 manual .eh_frame creation if we need the section to be writable. */
17067 if (TARGET_WRITABLE_EH_FRAME)
17068 flag_dwarf2_cfi_asm = 0;
17069
17070 mips_init_print_operand_punct ();
17071
17072 /* Set up array to map GCC register number to debug register number.
17073 Ignore the special purpose register numbers. */
17074
17075 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
17076 {
17077 mips_dbx_regno[i] = IGNORED_DWARF_REGNUM;
17078 if (GP_REG_P (i) || FP_REG_P (i) || ALL_COP_REG_P (i))
17079 mips_dwarf_regno[i] = i;
17080 else
17081 mips_dwarf_regno[i] = INVALID_REGNUM;
17082 }
17083
17084 start = GP_DBX_FIRST - GP_REG_FIRST;
17085 for (i = GP_REG_FIRST; i <= GP_REG_LAST; i++)
17086 mips_dbx_regno[i] = i + start;
17087
17088 start = FP_DBX_FIRST - FP_REG_FIRST;
17089 for (i = FP_REG_FIRST; i <= FP_REG_LAST; i++)
17090 mips_dbx_regno[i] = i + start;
17091
17092 /* Accumulator debug registers use big-endian ordering. */
17093 mips_dbx_regno[HI_REGNUM] = MD_DBX_FIRST + 0;
17094 mips_dbx_regno[LO_REGNUM] = MD_DBX_FIRST + 1;
17095 mips_dwarf_regno[HI_REGNUM] = MD_REG_FIRST + 0;
17096 mips_dwarf_regno[LO_REGNUM] = MD_REG_FIRST + 1;
17097 for (i = DSP_ACC_REG_FIRST; i <= DSP_ACC_REG_LAST; i += 2)
17098 {
17099 mips_dwarf_regno[i + TARGET_LITTLE_ENDIAN] = i;
17100 mips_dwarf_regno[i + TARGET_BIG_ENDIAN] = i + 1;
17101 }
17102
17103 /* Set up mips_hard_regno_mode_ok. */
17104 for (mode = 0; mode < MAX_MACHINE_MODE; mode++)
17105 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
17106 mips_hard_regno_mode_ok[mode][regno]
17107 = mips_hard_regno_mode_ok_p (regno, (enum machine_mode) mode);
17108
17109 /* Function to allocate machine-dependent function status. */
17110 init_machine_status = &mips_init_machine_status;
17111
17112 /* Default to working around R4000 errata only if the processor
17113 was selected explicitly. */
17114 if ((target_flags_explicit & MASK_FIX_R4000) == 0
17115 && strcmp (mips_arch_info->name, "r4000") == 0)
17116 target_flags |= MASK_FIX_R4000;
17117
17118 /* Default to working around R4400 errata only if the processor
17119 was selected explicitly. */
17120 if ((target_flags_explicit & MASK_FIX_R4400) == 0
17121 && strcmp (mips_arch_info->name, "r4400") == 0)
17122 target_flags |= MASK_FIX_R4400;
17123
17124 /* Default to working around R10000 errata only if the processor
17125 was selected explicitly. */
17126 if ((target_flags_explicit & MASK_FIX_R10000) == 0
17127 && strcmp (mips_arch_info->name, "r10000") == 0)
17128 target_flags |= MASK_FIX_R10000;
17129
17130 /* Make sure that branch-likely instructions available when using
17131 -mfix-r10000. The instructions are not available if either:
17132
17133 1. -mno-branch-likely was passed.
17134 2. The selected ISA does not support branch-likely and
17135 the command line does not include -mbranch-likely. */
17136 if (TARGET_FIX_R10000
17137 && ((target_flags_explicit & MASK_BRANCHLIKELY) == 0
17138 ? !ISA_HAS_BRANCHLIKELY
17139 : !TARGET_BRANCHLIKELY))
17140 sorry ("%qs requires branch-likely instructions", "-mfix-r10000");
17141
17142 if (TARGET_SYNCI && !ISA_HAS_SYNCI)
17143 {
17144 warning (0, "the %qs architecture does not support the synci "
17145 "instruction", mips_arch_info->name);
17146 target_flags &= ~MASK_SYNCI;
17147 }
17148
17149 /* Only optimize PIC indirect calls if they are actually required. */
17150 if (!TARGET_USE_GOT || !TARGET_EXPLICIT_RELOCS)
17151 target_flags &= ~MASK_RELAX_PIC_CALLS;
17152
17153 /* Save base state of options. */
17154 mips_base_target_flags = target_flags;
17155 mips_base_schedule_insns = flag_schedule_insns;
17156 mips_base_reorder_blocks_and_partition = flag_reorder_blocks_and_partition;
17157 mips_base_move_loop_invariants = flag_move_loop_invariants;
17158 mips_base_align_loops = align_loops;
17159 mips_base_align_jumps = align_jumps;
17160 mips_base_align_functions = align_functions;
17161
17162 /* Now select the ISA mode.
17163
17164 Do all CPP-sensitive stuff in uncompressed mode; we'll switch modes
17165 later if required. */
17166 mips_set_compression_mode (0);
17167
17168 /* We register a second machine specific reorg pass after delay slot
17169 filling. Registering the pass must be done at start up. It's
17170 convenient to do it here. */
17171 opt_pass *new_pass = make_pass_mips_machine_reorg2 (g);
17172 struct register_pass_info insert_pass_mips_machine_reorg2 =
17173 {
17174 new_pass, /* pass */
17175 "dbr", /* reference_pass_name */
17176 1, /* ref_pass_instance_number */
17177 PASS_POS_INSERT_AFTER /* po_op */
17178 };
17179 register_pass (&insert_pass_mips_machine_reorg2);
17180
17181 if (TARGET_HARD_FLOAT_ABI && TARGET_MIPS5900)
17182 REAL_MODE_FORMAT (SFmode) = &spu_single_format;
17183 }
17184
17185 /* Swap the register information for registers I and I + 1, which
17186 currently have the wrong endianness. Note that the registers'
17187 fixedness and call-clobberedness might have been set on the
17188 command line. */
17189
17190 static void
17191 mips_swap_registers (unsigned int i)
17192 {
17193 int tmpi;
17194 const char *tmps;
17195
17196 #define SWAP_INT(X, Y) (tmpi = (X), (X) = (Y), (Y) = tmpi)
17197 #define SWAP_STRING(X, Y) (tmps = (X), (X) = (Y), (Y) = tmps)
17198
17199 SWAP_INT (fixed_regs[i], fixed_regs[i + 1]);
17200 SWAP_INT (call_used_regs[i], call_used_regs[i + 1]);
17201 SWAP_INT (call_really_used_regs[i], call_really_used_regs[i + 1]);
17202 SWAP_STRING (reg_names[i], reg_names[i + 1]);
17203
17204 #undef SWAP_STRING
17205 #undef SWAP_INT
17206 }
17207
17208 /* Implement TARGET_CONDITIONAL_REGISTER_USAGE. */
17209
17210 static void
17211 mips_conditional_register_usage (void)
17212 {
17213
17214 if (ISA_HAS_DSP)
17215 {
17216 /* These DSP control register fields are global. */
17217 global_regs[CCDSP_PO_REGNUM] = 1;
17218 global_regs[CCDSP_SC_REGNUM] = 1;
17219 }
17220 else
17221 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17222 reg_class_contents[(int) DSP_ACC_REGS]);
17223
17224 if (!TARGET_HARD_FLOAT)
17225 {
17226 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17227 reg_class_contents[(int) FP_REGS]);
17228 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17229 reg_class_contents[(int) ST_REGS]);
17230 }
17231 else if (!ISA_HAS_8CC)
17232 {
17233 /* We only have a single condition-code register. We implement
17234 this by fixing all the condition-code registers and generating
17235 RTL that refers directly to ST_REG_FIRST. */
17236 AND_COMPL_HARD_REG_SET (accessible_reg_set,
17237 reg_class_contents[(int) ST_REGS]);
17238 SET_HARD_REG_BIT (accessible_reg_set, FPSW_REGNUM);
17239 fixed_regs[FPSW_REGNUM] = call_used_regs[FPSW_REGNUM] = 1;
17240 }
17241 if (TARGET_MIPS16)
17242 {
17243 /* In MIPS16 mode, we prohibit the unused $s registers, since they
17244 are call-saved, and saving them via a MIPS16 register would
17245 probably waste more time than just reloading the value.
17246
17247 We permit the $t temporary registers when optimizing for speed
17248 but not when optimizing for space because using them results in
17249 code that is larger (but faster) then not using them. We do
17250 allow $24 (t8) because it is used in CMP and CMPI instructions
17251 and $25 (t9) because it is used as the function call address in
17252 SVR4 PIC code. */
17253
17254 fixed_regs[18] = call_used_regs[18] = 1;
17255 fixed_regs[19] = call_used_regs[19] = 1;
17256 fixed_regs[20] = call_used_regs[20] = 1;
17257 fixed_regs[21] = call_used_regs[21] = 1;
17258 fixed_regs[22] = call_used_regs[22] = 1;
17259 fixed_regs[23] = call_used_regs[23] = 1;
17260 fixed_regs[26] = call_used_regs[26] = 1;
17261 fixed_regs[27] = call_used_regs[27] = 1;
17262 fixed_regs[30] = call_used_regs[30] = 1;
17263 if (optimize_size)
17264 {
17265 fixed_regs[8] = call_used_regs[8] = 1;
17266 fixed_regs[9] = call_used_regs[9] = 1;
17267 fixed_regs[10] = call_used_regs[10] = 1;
17268 fixed_regs[11] = call_used_regs[11] = 1;
17269 fixed_regs[12] = call_used_regs[12] = 1;
17270 fixed_regs[13] = call_used_regs[13] = 1;
17271 fixed_regs[14] = call_used_regs[14] = 1;
17272 fixed_regs[15] = call_used_regs[15] = 1;
17273 }
17274
17275 /* Do not allow HI and LO to be treated as register operands.
17276 There are no MTHI or MTLO instructions (or any real need
17277 for them) and one-way registers cannot easily be reloaded. */
17278 AND_COMPL_HARD_REG_SET (operand_reg_set,
17279 reg_class_contents[(int) MD_REGS]);
17280 }
17281 /* $f20-$f23 are call-clobbered for n64. */
17282 if (mips_abi == ABI_64)
17283 {
17284 int regno;
17285 for (regno = FP_REG_FIRST + 20; regno < FP_REG_FIRST + 24; regno++)
17286 call_really_used_regs[regno] = call_used_regs[regno] = 1;
17287 }
17288 /* Odd registers in the range $f21-$f31 (inclusive) are call-clobbered
17289 for n32. */
17290 if (mips_abi == ABI_N32)
17291 {
17292 int regno;
17293 for (regno = FP_REG_FIRST + 21; regno <= FP_REG_FIRST + 31; regno+=2)
17294 call_really_used_regs[regno] = call_used_regs[regno] = 1;
17295 }
17296 /* Make sure that double-register accumulator values are correctly
17297 ordered for the current endianness. */
17298 if (TARGET_LITTLE_ENDIAN)
17299 {
17300 unsigned int regno;
17301
17302 mips_swap_registers (MD_REG_FIRST);
17303 for (regno = DSP_ACC_REG_FIRST; regno <= DSP_ACC_REG_LAST; regno += 2)
17304 mips_swap_registers (regno);
17305 }
17306 }
17307
17308 /* When generating MIPS16 code, we want to allocate $24 (T_REG) before
17309 other registers for instructions for which it is possible. This
17310 encourages the compiler to use CMP in cases where an XOR would
17311 require some register shuffling. */
17312
17313 void
17314 mips_order_regs_for_local_alloc (void)
17315 {
17316 int i;
17317
17318 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
17319 reg_alloc_order[i] = i;
17320
17321 if (TARGET_MIPS16)
17322 {
17323 /* It really doesn't matter where we put register 0, since it is
17324 a fixed register anyhow. */
17325 reg_alloc_order[0] = 24;
17326 reg_alloc_order[24] = 0;
17327 }
17328 }
17329
17330 /* Implement EH_USES. */
17331
17332 bool
17333 mips_eh_uses (unsigned int regno)
17334 {
17335 if (reload_completed && !TARGET_ABSOLUTE_JUMPS)
17336 {
17337 /* We need to force certain registers to be live in order to handle
17338 PIC long branches correctly. See mips_must_initialize_gp_p for
17339 details. */
17340 if (mips_cfun_has_cprestore_slot_p ())
17341 {
17342 if (regno == CPRESTORE_SLOT_REGNUM)
17343 return true;
17344 }
17345 else
17346 {
17347 if (cfun->machine->global_pointer == regno)
17348 return true;
17349 }
17350 }
17351
17352 return false;
17353 }
17354
17355 /* Implement EPILOGUE_USES. */
17356
17357 bool
17358 mips_epilogue_uses (unsigned int regno)
17359 {
17360 /* Say that the epilogue uses the return address register. Note that
17361 in the case of sibcalls, the values "used by the epilogue" are
17362 considered live at the start of the called function. */
17363 if (regno == RETURN_ADDR_REGNUM)
17364 return true;
17365
17366 /* If using a GOT, say that the epilogue also uses GOT_VERSION_REGNUM.
17367 See the comment above load_call<mode> for details. */
17368 if (TARGET_USE_GOT && (regno) == GOT_VERSION_REGNUM)
17369 return true;
17370
17371 /* An interrupt handler must preserve some registers that are
17372 ordinarily call-clobbered. */
17373 if (cfun->machine->interrupt_handler_p
17374 && mips_interrupt_extra_call_saved_reg_p (regno))
17375 return true;
17376
17377 return false;
17378 }
17379
17380 /* A for_each_rtx callback. Stop the search if *X is an AT register. */
17381
17382 static int
17383 mips_at_reg_p (rtx *x, void *data ATTRIBUTE_UNUSED)
17384 {
17385 return REG_P (*x) && REGNO (*x) == AT_REGNUM;
17386 }
17387
17388 /* Return true if INSN needs to be wrapped in ".set noat".
17389 INSN has NOPERANDS operands, stored in OPVEC. */
17390
17391 static bool
17392 mips_need_noat_wrapper_p (rtx insn, rtx *opvec, int noperands)
17393 {
17394 int i;
17395
17396 if (recog_memoized (insn) >= 0)
17397 for (i = 0; i < noperands; i++)
17398 if (for_each_rtx (&opvec[i], mips_at_reg_p, NULL))
17399 return true;
17400 return false;
17401 }
17402
17403 /* Implement FINAL_PRESCAN_INSN. */
17404
17405 void
17406 mips_final_prescan_insn (rtx insn, rtx *opvec, int noperands)
17407 {
17408 if (mips_need_noat_wrapper_p (insn, opvec, noperands))
17409 mips_push_asm_switch (&mips_noat);
17410 }
17411
17412 /* Implement TARGET_ASM_FINAL_POSTSCAN_INSN. */
17413
17414 static void
17415 mips_final_postscan_insn (FILE *file ATTRIBUTE_UNUSED, rtx insn,
17416 rtx *opvec, int noperands)
17417 {
17418 if (mips_need_noat_wrapper_p (insn, opvec, noperands))
17419 mips_pop_asm_switch (&mips_noat);
17420 }
17421
17422 /* Return the function that is used to expand the <u>mulsidi3 pattern.
17423 EXT_CODE is the code of the extension used. Return NULL if widening
17424 multiplication shouldn't be used. */
17425
17426 mulsidi3_gen_fn
17427 mips_mulsidi3_gen_fn (enum rtx_code ext_code)
17428 {
17429 bool signed_p;
17430
17431 signed_p = ext_code == SIGN_EXTEND;
17432 if (TARGET_64BIT)
17433 {
17434 /* Don't use widening multiplication with MULT when we have DMUL. Even
17435 with the extension of its input operands DMUL is faster. Note that
17436 the extension is not needed for signed multiplication. In order to
17437 ensure that we always remove the redundant sign-extension in this
17438 case we still expand mulsidi3 for DMUL. */
17439 if (ISA_HAS_DMUL3)
17440 return signed_p ? gen_mulsidi3_64bit_dmul : NULL;
17441 if (TARGET_MIPS16)
17442 return (signed_p
17443 ? gen_mulsidi3_64bit_mips16
17444 : gen_umulsidi3_64bit_mips16);
17445 if (TARGET_FIX_R4000)
17446 return NULL;
17447 return signed_p ? gen_mulsidi3_64bit : gen_umulsidi3_64bit;
17448 }
17449 else
17450 {
17451 if (TARGET_MIPS16)
17452 return (signed_p
17453 ? gen_mulsidi3_32bit_mips16
17454 : gen_umulsidi3_32bit_mips16);
17455 if (TARGET_FIX_R4000 && !ISA_HAS_DSP)
17456 return signed_p ? gen_mulsidi3_32bit_r4000 : gen_umulsidi3_32bit_r4000;
17457 return signed_p ? gen_mulsidi3_32bit : gen_umulsidi3_32bit;
17458 }
17459 }
17460
17461 /* Return true if PATTERN matches the kind of instruction generated by
17462 umips_build_save_restore. SAVE_P is true for store. */
17463
17464 bool
17465 umips_save_restore_pattern_p (bool save_p, rtx pattern)
17466 {
17467 int n;
17468 unsigned int i;
17469 HOST_WIDE_INT first_offset = 0;
17470 rtx first_base = 0;
17471 unsigned int regmask = 0;
17472
17473 for (n = 0; n < XVECLEN (pattern, 0); n++)
17474 {
17475 rtx set, reg, mem, this_base;
17476 HOST_WIDE_INT this_offset;
17477
17478 /* Check that we have a SET. */
17479 set = XVECEXP (pattern, 0, n);
17480 if (GET_CODE (set) != SET)
17481 return false;
17482
17483 /* Check that the SET is a load (if restoring) or a store
17484 (if saving). */
17485 mem = save_p ? SET_DEST (set) : SET_SRC (set);
17486 if (!MEM_P (mem) || MEM_VOLATILE_P (mem))
17487 return false;
17488
17489 /* Check that the address is the sum of base and a possibly-zero
17490 constant offset. Determine if the offset is in range. */
17491 mips_split_plus (XEXP (mem, 0), &this_base, &this_offset);
17492 if (!REG_P (this_base))
17493 return false;
17494
17495 if (n == 0)
17496 {
17497 if (!UMIPS_12BIT_OFFSET_P (this_offset))
17498 return false;
17499 first_base = this_base;
17500 first_offset = this_offset;
17501 }
17502 else
17503 {
17504 /* Check that the save slots are consecutive. */
17505 if (REGNO (this_base) != REGNO (first_base)
17506 || this_offset != first_offset + UNITS_PER_WORD * n)
17507 return false;
17508 }
17509
17510 /* Check that SET's other operand is a register. */
17511 reg = save_p ? SET_SRC (set) : SET_DEST (set);
17512 if (!REG_P (reg))
17513 return false;
17514
17515 regmask |= 1 << REGNO (reg);
17516 }
17517
17518 for (i = 0; i < ARRAY_SIZE (umips_swm_mask); i++)
17519 if (regmask == umips_swm_mask[i])
17520 return true;
17521
17522 return false;
17523 }
17524
17525 /* Return the assembly instruction for microMIPS LWM or SWM.
17526 SAVE_P and PATTERN are as for umips_save_restore_pattern_p. */
17527
17528 const char *
17529 umips_output_save_restore (bool save_p, rtx pattern)
17530 {
17531 static char buffer[300];
17532 char *s;
17533 int n;
17534 HOST_WIDE_INT offset;
17535 rtx base, mem, set, last_set, last_reg;
17536
17537 /* Parse the pattern. */
17538 gcc_assert (umips_save_restore_pattern_p (save_p, pattern));
17539
17540 s = strcpy (buffer, save_p ? "swm\t" : "lwm\t");
17541 s += strlen (s);
17542 n = XVECLEN (pattern, 0);
17543
17544 set = XVECEXP (pattern, 0, 0);
17545 mem = save_p ? SET_DEST (set) : SET_SRC (set);
17546 mips_split_plus (XEXP (mem, 0), &base, &offset);
17547
17548 last_set = XVECEXP (pattern, 0, n - 1);
17549 last_reg = save_p ? SET_SRC (last_set) : SET_DEST (last_set);
17550
17551 if (REGNO (last_reg) == 31)
17552 n--;
17553
17554 gcc_assert (n <= 9);
17555 if (n == 0)
17556 ;
17557 else if (n == 1)
17558 s += sprintf (s, "%s,", reg_names[16]);
17559 else if (n < 9)
17560 s += sprintf (s, "%s-%s,", reg_names[16], reg_names[15 + n]);
17561 else if (n == 9)
17562 s += sprintf (s, "%s-%s,%s,", reg_names[16], reg_names[23],
17563 reg_names[30]);
17564
17565 if (REGNO (last_reg) == 31)
17566 s += sprintf (s, "%s,", reg_names[31]);
17567
17568 s += sprintf (s, "%d(%s)", (int)offset, reg_names[REGNO (base)]);
17569 return buffer;
17570 }
17571
17572 /* Return true if MEM1 and MEM2 use the same base register, and the
17573 offset of MEM2 equals the offset of MEM1 plus 4. FIRST_REG is the
17574 register into (from) which the contents of MEM1 will be loaded
17575 (stored), depending on the value of LOAD_P.
17576 SWAP_P is true when the 1st and 2nd instructions are swapped. */
17577
17578 static bool
17579 umips_load_store_pair_p_1 (bool load_p, bool swap_p,
17580 rtx first_reg, rtx mem1, rtx mem2)
17581 {
17582 rtx base1, base2;
17583 HOST_WIDE_INT offset1, offset2;
17584
17585 if (!MEM_P (mem1) || !MEM_P (mem2))
17586 return false;
17587
17588 mips_split_plus (XEXP (mem1, 0), &base1, &offset1);
17589 mips_split_plus (XEXP (mem2, 0), &base2, &offset2);
17590
17591 if (!REG_P (base1) || !rtx_equal_p (base1, base2))
17592 return false;
17593
17594 /* Avoid invalid load pair instructions. */
17595 if (load_p && REGNO (first_reg) == REGNO (base1))
17596 return false;
17597
17598 /* We must avoid this case for anti-dependence.
17599 Ex: lw $3, 4($3)
17600 lw $2, 0($3)
17601 first_reg is $2, but the base is $3. */
17602 if (load_p
17603 && swap_p
17604 && REGNO (first_reg) + 1 == REGNO (base1))
17605 return false;
17606
17607 if (offset2 != offset1 + 4)
17608 return false;
17609
17610 if (!UMIPS_12BIT_OFFSET_P (offset1))
17611 return false;
17612
17613 return true;
17614 }
17615
17616 /* OPERANDS describes the operands to a pair of SETs, in the order
17617 dest1, src1, dest2, src2. Return true if the operands can be used
17618 in an LWP or SWP instruction; LOAD_P says which. */
17619
17620 bool
17621 umips_load_store_pair_p (bool load_p, rtx *operands)
17622 {
17623 rtx reg1, reg2, mem1, mem2;
17624
17625 if (load_p)
17626 {
17627 reg1 = operands[0];
17628 reg2 = operands[2];
17629 mem1 = operands[1];
17630 mem2 = operands[3];
17631 }
17632 else
17633 {
17634 reg1 = operands[1];
17635 reg2 = operands[3];
17636 mem1 = operands[0];
17637 mem2 = operands[2];
17638 }
17639
17640 if (REGNO (reg2) == REGNO (reg1) + 1)
17641 return umips_load_store_pair_p_1 (load_p, false, reg1, mem1, mem2);
17642
17643 if (REGNO (reg1) == REGNO (reg2) + 1)
17644 return umips_load_store_pair_p_1 (load_p, true, reg2, mem2, mem1);
17645
17646 return false;
17647 }
17648
17649 /* Return the assembly instruction for a microMIPS LWP or SWP in which
17650 the first register is REG and the first memory slot is MEM.
17651 LOAD_P is true for LWP. */
17652
17653 static void
17654 umips_output_load_store_pair_1 (bool load_p, rtx reg, rtx mem)
17655 {
17656 rtx ops[] = {reg, mem};
17657
17658 if (load_p)
17659 output_asm_insn ("lwp\t%0,%1", ops);
17660 else
17661 output_asm_insn ("swp\t%0,%1", ops);
17662 }
17663
17664 /* Output the assembly instruction for a microMIPS LWP or SWP instruction.
17665 LOAD_P and OPERANDS are as for umips_load_store_pair_p. */
17666
17667 void
17668 umips_output_load_store_pair (bool load_p, rtx *operands)
17669 {
17670 rtx reg1, reg2, mem1, mem2;
17671 if (load_p)
17672 {
17673 reg1 = operands[0];
17674 reg2 = operands[2];
17675 mem1 = operands[1];
17676 mem2 = operands[3];
17677 }
17678 else
17679 {
17680 reg1 = operands[1];
17681 reg2 = operands[3];
17682 mem1 = operands[0];
17683 mem2 = operands[2];
17684 }
17685
17686 if (REGNO (reg2) == REGNO (reg1) + 1)
17687 {
17688 umips_output_load_store_pair_1 (load_p, reg1, mem1);
17689 return;
17690 }
17691
17692 gcc_assert (REGNO (reg1) == REGNO (reg2) + 1);
17693 umips_output_load_store_pair_1 (load_p, reg2, mem2);
17694 }
17695
17696 /* Return true if REG1 and REG2 match the criteria for a movep insn. */
17697
17698 bool
17699 umips_movep_target_p (rtx reg1, rtx reg2)
17700 {
17701 int regno1, regno2, pair;
17702 unsigned int i;
17703 static const int match[8] = {
17704 0x00000060, /* 5, 6 */
17705 0x000000a0, /* 5, 7 */
17706 0x000000c0, /* 6, 7 */
17707 0x00200010, /* 4, 21 */
17708 0x00400010, /* 4, 22 */
17709 0x00000030, /* 4, 5 */
17710 0x00000050, /* 4, 6 */
17711 0x00000090 /* 4, 7 */
17712 };
17713
17714 if (!REG_P (reg1) || !REG_P (reg2))
17715 return false;
17716
17717 regno1 = REGNO (reg1);
17718 regno2 = REGNO (reg2);
17719
17720 if (!GP_REG_P (regno1) || !GP_REG_P (regno2))
17721 return false;
17722
17723 pair = (1 << regno1) | (1 << regno2);
17724
17725 for (i = 0; i < ARRAY_SIZE (match); i++)
17726 if (pair == match[i])
17727 return true;
17728
17729 return false;
17730 }
17731 \f
17732 /* Return the size in bytes of the trampoline code, padded to
17733 TRAMPOLINE_ALIGNMENT bits. The static chain pointer and target
17734 function address immediately follow. */
17735
17736 int
17737 mips_trampoline_code_size (void)
17738 {
17739 if (TARGET_USE_PIC_FN_ADDR_REG)
17740 return 4 * 4;
17741 else if (ptr_mode == DImode)
17742 return 8 * 4;
17743 else if (ISA_HAS_LOAD_DELAY)
17744 return 6 * 4;
17745 else
17746 return 4 * 4;
17747 }
17748
17749 /* Implement TARGET_TRAMPOLINE_INIT. */
17750
17751 static void
17752 mips_trampoline_init (rtx m_tramp, tree fndecl, rtx chain_value)
17753 {
17754 rtx addr, end_addr, high, low, opcode, mem;
17755 rtx trampoline[8];
17756 unsigned int i, j;
17757 HOST_WIDE_INT end_addr_offset, static_chain_offset, target_function_offset;
17758
17759 /* Work out the offsets of the pointers from the start of the
17760 trampoline code. */
17761 end_addr_offset = mips_trampoline_code_size ();
17762 static_chain_offset = end_addr_offset;
17763 target_function_offset = static_chain_offset + GET_MODE_SIZE (ptr_mode);
17764
17765 /* Get pointers to the beginning and end of the code block. */
17766 addr = force_reg (Pmode, XEXP (m_tramp, 0));
17767 end_addr = mips_force_binary (Pmode, PLUS, addr, GEN_INT (end_addr_offset));
17768
17769 #define OP(X) gen_int_mode (X, SImode)
17770
17771 /* Build up the code in TRAMPOLINE. */
17772 i = 0;
17773 if (TARGET_USE_PIC_FN_ADDR_REG)
17774 {
17775 /* $25 contains the address of the trampoline. Emit code of the form:
17776
17777 l[wd] $1, target_function_offset($25)
17778 l[wd] $static_chain, static_chain_offset($25)
17779 jr $1
17780 move $25,$1. */
17781 trampoline[i++] = OP (MIPS_LOAD_PTR (AT_REGNUM,
17782 target_function_offset,
17783 PIC_FUNCTION_ADDR_REGNUM));
17784 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
17785 static_chain_offset,
17786 PIC_FUNCTION_ADDR_REGNUM));
17787 trampoline[i++] = OP (MIPS_JR (AT_REGNUM));
17788 trampoline[i++] = OP (MIPS_MOVE (PIC_FUNCTION_ADDR_REGNUM, AT_REGNUM));
17789 }
17790 else if (ptr_mode == DImode)
17791 {
17792 /* It's too cumbersome to create the full 64-bit address, so let's
17793 instead use:
17794
17795 move $1, $31
17796 bal 1f
17797 nop
17798 1: l[wd] $25, target_function_offset - 12($31)
17799 l[wd] $static_chain, static_chain_offset - 12($31)
17800 jr $25
17801 move $31, $1
17802
17803 where 12 is the offset of "1:" from the start of the code block. */
17804 trampoline[i++] = OP (MIPS_MOVE (AT_REGNUM, RETURN_ADDR_REGNUM));
17805 trampoline[i++] = OP (MIPS_BAL (1));
17806 trampoline[i++] = OP (MIPS_NOP);
17807 trampoline[i++] = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM,
17808 target_function_offset - 12,
17809 RETURN_ADDR_REGNUM));
17810 trampoline[i++] = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
17811 static_chain_offset - 12,
17812 RETURN_ADDR_REGNUM));
17813 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
17814 trampoline[i++] = OP (MIPS_MOVE (RETURN_ADDR_REGNUM, AT_REGNUM));
17815 }
17816 else
17817 {
17818 /* If the target has load delays, emit:
17819
17820 lui $1, %hi(end_addr)
17821 lw $25, %lo(end_addr + ...)($1)
17822 lw $static_chain, %lo(end_addr + ...)($1)
17823 jr $25
17824 nop
17825
17826 Otherwise emit:
17827
17828 lui $1, %hi(end_addr)
17829 lw $25, %lo(end_addr + ...)($1)
17830 jr $25
17831 lw $static_chain, %lo(end_addr + ...)($1). */
17832
17833 /* Split END_ADDR into %hi and %lo values. Trampolines are aligned
17834 to 64 bits, so the %lo value will have the bottom 3 bits clear. */
17835 high = expand_simple_binop (SImode, PLUS, end_addr, GEN_INT (0x8000),
17836 NULL, false, OPTAB_WIDEN);
17837 high = expand_simple_binop (SImode, LSHIFTRT, high, GEN_INT (16),
17838 NULL, false, OPTAB_WIDEN);
17839 low = convert_to_mode (SImode, gen_lowpart (HImode, end_addr), true);
17840
17841 /* Emit the LUI. */
17842 opcode = OP (MIPS_LUI (AT_REGNUM, 0));
17843 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, high,
17844 NULL, false, OPTAB_WIDEN);
17845
17846 /* Emit the load of the target function. */
17847 opcode = OP (MIPS_LOAD_PTR (PIC_FUNCTION_ADDR_REGNUM,
17848 target_function_offset - end_addr_offset,
17849 AT_REGNUM));
17850 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low,
17851 NULL, false, OPTAB_WIDEN);
17852
17853 /* Emit the JR here, if we can. */
17854 if (!ISA_HAS_LOAD_DELAY)
17855 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
17856
17857 /* Emit the load of the static chain register. */
17858 opcode = OP (MIPS_LOAD_PTR (STATIC_CHAIN_REGNUM,
17859 static_chain_offset - end_addr_offset,
17860 AT_REGNUM));
17861 trampoline[i++] = expand_simple_binop (SImode, IOR, opcode, low,
17862 NULL, false, OPTAB_WIDEN);
17863
17864 /* Emit the JR, if we couldn't above. */
17865 if (ISA_HAS_LOAD_DELAY)
17866 {
17867 trampoline[i++] = OP (MIPS_JR (PIC_FUNCTION_ADDR_REGNUM));
17868 trampoline[i++] = OP (MIPS_NOP);
17869 }
17870 }
17871
17872 #undef OP
17873
17874 /* Copy the trampoline code. Leave any padding uninitialized. */
17875 for (j = 0; j < i; j++)
17876 {
17877 mem = adjust_address (m_tramp, SImode, j * GET_MODE_SIZE (SImode));
17878 mips_emit_move (mem, trampoline[j]);
17879 }
17880
17881 /* Set up the static chain pointer field. */
17882 mem = adjust_address (m_tramp, ptr_mode, static_chain_offset);
17883 mips_emit_move (mem, chain_value);
17884
17885 /* Set up the target function field. */
17886 mem = adjust_address (m_tramp, ptr_mode, target_function_offset);
17887 mips_emit_move (mem, XEXP (DECL_RTL (fndecl), 0));
17888
17889 /* Flush the code part of the trampoline. */
17890 emit_insn (gen_add3_insn (end_addr, addr, GEN_INT (TRAMPOLINE_SIZE)));
17891 emit_insn (gen_clear_cache (addr, end_addr));
17892 }
17893
17894 /* Implement FUNCTION_PROFILER. */
17895
17896 void mips_function_profiler (FILE *file)
17897 {
17898 if (TARGET_MIPS16)
17899 sorry ("mips16 function profiling");
17900 if (TARGET_LONG_CALLS)
17901 {
17902 /* For TARGET_LONG_CALLS use $3 for the address of _mcount. */
17903 if (Pmode == DImode)
17904 fprintf (file, "\tdla\t%s,_mcount\n", reg_names[3]);
17905 else
17906 fprintf (file, "\tla\t%s,_mcount\n", reg_names[3]);
17907 }
17908 mips_push_asm_switch (&mips_noat);
17909 fprintf (file, "\tmove\t%s,%s\t\t# save current return address\n",
17910 reg_names[AT_REGNUM], reg_names[RETURN_ADDR_REGNUM]);
17911 /* _mcount treats $2 as the static chain register. */
17912 if (cfun->static_chain_decl != NULL)
17913 fprintf (file, "\tmove\t%s,%s\n", reg_names[2],
17914 reg_names[STATIC_CHAIN_REGNUM]);
17915 if (TARGET_MCOUNT_RA_ADDRESS)
17916 {
17917 /* If TARGET_MCOUNT_RA_ADDRESS load $12 with the address of the
17918 ra save location. */
17919 if (cfun->machine->frame.ra_fp_offset == 0)
17920 /* ra not saved, pass zero. */
17921 fprintf (file, "\tmove\t%s,%s\n", reg_names[12], reg_names[0]);
17922 else
17923 fprintf (file, "\t%s\t%s," HOST_WIDE_INT_PRINT_DEC "(%s)\n",
17924 Pmode == DImode ? "dla" : "la", reg_names[12],
17925 cfun->machine->frame.ra_fp_offset,
17926 reg_names[STACK_POINTER_REGNUM]);
17927 }
17928 if (!TARGET_NEWABI)
17929 fprintf (file,
17930 "\t%s\t%s,%s,%d\t\t# _mcount pops 2 words from stack\n",
17931 TARGET_64BIT ? "dsubu" : "subu",
17932 reg_names[STACK_POINTER_REGNUM],
17933 reg_names[STACK_POINTER_REGNUM],
17934 Pmode == DImode ? 16 : 8);
17935
17936 if (TARGET_LONG_CALLS)
17937 fprintf (file, "\tjalr\t%s\n", reg_names[3]);
17938 else
17939 fprintf (file, "\tjal\t_mcount\n");
17940 mips_pop_asm_switch (&mips_noat);
17941 /* _mcount treats $2 as the static chain register. */
17942 if (cfun->static_chain_decl != NULL)
17943 fprintf (file, "\tmove\t%s,%s\n", reg_names[STATIC_CHAIN_REGNUM],
17944 reg_names[2]);
17945 }
17946
17947 /* Implement TARGET_SHIFT_TRUNCATION_MASK. We want to keep the default
17948 behaviour of TARGET_SHIFT_TRUNCATION_MASK for non-vector modes even
17949 when TARGET_LOONGSON_VECTORS is true. */
17950
17951 static unsigned HOST_WIDE_INT
17952 mips_shift_truncation_mask (enum machine_mode mode)
17953 {
17954 if (TARGET_LOONGSON_VECTORS && VECTOR_MODE_P (mode))
17955 return 0;
17956
17957 return GET_MODE_BITSIZE (mode) - 1;
17958 }
17959
17960 /* Implement TARGET_PREPARE_PCH_SAVE. */
17961
17962 static void
17963 mips_prepare_pch_save (void)
17964 {
17965 /* We are called in a context where the current MIPS16 vs. non-MIPS16
17966 setting should be irrelevant. The question then is: which setting
17967 makes most sense at load time?
17968
17969 The PCH is loaded before the first token is read. We should never
17970 have switched into MIPS16 mode by that point, and thus should not
17971 have populated mips16_globals. Nor can we load the entire contents
17972 of mips16_globals from the PCH file, because mips16_globals contains
17973 a combination of GGC and non-GGC data.
17974
17975 There is therefore no point in trying save the GGC part of
17976 mips16_globals to the PCH file, or to preserve MIPS16ness across
17977 the PCH save and load. The loading compiler would not have access
17978 to the non-GGC parts of mips16_globals (either from the PCH file,
17979 or from a copy that the loading compiler generated itself) and would
17980 have to call target_reinit anyway.
17981
17982 It therefore seems best to switch back to non-MIPS16 mode at
17983 save time, and to ensure that mips16_globals remains null after
17984 a PCH load. */
17985 mips_set_compression_mode (0);
17986 mips16_globals = 0;
17987 }
17988 \f
17989 /* Generate or test for an insn that supports a constant permutation. */
17990
17991 #define MAX_VECT_LEN 8
17992
17993 struct expand_vec_perm_d
17994 {
17995 rtx target, op0, op1;
17996 unsigned char perm[MAX_VECT_LEN];
17997 enum machine_mode vmode;
17998 unsigned char nelt;
17999 bool one_vector_p;
18000 bool testing_p;
18001 };
18002
18003 /* Construct (set target (vec_select op0 (parallel perm))) and
18004 return true if that's a valid instruction in the active ISA. */
18005
18006 static bool
18007 mips_expand_vselect (rtx target, rtx op0,
18008 const unsigned char *perm, unsigned nelt)
18009 {
18010 rtx rperm[MAX_VECT_LEN], x;
18011 unsigned i;
18012
18013 for (i = 0; i < nelt; ++i)
18014 rperm[i] = GEN_INT (perm[i]);
18015
18016 x = gen_rtx_PARALLEL (VOIDmode, gen_rtvec_v (nelt, rperm));
18017 x = gen_rtx_VEC_SELECT (GET_MODE (target), op0, x);
18018 x = gen_rtx_SET (VOIDmode, target, x);
18019
18020 x = emit_insn (x);
18021 if (recog_memoized (x) < 0)
18022 {
18023 remove_insn (x);
18024 return false;
18025 }
18026 return true;
18027 }
18028
18029 /* Similar, but generate a vec_concat from op0 and op1 as well. */
18030
18031 static bool
18032 mips_expand_vselect_vconcat (rtx target, rtx op0, rtx op1,
18033 const unsigned char *perm, unsigned nelt)
18034 {
18035 enum machine_mode v2mode;
18036 rtx x;
18037
18038 v2mode = GET_MODE_2XWIDER_MODE (GET_MODE (op0));
18039 x = gen_rtx_VEC_CONCAT (v2mode, op0, op1);
18040 return mips_expand_vselect (target, x, perm, nelt);
18041 }
18042
18043 /* Recognize patterns for even-odd extraction. */
18044
18045 static bool
18046 mips_expand_vpc_loongson_even_odd (struct expand_vec_perm_d *d)
18047 {
18048 unsigned i, odd, nelt = d->nelt;
18049 rtx t0, t1, t2, t3;
18050
18051 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18052 return false;
18053 /* Even-odd for V2SI/V2SFmode is matched by interleave directly. */
18054 if (nelt < 4)
18055 return false;
18056
18057 odd = d->perm[0];
18058 if (odd > 1)
18059 return false;
18060 for (i = 1; i < nelt; ++i)
18061 if (d->perm[i] != i * 2 + odd)
18062 return false;
18063
18064 if (d->testing_p)
18065 return true;
18066
18067 /* We need 2*log2(N)-1 operations to achieve odd/even with interleave. */
18068 t0 = gen_reg_rtx (d->vmode);
18069 t1 = gen_reg_rtx (d->vmode);
18070 switch (d->vmode)
18071 {
18072 case V4HImode:
18073 emit_insn (gen_loongson_punpckhhw (t0, d->op0, d->op1));
18074 emit_insn (gen_loongson_punpcklhw (t1, d->op0, d->op1));
18075 if (odd)
18076 emit_insn (gen_loongson_punpckhhw (d->target, t1, t0));
18077 else
18078 emit_insn (gen_loongson_punpcklhw (d->target, t1, t0));
18079 break;
18080
18081 case V8QImode:
18082 t2 = gen_reg_rtx (d->vmode);
18083 t3 = gen_reg_rtx (d->vmode);
18084 emit_insn (gen_loongson_punpckhbh (t0, d->op0, d->op1));
18085 emit_insn (gen_loongson_punpcklbh (t1, d->op0, d->op1));
18086 emit_insn (gen_loongson_punpckhbh (t2, t1, t0));
18087 emit_insn (gen_loongson_punpcklbh (t3, t1, t0));
18088 if (odd)
18089 emit_insn (gen_loongson_punpckhbh (d->target, t3, t2));
18090 else
18091 emit_insn (gen_loongson_punpcklbh (d->target, t3, t2));
18092 break;
18093
18094 default:
18095 gcc_unreachable ();
18096 }
18097 return true;
18098 }
18099
18100 /* Recognize patterns for the Loongson PSHUFH instruction. */
18101
18102 static bool
18103 mips_expand_vpc_loongson_pshufh (struct expand_vec_perm_d *d)
18104 {
18105 unsigned i, mask;
18106 rtx rmask;
18107
18108 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18109 return false;
18110 if (d->vmode != V4HImode)
18111 return false;
18112 if (d->testing_p)
18113 return true;
18114
18115 /* Convert the selector into the packed 8-bit form for pshufh. */
18116 /* Recall that loongson is little-endian only. No big-endian
18117 adjustment required. */
18118 for (i = mask = 0; i < 4; i++)
18119 mask |= (d->perm[i] & 3) << (i * 2);
18120 rmask = force_reg (SImode, GEN_INT (mask));
18121
18122 if (d->one_vector_p)
18123 emit_insn (gen_loongson_pshufh (d->target, d->op0, rmask));
18124 else
18125 {
18126 rtx t0, t1, x, merge, rmerge[4];
18127
18128 t0 = gen_reg_rtx (V4HImode);
18129 t1 = gen_reg_rtx (V4HImode);
18130 emit_insn (gen_loongson_pshufh (t1, d->op1, rmask));
18131 emit_insn (gen_loongson_pshufh (t0, d->op0, rmask));
18132
18133 for (i = 0; i < 4; ++i)
18134 rmerge[i] = (d->perm[i] & 4 ? constm1_rtx : const0_rtx);
18135 merge = gen_rtx_CONST_VECTOR (V4HImode, gen_rtvec_v (4, rmerge));
18136 merge = force_reg (V4HImode, merge);
18137
18138 x = gen_rtx_AND (V4HImode, merge, t1);
18139 emit_insn (gen_rtx_SET (VOIDmode, t1, x));
18140
18141 x = gen_rtx_NOT (V4HImode, merge);
18142 x = gen_rtx_AND (V4HImode, x, t0);
18143 emit_insn (gen_rtx_SET (VOIDmode, t0, x));
18144
18145 x = gen_rtx_IOR (V4HImode, t0, t1);
18146 emit_insn (gen_rtx_SET (VOIDmode, d->target, x));
18147 }
18148
18149 return true;
18150 }
18151
18152 /* Recognize broadcast patterns for the Loongson. */
18153
18154 static bool
18155 mips_expand_vpc_loongson_bcast (struct expand_vec_perm_d *d)
18156 {
18157 unsigned i, elt;
18158 rtx t0, t1;
18159
18160 if (!(TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS))
18161 return false;
18162 /* Note that we've already matched V2SI via punpck and V4HI via pshufh. */
18163 if (d->vmode != V8QImode)
18164 return false;
18165 if (!d->one_vector_p)
18166 return false;
18167
18168 elt = d->perm[0];
18169 for (i = 1; i < 8; ++i)
18170 if (d->perm[i] != elt)
18171 return false;
18172
18173 if (d->testing_p)
18174 return true;
18175
18176 /* With one interleave we put two of the desired element adjacent. */
18177 t0 = gen_reg_rtx (V8QImode);
18178 if (elt < 4)
18179 emit_insn (gen_loongson_punpcklbh (t0, d->op0, d->op0));
18180 else
18181 emit_insn (gen_loongson_punpckhbh (t0, d->op0, d->op0));
18182
18183 /* Shuffle that one HImode element into all locations. */
18184 elt &= 3;
18185 elt *= 0x55;
18186 t1 = gen_reg_rtx (V4HImode);
18187 emit_insn (gen_loongson_pshufh (t1, gen_lowpart (V4HImode, t0),
18188 force_reg (SImode, GEN_INT (elt))));
18189
18190 emit_move_insn (d->target, gen_lowpart (V8QImode, t1));
18191 return true;
18192 }
18193
18194 static bool
18195 mips_expand_vec_perm_const_1 (struct expand_vec_perm_d *d)
18196 {
18197 unsigned int i, nelt = d->nelt;
18198 unsigned char perm2[MAX_VECT_LEN];
18199
18200 if (d->one_vector_p)
18201 {
18202 /* Try interleave with alternating operands. */
18203 memcpy (perm2, d->perm, sizeof(perm2));
18204 for (i = 1; i < nelt; i += 2)
18205 perm2[i] += nelt;
18206 if (mips_expand_vselect_vconcat (d->target, d->op0, d->op1, perm2, nelt))
18207 return true;
18208 }
18209 else
18210 {
18211 if (mips_expand_vselect_vconcat (d->target, d->op0, d->op1,
18212 d->perm, nelt))
18213 return true;
18214
18215 /* Try again with swapped operands. */
18216 for (i = 0; i < nelt; ++i)
18217 perm2[i] = (d->perm[i] + nelt) & (2 * nelt - 1);
18218 if (mips_expand_vselect_vconcat (d->target, d->op1, d->op0, perm2, nelt))
18219 return true;
18220 }
18221
18222 if (mips_expand_vpc_loongson_even_odd (d))
18223 return true;
18224 if (mips_expand_vpc_loongson_pshufh (d))
18225 return true;
18226 if (mips_expand_vpc_loongson_bcast (d))
18227 return true;
18228 return false;
18229 }
18230
18231 /* Expand a vec_perm_const pattern. */
18232
18233 bool
18234 mips_expand_vec_perm_const (rtx operands[4])
18235 {
18236 struct expand_vec_perm_d d;
18237 int i, nelt, which;
18238 unsigned char orig_perm[MAX_VECT_LEN];
18239 rtx sel;
18240 bool ok;
18241
18242 d.target = operands[0];
18243 d.op0 = operands[1];
18244 d.op1 = operands[2];
18245 sel = operands[3];
18246
18247 d.vmode = GET_MODE (d.target);
18248 gcc_assert (VECTOR_MODE_P (d.vmode));
18249 d.nelt = nelt = GET_MODE_NUNITS (d.vmode);
18250 d.testing_p = false;
18251
18252 for (i = which = 0; i < nelt; ++i)
18253 {
18254 rtx e = XVECEXP (sel, 0, i);
18255 int ei = INTVAL (e) & (2 * nelt - 1);
18256 which |= (ei < nelt ? 1 : 2);
18257 orig_perm[i] = ei;
18258 }
18259 memcpy (d.perm, orig_perm, MAX_VECT_LEN);
18260
18261 switch (which)
18262 {
18263 default:
18264 gcc_unreachable();
18265
18266 case 3:
18267 d.one_vector_p = false;
18268 if (!rtx_equal_p (d.op0, d.op1))
18269 break;
18270 /* FALLTHRU */
18271
18272 case 2:
18273 for (i = 0; i < nelt; ++i)
18274 d.perm[i] &= nelt - 1;
18275 d.op0 = d.op1;
18276 d.one_vector_p = true;
18277 break;
18278
18279 case 1:
18280 d.op1 = d.op0;
18281 d.one_vector_p = true;
18282 break;
18283 }
18284
18285 ok = mips_expand_vec_perm_const_1 (&d);
18286
18287 /* If we were given a two-vector permutation which just happened to
18288 have both input vectors equal, we folded this into a one-vector
18289 permutation. There are several loongson patterns that are matched
18290 via direct vec_select+vec_concat expansion, but we do not have
18291 support in mips_expand_vec_perm_const_1 to guess the adjustment
18292 that should be made for a single operand. Just try again with
18293 the original permutation. */
18294 if (!ok && which == 3)
18295 {
18296 d.op0 = operands[1];
18297 d.op1 = operands[2];
18298 d.one_vector_p = false;
18299 memcpy (d.perm, orig_perm, MAX_VECT_LEN);
18300 ok = mips_expand_vec_perm_const_1 (&d);
18301 }
18302
18303 return ok;
18304 }
18305
18306 /* Implement TARGET_VECTORIZE_VEC_PERM_CONST_OK. */
18307
18308 static bool
18309 mips_vectorize_vec_perm_const_ok (enum machine_mode vmode,
18310 const unsigned char *sel)
18311 {
18312 struct expand_vec_perm_d d;
18313 unsigned int i, nelt, which;
18314 bool ret;
18315
18316 d.vmode = vmode;
18317 d.nelt = nelt = GET_MODE_NUNITS (d.vmode);
18318 d.testing_p = true;
18319 memcpy (d.perm, sel, nelt);
18320
18321 /* Categorize the set of elements in the selector. */
18322 for (i = which = 0; i < nelt; ++i)
18323 {
18324 unsigned char e = d.perm[i];
18325 gcc_assert (e < 2 * nelt);
18326 which |= (e < nelt ? 1 : 2);
18327 }
18328
18329 /* For all elements from second vector, fold the elements to first. */
18330 if (which == 2)
18331 for (i = 0; i < nelt; ++i)
18332 d.perm[i] -= nelt;
18333
18334 /* Check whether the mask can be applied to the vector type. */
18335 d.one_vector_p = (which != 3);
18336
18337 d.target = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 1);
18338 d.op1 = d.op0 = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 2);
18339 if (!d.one_vector_p)
18340 d.op1 = gen_raw_REG (d.vmode, LAST_VIRTUAL_REGISTER + 3);
18341
18342 start_sequence ();
18343 ret = mips_expand_vec_perm_const_1 (&d);
18344 end_sequence ();
18345
18346 return ret;
18347 }
18348
18349 /* Expand an integral vector unpack operation. */
18350
18351 void
18352 mips_expand_vec_unpack (rtx operands[2], bool unsigned_p, bool high_p)
18353 {
18354 enum machine_mode imode = GET_MODE (operands[1]);
18355 rtx (*unpack) (rtx, rtx, rtx);
18356 rtx (*cmpgt) (rtx, rtx, rtx);
18357 rtx tmp, dest, zero;
18358
18359 switch (imode)
18360 {
18361 case V8QImode:
18362 if (high_p)
18363 unpack = gen_loongson_punpckhbh;
18364 else
18365 unpack = gen_loongson_punpcklbh;
18366 cmpgt = gen_loongson_pcmpgtb;
18367 break;
18368 case V4HImode:
18369 if (high_p)
18370 unpack = gen_loongson_punpckhhw;
18371 else
18372 unpack = gen_loongson_punpcklhw;
18373 cmpgt = gen_loongson_pcmpgth;
18374 break;
18375 default:
18376 gcc_unreachable ();
18377 }
18378
18379 zero = force_reg (imode, CONST0_RTX (imode));
18380 if (unsigned_p)
18381 tmp = zero;
18382 else
18383 {
18384 tmp = gen_reg_rtx (imode);
18385 emit_insn (cmpgt (tmp, zero, operands[1]));
18386 }
18387
18388 dest = gen_reg_rtx (imode);
18389 emit_insn (unpack (dest, operands[1], tmp));
18390
18391 emit_move_insn (operands[0], gen_lowpart (GET_MODE (operands[0]), dest));
18392 }
18393
18394 /* A subroutine of mips_expand_vec_init, match constant vector elements. */
18395
18396 static inline bool
18397 mips_constant_elt_p (rtx x)
18398 {
18399 return CONST_INT_P (x) || GET_CODE (x) == CONST_DOUBLE;
18400 }
18401
18402 /* A subroutine of mips_expand_vec_init, expand via broadcast. */
18403
18404 static void
18405 mips_expand_vi_broadcast (enum machine_mode vmode, rtx target, rtx elt)
18406 {
18407 struct expand_vec_perm_d d;
18408 rtx t1;
18409 bool ok;
18410
18411 if (elt != const0_rtx)
18412 elt = force_reg (GET_MODE_INNER (vmode), elt);
18413 if (REG_P (elt))
18414 elt = gen_lowpart (DImode, elt);
18415
18416 t1 = gen_reg_rtx (vmode);
18417 switch (vmode)
18418 {
18419 case V8QImode:
18420 emit_insn (gen_loongson_vec_init1_v8qi (t1, elt));
18421 break;
18422 case V4HImode:
18423 emit_insn (gen_loongson_vec_init1_v4hi (t1, elt));
18424 break;
18425 default:
18426 gcc_unreachable ();
18427 }
18428
18429 memset (&d, 0, sizeof (d));
18430 d.target = target;
18431 d.op0 = t1;
18432 d.op1 = t1;
18433 d.vmode = vmode;
18434 d.nelt = GET_MODE_NUNITS (vmode);
18435 d.one_vector_p = true;
18436
18437 ok = mips_expand_vec_perm_const_1 (&d);
18438 gcc_assert (ok);
18439 }
18440
18441 /* A subroutine of mips_expand_vec_init, replacing all of the non-constant
18442 elements of VALS with zeros, copy the constant vector to TARGET. */
18443
18444 static void
18445 mips_expand_vi_constant (enum machine_mode vmode, unsigned nelt,
18446 rtx target, rtx vals)
18447 {
18448 rtvec vec = shallow_copy_rtvec (XVEC (vals, 0));
18449 unsigned i;
18450
18451 for (i = 0; i < nelt; ++i)
18452 {
18453 if (!mips_constant_elt_p (RTVEC_ELT (vec, i)))
18454 RTVEC_ELT (vec, i) = const0_rtx;
18455 }
18456
18457 emit_move_insn (target, gen_rtx_CONST_VECTOR (vmode, vec));
18458 }
18459
18460
18461 /* A subroutine of mips_expand_vec_init, expand via pinsrh. */
18462
18463 static void
18464 mips_expand_vi_loongson_one_pinsrh (rtx target, rtx vals, unsigned one_var)
18465 {
18466 mips_expand_vi_constant (V4HImode, 4, target, vals);
18467
18468 emit_insn (gen_vec_setv4hi (target, target, XVECEXP (vals, 0, one_var),
18469 GEN_INT (one_var)));
18470 }
18471
18472 /* A subroutine of mips_expand_vec_init, expand anything via memory. */
18473
18474 static void
18475 mips_expand_vi_general (enum machine_mode vmode, enum machine_mode imode,
18476 unsigned nelt, unsigned nvar, rtx target, rtx vals)
18477 {
18478 rtx mem = assign_stack_temp (vmode, GET_MODE_SIZE (vmode));
18479 unsigned int i, isize = GET_MODE_SIZE (imode);
18480
18481 if (nvar < nelt)
18482 mips_expand_vi_constant (vmode, nelt, mem, vals);
18483
18484 for (i = 0; i < nelt; ++i)
18485 {
18486 rtx x = XVECEXP (vals, 0, i);
18487 if (!mips_constant_elt_p (x))
18488 emit_move_insn (adjust_address (mem, imode, i * isize), x);
18489 }
18490
18491 emit_move_insn (target, mem);
18492 }
18493
18494 /* Expand a vector initialization. */
18495
18496 void
18497 mips_expand_vector_init (rtx target, rtx vals)
18498 {
18499 enum machine_mode vmode = GET_MODE (target);
18500 enum machine_mode imode = GET_MODE_INNER (vmode);
18501 unsigned i, nelt = GET_MODE_NUNITS (vmode);
18502 unsigned nvar = 0, one_var = -1u;
18503 bool all_same = true;
18504 rtx x;
18505
18506 for (i = 0; i < nelt; ++i)
18507 {
18508 x = XVECEXP (vals, 0, i);
18509 if (!mips_constant_elt_p (x))
18510 nvar++, one_var = i;
18511 if (i > 0 && !rtx_equal_p (x, XVECEXP (vals, 0, 0)))
18512 all_same = false;
18513 }
18514
18515 /* Load constants from the pool, or whatever's handy. */
18516 if (nvar == 0)
18517 {
18518 emit_move_insn (target, gen_rtx_CONST_VECTOR (vmode, XVEC (vals, 0)));
18519 return;
18520 }
18521
18522 /* For two-part initialization, always use CONCAT. */
18523 if (nelt == 2)
18524 {
18525 rtx op0 = force_reg (imode, XVECEXP (vals, 0, 0));
18526 rtx op1 = force_reg (imode, XVECEXP (vals, 0, 1));
18527 x = gen_rtx_VEC_CONCAT (vmode, op0, op1);
18528 emit_insn (gen_rtx_SET (VOIDmode, target, x));
18529 return;
18530 }
18531
18532 /* Loongson is the only cpu with vectors with more elements. */
18533 gcc_assert (TARGET_HARD_FLOAT && TARGET_LOONGSON_VECTORS);
18534
18535 /* If all values are identical, broadcast the value. */
18536 if (all_same)
18537 {
18538 mips_expand_vi_broadcast (vmode, target, XVECEXP (vals, 0, 0));
18539 return;
18540 }
18541
18542 /* If we've only got one non-variable V4HImode, use PINSRH. */
18543 if (nvar == 1 && vmode == V4HImode)
18544 {
18545 mips_expand_vi_loongson_one_pinsrh (target, vals, one_var);
18546 return;
18547 }
18548
18549 mips_expand_vi_general (vmode, imode, nelt, nvar, target, vals);
18550 }
18551
18552 /* Expand a vector reduction. */
18553
18554 void
18555 mips_expand_vec_reduc (rtx target, rtx in, rtx (*gen)(rtx, rtx, rtx))
18556 {
18557 enum machine_mode vmode = GET_MODE (in);
18558 unsigned char perm2[2];
18559 rtx last, next, fold, x;
18560 bool ok;
18561
18562 last = in;
18563 fold = gen_reg_rtx (vmode);
18564 switch (vmode)
18565 {
18566 case V2SFmode:
18567 /* Use PUL/PLU to produce { L, H } op { H, L }.
18568 By reversing the pair order, rather than a pure interleave high,
18569 we avoid erroneous exceptional conditions that we might otherwise
18570 produce from the computation of H op H. */
18571 perm2[0] = 1;
18572 perm2[1] = 2;
18573 ok = mips_expand_vselect_vconcat (fold, last, last, perm2, 2);
18574 gcc_assert (ok);
18575 break;
18576
18577 case V2SImode:
18578 /* Use interleave to produce { H, L } op { H, H }. */
18579 emit_insn (gen_loongson_punpckhwd (fold, last, last));
18580 break;
18581
18582 case V4HImode:
18583 /* Perform the first reduction with interleave,
18584 and subsequent reductions with shifts. */
18585 emit_insn (gen_loongson_punpckhwd_hi (fold, last, last));
18586
18587 next = gen_reg_rtx (vmode);
18588 emit_insn (gen (next, last, fold));
18589 last = next;
18590
18591 fold = gen_reg_rtx (vmode);
18592 x = force_reg (SImode, GEN_INT (16));
18593 emit_insn (gen_vec_shr_v4hi (fold, last, x));
18594 break;
18595
18596 case V8QImode:
18597 emit_insn (gen_loongson_punpckhwd_qi (fold, last, last));
18598
18599 next = gen_reg_rtx (vmode);
18600 emit_insn (gen (next, last, fold));
18601 last = next;
18602
18603 fold = gen_reg_rtx (vmode);
18604 x = force_reg (SImode, GEN_INT (16));
18605 emit_insn (gen_vec_shr_v8qi (fold, last, x));
18606
18607 next = gen_reg_rtx (vmode);
18608 emit_insn (gen (next, last, fold));
18609 last = next;
18610
18611 fold = gen_reg_rtx (vmode);
18612 x = force_reg (SImode, GEN_INT (8));
18613 emit_insn (gen_vec_shr_v8qi (fold, last, x));
18614 break;
18615
18616 default:
18617 gcc_unreachable ();
18618 }
18619
18620 emit_insn (gen (target, last, fold));
18621 }
18622
18623 /* Expand a vector minimum/maximum. */
18624
18625 void
18626 mips_expand_vec_minmax (rtx target, rtx op0, rtx op1,
18627 rtx (*cmp) (rtx, rtx, rtx), bool min_p)
18628 {
18629 enum machine_mode vmode = GET_MODE (target);
18630 rtx tc, t0, t1, x;
18631
18632 tc = gen_reg_rtx (vmode);
18633 t0 = gen_reg_rtx (vmode);
18634 t1 = gen_reg_rtx (vmode);
18635
18636 /* op0 > op1 */
18637 emit_insn (cmp (tc, op0, op1));
18638
18639 x = gen_rtx_AND (vmode, tc, (min_p ? op1 : op0));
18640 emit_insn (gen_rtx_SET (VOIDmode, t0, x));
18641
18642 x = gen_rtx_NOT (vmode, tc);
18643 x = gen_rtx_AND (vmode, x, (min_p ? op0 : op1));
18644 emit_insn (gen_rtx_SET (VOIDmode, t1, x));
18645
18646 x = gen_rtx_IOR (vmode, t0, t1);
18647 emit_insn (gen_rtx_SET (VOIDmode, target, x));
18648 }
18649
18650 /* Implement TARGET_CASE_VALUES_THRESHOLD. */
18651
18652 unsigned int
18653 mips_case_values_threshold (void)
18654 {
18655 /* In MIPS16 mode using a larger case threshold generates smaller code. */
18656 if (TARGET_MIPS16 && optimize_size)
18657 return 10;
18658 else
18659 return default_case_values_threshold ();
18660 }
18661 \f
18662 /* Initialize the GCC target structure. */
18663 #undef TARGET_ASM_ALIGNED_HI_OP
18664 #define TARGET_ASM_ALIGNED_HI_OP "\t.half\t"
18665 #undef TARGET_ASM_ALIGNED_SI_OP
18666 #define TARGET_ASM_ALIGNED_SI_OP "\t.word\t"
18667 #undef TARGET_ASM_ALIGNED_DI_OP
18668 #define TARGET_ASM_ALIGNED_DI_OP "\t.dword\t"
18669
18670 #undef TARGET_OPTION_OVERRIDE
18671 #define TARGET_OPTION_OVERRIDE mips_option_override
18672
18673 #undef TARGET_LEGITIMIZE_ADDRESS
18674 #define TARGET_LEGITIMIZE_ADDRESS mips_legitimize_address
18675
18676 #undef TARGET_ASM_FUNCTION_PROLOGUE
18677 #define TARGET_ASM_FUNCTION_PROLOGUE mips_output_function_prologue
18678 #undef TARGET_ASM_FUNCTION_EPILOGUE
18679 #define TARGET_ASM_FUNCTION_EPILOGUE mips_output_function_epilogue
18680 #undef TARGET_ASM_SELECT_RTX_SECTION
18681 #define TARGET_ASM_SELECT_RTX_SECTION mips_select_rtx_section
18682 #undef TARGET_ASM_FUNCTION_RODATA_SECTION
18683 #define TARGET_ASM_FUNCTION_RODATA_SECTION mips_function_rodata_section
18684
18685 #undef TARGET_SCHED_INIT
18686 #define TARGET_SCHED_INIT mips_sched_init
18687 #undef TARGET_SCHED_REORDER
18688 #define TARGET_SCHED_REORDER mips_sched_reorder
18689 #undef TARGET_SCHED_REORDER2
18690 #define TARGET_SCHED_REORDER2 mips_sched_reorder2
18691 #undef TARGET_SCHED_VARIABLE_ISSUE
18692 #define TARGET_SCHED_VARIABLE_ISSUE mips_variable_issue
18693 #undef TARGET_SCHED_ADJUST_COST
18694 #define TARGET_SCHED_ADJUST_COST mips_adjust_cost
18695 #undef TARGET_SCHED_ISSUE_RATE
18696 #define TARGET_SCHED_ISSUE_RATE mips_issue_rate
18697 #undef TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN
18698 #define TARGET_SCHED_INIT_DFA_POST_CYCLE_INSN mips_init_dfa_post_cycle_insn
18699 #undef TARGET_SCHED_DFA_POST_ADVANCE_CYCLE
18700 #define TARGET_SCHED_DFA_POST_ADVANCE_CYCLE mips_dfa_post_advance_cycle
18701 #undef TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD
18702 #define TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD \
18703 mips_multipass_dfa_lookahead
18704 #undef TARGET_SMALL_REGISTER_CLASSES_FOR_MODE_P
18705 #define TARGET_SMALL_REGISTER_CLASSES_FOR_MODE_P \
18706 mips_small_register_classes_for_mode_p
18707
18708 #undef TARGET_FUNCTION_OK_FOR_SIBCALL
18709 #define TARGET_FUNCTION_OK_FOR_SIBCALL mips_function_ok_for_sibcall
18710
18711 #undef TARGET_INSERT_ATTRIBUTES
18712 #define TARGET_INSERT_ATTRIBUTES mips_insert_attributes
18713 #undef TARGET_MERGE_DECL_ATTRIBUTES
18714 #define TARGET_MERGE_DECL_ATTRIBUTES mips_merge_decl_attributes
18715 #undef TARGET_CAN_INLINE_P
18716 #define TARGET_CAN_INLINE_P mips_can_inline_p
18717 #undef TARGET_SET_CURRENT_FUNCTION
18718 #define TARGET_SET_CURRENT_FUNCTION mips_set_current_function
18719
18720 #undef TARGET_VALID_POINTER_MODE
18721 #define TARGET_VALID_POINTER_MODE mips_valid_pointer_mode
18722 #undef TARGET_REGISTER_MOVE_COST
18723 #define TARGET_REGISTER_MOVE_COST mips_register_move_cost
18724 #undef TARGET_MEMORY_MOVE_COST
18725 #define TARGET_MEMORY_MOVE_COST mips_memory_move_cost
18726 #undef TARGET_RTX_COSTS
18727 #define TARGET_RTX_COSTS mips_rtx_costs
18728 #undef TARGET_ADDRESS_COST
18729 #define TARGET_ADDRESS_COST mips_address_cost
18730
18731 #undef TARGET_IN_SMALL_DATA_P
18732 #define TARGET_IN_SMALL_DATA_P mips_in_small_data_p
18733
18734 #undef TARGET_MACHINE_DEPENDENT_REORG
18735 #define TARGET_MACHINE_DEPENDENT_REORG mips_reorg
18736
18737 #undef TARGET_PREFERRED_RELOAD_CLASS
18738 #define TARGET_PREFERRED_RELOAD_CLASS mips_preferred_reload_class
18739
18740 #undef TARGET_EXPAND_TO_RTL_HOOK
18741 #define TARGET_EXPAND_TO_RTL_HOOK mips_expand_to_rtl_hook
18742 #undef TARGET_ASM_FILE_START
18743 #define TARGET_ASM_FILE_START mips_file_start
18744 #undef TARGET_ASM_FILE_START_FILE_DIRECTIVE
18745 #define TARGET_ASM_FILE_START_FILE_DIRECTIVE true
18746 #undef TARGET_ASM_CODE_END
18747 #define TARGET_ASM_CODE_END mips_code_end
18748
18749 #undef TARGET_INIT_LIBFUNCS
18750 #define TARGET_INIT_LIBFUNCS mips_init_libfuncs
18751
18752 #undef TARGET_BUILD_BUILTIN_VA_LIST
18753 #define TARGET_BUILD_BUILTIN_VA_LIST mips_build_builtin_va_list
18754 #undef TARGET_EXPAND_BUILTIN_VA_START
18755 #define TARGET_EXPAND_BUILTIN_VA_START mips_va_start
18756 #undef TARGET_GIMPLIFY_VA_ARG_EXPR
18757 #define TARGET_GIMPLIFY_VA_ARG_EXPR mips_gimplify_va_arg_expr
18758
18759 #undef TARGET_PROMOTE_FUNCTION_MODE
18760 #define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
18761 #undef TARGET_PROMOTE_PROTOTYPES
18762 #define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
18763
18764 #undef TARGET_FUNCTION_VALUE
18765 #define TARGET_FUNCTION_VALUE mips_function_value
18766 #undef TARGET_LIBCALL_VALUE
18767 #define TARGET_LIBCALL_VALUE mips_libcall_value
18768 #undef TARGET_FUNCTION_VALUE_REGNO_P
18769 #define TARGET_FUNCTION_VALUE_REGNO_P mips_function_value_regno_p
18770 #undef TARGET_RETURN_IN_MEMORY
18771 #define TARGET_RETURN_IN_MEMORY mips_return_in_memory
18772 #undef TARGET_RETURN_IN_MSB
18773 #define TARGET_RETURN_IN_MSB mips_return_in_msb
18774
18775 #undef TARGET_ASM_OUTPUT_MI_THUNK
18776 #define TARGET_ASM_OUTPUT_MI_THUNK mips_output_mi_thunk
18777 #undef TARGET_ASM_CAN_OUTPUT_MI_THUNK
18778 #define TARGET_ASM_CAN_OUTPUT_MI_THUNK hook_bool_const_tree_hwi_hwi_const_tree_true
18779
18780 #undef TARGET_PRINT_OPERAND
18781 #define TARGET_PRINT_OPERAND mips_print_operand
18782 #undef TARGET_PRINT_OPERAND_ADDRESS
18783 #define TARGET_PRINT_OPERAND_ADDRESS mips_print_operand_address
18784 #undef TARGET_PRINT_OPERAND_PUNCT_VALID_P
18785 #define TARGET_PRINT_OPERAND_PUNCT_VALID_P mips_print_operand_punct_valid_p
18786
18787 #undef TARGET_SETUP_INCOMING_VARARGS
18788 #define TARGET_SETUP_INCOMING_VARARGS mips_setup_incoming_varargs
18789 #undef TARGET_STRICT_ARGUMENT_NAMING
18790 #define TARGET_STRICT_ARGUMENT_NAMING mips_strict_argument_naming
18791 #undef TARGET_MUST_PASS_IN_STACK
18792 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
18793 #undef TARGET_PASS_BY_REFERENCE
18794 #define TARGET_PASS_BY_REFERENCE mips_pass_by_reference
18795 #undef TARGET_CALLEE_COPIES
18796 #define TARGET_CALLEE_COPIES mips_callee_copies
18797 #undef TARGET_ARG_PARTIAL_BYTES
18798 #define TARGET_ARG_PARTIAL_BYTES mips_arg_partial_bytes
18799 #undef TARGET_FUNCTION_ARG
18800 #define TARGET_FUNCTION_ARG mips_function_arg
18801 #undef TARGET_FUNCTION_ARG_ADVANCE
18802 #define TARGET_FUNCTION_ARG_ADVANCE mips_function_arg_advance
18803 #undef TARGET_FUNCTION_ARG_BOUNDARY
18804 #define TARGET_FUNCTION_ARG_BOUNDARY mips_function_arg_boundary
18805
18806 #undef TARGET_MODE_REP_EXTENDED
18807 #define TARGET_MODE_REP_EXTENDED mips_mode_rep_extended
18808
18809 #undef TARGET_VECTOR_MODE_SUPPORTED_P
18810 #define TARGET_VECTOR_MODE_SUPPORTED_P mips_vector_mode_supported_p
18811
18812 #undef TARGET_SCALAR_MODE_SUPPORTED_P
18813 #define TARGET_SCALAR_MODE_SUPPORTED_P mips_scalar_mode_supported_p
18814
18815 #undef TARGET_VECTORIZE_PREFERRED_SIMD_MODE
18816 #define TARGET_VECTORIZE_PREFERRED_SIMD_MODE mips_preferred_simd_mode
18817
18818 #undef TARGET_INIT_BUILTINS
18819 #define TARGET_INIT_BUILTINS mips_init_builtins
18820 #undef TARGET_BUILTIN_DECL
18821 #define TARGET_BUILTIN_DECL mips_builtin_decl
18822 #undef TARGET_EXPAND_BUILTIN
18823 #define TARGET_EXPAND_BUILTIN mips_expand_builtin
18824
18825 #undef TARGET_HAVE_TLS
18826 #define TARGET_HAVE_TLS HAVE_AS_TLS
18827
18828 #undef TARGET_CANNOT_FORCE_CONST_MEM
18829 #define TARGET_CANNOT_FORCE_CONST_MEM mips_cannot_force_const_mem
18830
18831 #undef TARGET_LEGITIMATE_CONSTANT_P
18832 #define TARGET_LEGITIMATE_CONSTANT_P mips_legitimate_constant_p
18833
18834 #undef TARGET_ENCODE_SECTION_INFO
18835 #define TARGET_ENCODE_SECTION_INFO mips_encode_section_info
18836
18837 #undef TARGET_ATTRIBUTE_TABLE
18838 #define TARGET_ATTRIBUTE_TABLE mips_attribute_table
18839 /* All our function attributes are related to how out-of-line copies should
18840 be compiled or called. They don't in themselves prevent inlining. */
18841 #undef TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P
18842 #define TARGET_FUNCTION_ATTRIBUTE_INLINABLE_P hook_bool_const_tree_true
18843
18844 #undef TARGET_EXTRA_LIVE_ON_ENTRY
18845 #define TARGET_EXTRA_LIVE_ON_ENTRY mips_extra_live_on_entry
18846
18847 #undef TARGET_USE_BLOCKS_FOR_CONSTANT_P
18848 #define TARGET_USE_BLOCKS_FOR_CONSTANT_P mips_use_blocks_for_constant_p
18849 #undef TARGET_USE_ANCHORS_FOR_SYMBOL_P
18850 #define TARGET_USE_ANCHORS_FOR_SYMBOL_P mips_use_anchors_for_symbol_p
18851
18852 #undef TARGET_COMP_TYPE_ATTRIBUTES
18853 #define TARGET_COMP_TYPE_ATTRIBUTES mips_comp_type_attributes
18854
18855 #ifdef HAVE_AS_DTPRELWORD
18856 #undef TARGET_ASM_OUTPUT_DWARF_DTPREL
18857 #define TARGET_ASM_OUTPUT_DWARF_DTPREL mips_output_dwarf_dtprel
18858 #endif
18859 #undef TARGET_DWARF_REGISTER_SPAN
18860 #define TARGET_DWARF_REGISTER_SPAN mips_dwarf_register_span
18861
18862 #undef TARGET_ASM_FINAL_POSTSCAN_INSN
18863 #define TARGET_ASM_FINAL_POSTSCAN_INSN mips_final_postscan_insn
18864
18865 #undef TARGET_LEGITIMATE_ADDRESS_P
18866 #define TARGET_LEGITIMATE_ADDRESS_P mips_legitimate_address_p
18867
18868 #undef TARGET_FRAME_POINTER_REQUIRED
18869 #define TARGET_FRAME_POINTER_REQUIRED mips_frame_pointer_required
18870
18871 #undef TARGET_CAN_ELIMINATE
18872 #define TARGET_CAN_ELIMINATE mips_can_eliminate
18873
18874 #undef TARGET_CONDITIONAL_REGISTER_USAGE
18875 #define TARGET_CONDITIONAL_REGISTER_USAGE mips_conditional_register_usage
18876
18877 #undef TARGET_TRAMPOLINE_INIT
18878 #define TARGET_TRAMPOLINE_INIT mips_trampoline_init
18879
18880 #undef TARGET_ASM_OUTPUT_SOURCE_FILENAME
18881 #define TARGET_ASM_OUTPUT_SOURCE_FILENAME mips_output_filename
18882
18883 #undef TARGET_SHIFT_TRUNCATION_MASK
18884 #define TARGET_SHIFT_TRUNCATION_MASK mips_shift_truncation_mask
18885
18886 #undef TARGET_PREPARE_PCH_SAVE
18887 #define TARGET_PREPARE_PCH_SAVE mips_prepare_pch_save
18888
18889 #undef TARGET_VECTORIZE_VEC_PERM_CONST_OK
18890 #define TARGET_VECTORIZE_VEC_PERM_CONST_OK mips_vectorize_vec_perm_const_ok
18891
18892 #undef TARGET_CASE_VALUES_THRESHOLD
18893 #define TARGET_CASE_VALUES_THRESHOLD mips_case_values_threshold
18894
18895 struct gcc_target targetm = TARGET_INITIALIZER;
18896 \f
18897 #include "gt-mips.h"